Spaces:
Running
on
Zero
Running
on
Zero
Use the FP8 versions of Qwen3-30B-A3B and Qwen3-32B
Browse files
app.py
CHANGED
@@ -24,8 +24,8 @@ cancel_event = threading.Event()
|
|
24 |
# Torch-Compatible Model Definitions with Adjusted Descriptions
|
25 |
# ------------------------------
|
26 |
MODELS = {
|
27 |
-
"
|
28 |
-
"Qwen/Qwen3-32B-
|
29 |
"DeepSeek-R1-0528-Qwen3-8B": {"repo_id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "description": "DeepSeek-R1-0528-Qwen3-8B"},
|
30 |
"Nemotron-Research-Reasoning-Qwen-1.5B": {"repo_id": "nvidia/Nemotron-Research-Reasoning-Qwen-1.5B", "description": "Nemotron-Research-Reasoning-Qwen-1.5B"},
|
31 |
"Qwen2.5-Taiwan-1.5B-Instruct": {"repo_id": "benchang1110/Qwen2.5-Taiwan-1.5B-Instruct", "description": "Qwen2.5-Taiwan-1.5B-Instruct"},
|
|
|
24 |
# Torch-Compatible Model Definitions with Adjusted Descriptions
|
25 |
# ------------------------------
|
26 |
MODELS = {
|
27 |
+
"Qwen/Qwen3-30B-A3B-FP8": {"repo_id": "Qwen/Qwen3-30B-A3B-FP8", "description": "Qwen/Qwen3-30B-A3B-FP8"},
|
28 |
+
"Qwen/Qwen3-32B-FP8": {"repo_id": "Qwen/Qwen3-32B-FP8", "description": "Qwen/Qwen3-32B-FP8"},
|
29 |
"DeepSeek-R1-0528-Qwen3-8B": {"repo_id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "description": "DeepSeek-R1-0528-Qwen3-8B"},
|
30 |
"Nemotron-Research-Reasoning-Qwen-1.5B": {"repo_id": "nvidia/Nemotron-Research-Reasoning-Qwen-1.5B", "description": "Nemotron-Research-Reasoning-Qwen-1.5B"},
|
31 |
"Qwen2.5-Taiwan-1.5B-Instruct": {"repo_id": "benchang1110/Qwen2.5-Taiwan-1.5B-Instruct", "description": "Qwen2.5-Taiwan-1.5B-Instruct"},
|