Spaces:
Sleeping
Sleeping
Commit
·
27234fe
1
Parent(s):
d02a9d8
Update Qwen model repo to AWQ quantized version
Browse files
app.py
CHANGED
@@ -105,7 +105,7 @@ ROUTER_SYSTEM_PROMPT = """You are the Router Agent coordinating Math, Code, and
 
 MODELS = {
     "Router-Qwen3-32B-AWQ": {
-        "repo_id": "Alovestocode/router-qwen3-32b-merged",
+        "repo_id": "Alovestocode/router-qwen3-32b-merged-awq", # AWQ quantized model
         "description": "Router checkpoint on Qwen3 32B merged, optimized with AWQ quantization via vLLM.",
         "params_b": 32.0,
         "quantization": "awq", # vLLM will auto-detect AWQ