Alikestocode committed on
Commit
27234fe
·
1 Parent(s): d02a9d8

Update Qwen model repo to AWQ quantized version

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -105,7 +105,7 @@ ROUTER_SYSTEM_PROMPT = """You are the Router Agent coordinating Math, Code, and
105
 
106
  MODELS = {
107
  "Router-Qwen3-32B-AWQ": {
108
- "repo_id": "Alovestocode/router-qwen3-32b-merged",
109
  "description": "Router checkpoint on Qwen3 32B merged, optimized with AWQ quantization via vLLM.",
110
  "params_b": 32.0,
111
  "quantization": "awq", # vLLM will auto-detect AWQ
 
105
 
106
  MODELS = {
107
  "Router-Qwen3-32B-AWQ": {
108
+ "repo_id": "Alovestocode/router-qwen3-32b-merged-awq", # AWQ quantized model
109
  "description": "Router checkpoint on Qwen3 32B merged, optimized with AWQ quantization via vLLM.",
110
  "params_b": 32.0,
111
  "quantization": "awq", # vLLM will auto-detect AWQ