Spaces:

Alovestocode
/

ZeroGPU-LLM-Inference

Sleeping

Alikestocode committed on Nov 10, 2025

Commit

f0033ab

1 Parent(s): 2326498

Fix AWQModifier import path: use modifiers.awq instead of modifiers.quantization

- Correct import: from llmcompressor.modifiers.awq import AWQModifier
- Wrong import: from llmcompressor.modifiers.quantization import AWQModifier
- Updated all files with correct import path
- Added upgrade suggestion in error message

Files changed (4) hide show

LLM_COMPRESSOR_FEATURES.md +2 -2
QUANTIZE_AWQ.md +1 -1
app.py +3 -2
quantize_to_awq_colab.ipynb +4 -1

LLM_COMPRESSOR_FEATURES.md CHANGED Viewed

@@ -10,7 +10,7 @@ LLM Compressor supports multiple quantization methods beyond AWQ:
 #### AWQModifier (Activation-aware Weight Quantization)
 ```python
-from llmcompressor.modifiers.quantization import AWQModifier
 AWQModifier(
     w_bit=4,              # Weight bits (4 or 8)
@@ -60,7 +60,7 @@ You can combine multiple modifiers for maximum compression:
 ```python
 from llmcompressor import oneshot
-from llmcompressor.modifiers.quantization import AWQModifier
 from llmcompressor.modifiers.pruning import MagnitudePruningModifier
 oneshot(

 #### AWQModifier (Activation-aware Weight Quantization)
 ```python
+from llmcompressor.modifiers.awq import AWQModifier
 AWQModifier(
     w_bit=4,              # Weight bits (4 or 8)
 ```python
 from llmcompressor import oneshot
+from llmcompressor.modifiers.awq import AWQModifier
 from llmcompressor.modifiers.pruning import MagnitudePruningModifier
 oneshot(

QUANTIZE_AWQ.md CHANGED Viewed

@@ -73,7 +73,7 @@ If you prefer using llm-compressor (vLLM's quantization tool):
 ```python
 from llmcompressor import oneshot
-from llmcompressor.modifiers.quantization import AWQModifier
 # Quantize model
 oneshot(

 ```python
 from llmcompressor import oneshot
+from llmcompressor.modifiers.awq import AWQModifier
 # Quantize model
 oneshot(

app.py CHANGED Viewed

@@ -43,7 +43,8 @@ try:
     # Try both package names (llm-compressor and llmcompressor)
     try:
         from llmcompressor import oneshot
-        from llmcompressor.modifiers.quantization import AWQModifier
     except ImportError:
         # Try alternative package name
         import sys
@@ -55,7 +56,7 @@ try:
             if spec is None:
                 raise ImportError("llm-compressor not found")
             from llm_compressor import oneshot
-            from llm_compressor.modifiers.quantization import AWQModifier
         except ImportError:
             raise ImportError("Neither llmcompressor nor llm-compressor found")
     LLM_COMPRESSOR_AVAILABLE = True

     # Try both package names (llm-compressor and llmcompressor)
     try:
         from llmcompressor import oneshot
+        # Correct import path: AWQModifier is in modifiers.awq, not modifiers.quantization
+        from llmcompressor.modifiers.awq import AWQModifier
     except ImportError:
         # Try alternative package name
         import sys
             if spec is None:
                 raise ImportError("llm-compressor not found")
             from llm_compressor import oneshot
+            from llm_compressor.modifiers.awq import AWQModifier
         except ImportError:
             raise ImportError("Neither llmcompressor nor llm-compressor found")
     LLM_COMPRESSOR_AVAILABLE = True

quantize_to_awq_colab.ipynb CHANGED Viewed

@@ -148,7 +148,8 @@
         "# Import with error handling in case installation failed\n",
         "try:\n",
         "    from llmcompressor import oneshot\n",
-        "    from llmcompressor.modifiers.quantization import AWQModifier\n",
         "    LLM_COMPRESSOR_AVAILABLE = True\n",
         "    print(\"✅ LLM Compressor imported successfully\")\n",
         "except ImportError as e:\n",
@@ -157,6 +158,8 @@
         "    print(\"  %pip install llmcompressor\")\n",
         "    print(\"  OR\")\n",
         "    print(\"  %pip install git+https://github.com/vllm-project/llm-compressor.git\")\n",
         "    LLM_COMPRESSOR_AVAILABLE = False\n",
         "    raise\n",
         "\n",

         "# Import with error handling in case installation failed\n",
         "try:\n",
         "    from llmcompressor import oneshot\n",
+        "    # Correct import path: AWQModifier is in modifiers.awq, not modifiers.quantization\n",
+        "    from llmcompressor.modifiers.awq import AWQModifier\n",
         "    LLM_COMPRESSOR_AVAILABLE = True\n",
         "    print(\"✅ LLM Compressor imported successfully\")\n",
         "except ImportError as e:\n",
         "    print(\"  %pip install llmcompressor\")\n",
         "    print(\"  OR\")\n",
         "    print(\"  %pip install git+https://github.com/vllm-project/llm-compressor.git\")\n",
+        "    print(\"\\nNote: If import still fails, try:\")\n",
+        "    print(\"  %pip install --upgrade llmcompressor\")\n",
         "    LLM_COMPRESSOR_AVAILABLE = False\n",
         "    raise\n",
         "\n",