Fix quality check failures and update dependency version suggestions

chichun-charlie-liu · chichun-charlie-liu · commit d3f4127f834b · 2025-09-15T11:33:01.000-04:00
Signed-off-by: cliu-us <cliu@us.ibm.com>
diff --git a/examples/quantization_w8a8_fp8/README_granite4.md b/examples/quantization_w8a8_fp8/README_granite4.md
@@ -24,7 +24,7 @@ pip install llmcompressor
 ```
 
 This checkpoint format will need the latest vllm (ver >= 0.10.1.1) to run correctly. Additional dependencies and environment variables needed are:
-1. Dependencies:  `vllm=0.10.1.1, lm_eval=0.4.9.1, flash-attn=2.7.3, torch=2.7.1`
+1. Dependencies:  `vllm>=0.10.1.1, lm_eval>=0.4.9.1, flash-attn=2.7.3, torch>=2.7.1`
 2. ENV VAR:  `VLLM_USE_V1=0, VLLM_WORKER_MULTIPROC_METHOD=spawn`
 
 ## Quickstart
diff --git a/src/llmcompressor/modeling/granite4.py b/src/llmcompressor/modeling/granite4.py
@@ -1,6 +1,4 @@
 import torch
-from compressed_tensors.quantization import QuantizationStatus
-from compressed_tensors.utils import register_offload_parameter
 from transformers.models.granitemoehybrid.modeling_granitemoehybrid import (
     GraniteMoeHybridParallelExperts,
 )

Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,4 @@`
`1`	`1`	`import torch`
`2`		`-from compressed_tensors.quantization import QuantizationStatus`
`3`		`-from compressed_tensors.utils import register_offload_parameter`
`4`	`2`	`from transformers.models.granitemoehybrid.modeling_granitemoehybrid import (`
`5`	`3`	`GraniteMoeHybridParallelExperts,`
`6`	`4`	`)`