diff --git a/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py b/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py
index 7f4dad70287b..3f1b4d883b79 100644
--- a/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py
+++ b/vllm/model_executor/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py
@@ -79,8 +79,8 @@ def __init__(
 
     @classmethod
     def get_min_capability(cls) -> int:
-        # ampere and up
-        return 80
+        # Turing and up
+        return 75
 
     def create_weights(
         self,