Merge pull request vllm-project#9 from ri938/organise

Don't error if the user doesn't have the kernels installed
v1nc3nt27 · Aug 24, 2023 · 010b5bc · 010b5bc
2 parents 2617c55 + 5fcc1c4
commit 010b5bc
Showing 1 changed file with 8 additions and 4 deletions.
diff --git a/vllm/model_executor/layers/quant.py b/vllm/model_executor/layers/quant.py
@@ -5,11 +5,10 @@
 
 
 try:
-    import awq_inference_engine  # with CUDA kernels
+    import awq_inference_engine
+    KERNELS_INSTALLED = True
 except ImportError as ex:
-    raise ImportError(
-        "Unable to import awq_inference_engine: run setup.py"
-        " to install AWQ CUDA kernels")
+    KERNELS_INSTALLED = False
 
 
 class ScaledActivation(nn.Module):
@@ -34,6 +33,11 @@ def __init__(
         ):
         super().__init__()
 
+        if not KERNELS_INSTALLED:
+            raise ImportError(
+                "Unable to import awq_ext: run setup.py"
+                " to install AWQ CUDA kernels")
+
         if w_bit not in [4]:
             raise NotImplementedError("Only 4-bit are supported for now.")