We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7cf54ef, commit 5e00fc7 (Copy full SHA for 5e00fc7)
vllm/model_executor/models/llama.py
@@ -57,7 +57,7 @@ def __init__(
57
hidden_size: int,
58
intermediate_size: int,
59
hidden_act: str,
60
- quant_config: Optional[QKVParallelLinear] = None,
+ quant_config: Optional[QuantizationConfig] = None,
61
bias: bool = False,
62
) -> None:
63
super().__init__()
0 commit comments