diff --git a/src/fastserve/models/vllm.py b/src/fastserve/models/vllm.py index db89fe0..12217d0 100644 --- a/src/fastserve/models/vllm.py +++ b/src/fastserve/models/vllm.py @@ -29,14 +29,11 @@ def __init__( model, batch_size=1, timeout=0.0, - *args, **kwargs, ): from vllm import LLM - self.llm = LLM(model) - self.args = args - self.kwargs = kwargs + self.llm = LLM(model, **kwargs) super().__init__( batch_size, timeout,