We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
max_seq_len_to_capture
1 parent 7a89ffb, commit fa9c197 (Copy full SHA for fa9c197)
vllm/engine/arg_utils.py
@@ -341,9 +341,9 @@ def add_cli_args(
341
help='Maximum context length covered by CUDA '
342
'graphs. When a sequence has context length '
343
'larger than this, we fall back to eager mode. '
344
- '(DEPRECATED. Use --max-seq_len-to-capture instead'
+ '(DEPRECATED. Use --max-seq-len-to-capture instead'
345
')')
346
- parser.add_argument('--max-seq_len-to-capture',
+ parser.add_argument('--max-seq-len-to-capture',
347
type=int,
348
default=EngineArgs.max_seq_len_to_capture,
349
help='Maximum sequence length covered by CUDA '
0 commit comments