We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1542fbb commit 5310d13 (Copy full SHA for 5310d13)
helm/vllm/values.yaml
@@ -16,7 +16,7 @@ vllm:
16
- /bin/sh
17
- -c
18
args:
19
- - "vllm serve openai/gpt-oss-20b --trust-remote-code --enable-chunked-prefill --enable-auto-tool-choice --tool-call-parser openai --reasoning-parser openai_gptoss"
+ - "vllm serve openai/gpt-oss-20b --trust-remote-code --enable-chunked-prefill --enable-auto-tool-choice --tool-call-parser openai --reasoning-parser openai_gptoss --max_tokens 10000"
20
gpu:
21
enabled: true
22
type: "nvidia"
0 commit comments