Spaces:
Sleeping
Sleeping
Update server.py
Browse files
server.py
CHANGED
|
@@ -20,8 +20,8 @@ def launch_vllm_server(beta=1.0):
|
|
| 20 |
"Qwen/Qwen3-4B",
|
| 21 |
"--tensor-parallel-size", "1",
|
| 22 |
"--enforce-eager",
|
| 23 |
-
"--max-model-len", "
|
| 24 |
-
"--max-seq-len-to-capture", "
|
| 25 |
"--max-num-seqs", "36",
|
| 26 |
"--host", "0.0.0.0",
|
| 27 |
"--port", "8000",
|
|
|
|
| 20 |
"Qwen/Qwen3-4B",
|
| 21 |
"--tensor-parallel-size", "1",
|
| 22 |
"--enforce-eager",
|
| 23 |
+
"--max-model-len", "4096",
|
| 24 |
+
"--max-seq-len-to-capture", "4096",
|
| 25 |
"--max-num-seqs", "36",
|
| 26 |
"--host", "0.0.0.0",
|
| 27 |
"--port", "8000",
|