Spaces:
Sleeping
Sleeping
update mem
Browse files
server.py
CHANGED
@@ -21,8 +21,10 @@ def launch_vllm_server(beta=1.0):
  "Qwen/Qwen3-4B",
  "--tensor-parallel-size", "1",
  "--enforce-eager",
+ "--max-model-len", "2048",
  "--max-seq-len-to-capture", "2048",
- "--max-num-seqs", "1"
+ "--max-num-seqs", "1",
+ "--port", "8000"
  ]
  subprocess.run(cmd, env=env)
 