yzhuang committed on
Commit
4891247
·
1 Parent(s): 314161f

update mem

Browse files
Files changed (1) hide show
  1. server.py +3 -1
server.py CHANGED
@@ -21,8 +21,10 @@ def launch_vllm_server(beta=1.0):
21
  "Qwen/Qwen3-4B",
22
  "--tensor-parallel-size", "1",
23
  "--enforce-eager",
 
24
  "--max-seq-len-to-capture", "2048",
25
- "--max-num-seqs", "1"
 
26
  ]
27
  subprocess.run(cmd, env=env)
28
 
 
21
  "Qwen/Qwen3-4B",
22
  "--tensor-parallel-size", "1",
23
  "--enforce-eager",
24
+ "--max-model-len", "2048",
25
  "--max-seq-len-to-capture", "2048",
26
+ "--max-num-seqs", "1",
27
+ "--port", "8000"
28
  ]
29
  subprocess.run(cmd, env=env)
30