Files changed (1) hide show
  1. README.md +2 -1
README.md CHANGED
@@ -92,8 +92,9 @@ python -m sglang.launch_server \
92
  --pp-size 1 \
93
  --dp-size 1 \
94
  --trust-remote-code \
 
95
  --tool-call-parser qwen25 \
96
- --json-model-override-args '{"linear_backend": "seg_la", "torch_dtype": "bfloat16", "architectures": ["BailingMoeV2_5ForCausalLM"], "model_type": "bailing_hybrid", "rope_scaling": {"rope_type": "yarn", "factor": 2.0, "rope_theta": 6000000, "partial_rotary_factor": 0.5, "original_max_position_embeddings": 131072}}' \
97
  --dist-init-addr $MASTER_IP:2345 \
98
  --port $PORT \
99
  --nnodes 1
 
92
  --pp-size 1 \
93
  --dp-size 1 \
94
  --trust-remote-code \
95
+ --context-length 262144 \
96
  --tool-call-parser qwen25 \
97
+ --json-model-override-args '{"rope_scaling": {"rope_type": "yarn", "factor": 2.0, "rope_theta": 6000000, "partial_rotary_factor": 0.5, "original_max_position_embeddings": 131072}}' \
98
  --dist-init-addr $MASTER_IP:2345 \
99
  --port $PORT \
100
  --nnodes 1