change to sglang
This commit is contained in:
@@ -7,10 +7,8 @@ MODEL="/home/kongcunliang/workspace/pretrained-models/unsloth/NVIDIA-Nemotron-3-
|
||||
llama-server \
|
||||
--model $MODEL \
|
||||
--alias "nemotron-3-super" \
|
||||
--prio 1 \
|
||||
--min_p 0.01 \
|
||||
--temp 0.6 \
|
||||
--top-p 0.95 \
|
||||
--ctx-size 1048576 \
|
||||
--ctx-size 262144 \
|
||||
--host 0.0.0.0 \
|
||||
--port 8001
|
||||
--port 8001 \
|
||||
|
||||
Reference in New Issue
Block a user