Sumkh committed on
Commit
5695d95
·
verified ·
1 Parent(s): 19ad6b0

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +1 -5
start.sh CHANGED
@@ -11,11 +11,7 @@ export USER_AGENT="vllm_huggingface_space"
11
  vllm serve unsloth/llama-3-70b-Instruct-bnb-4bit \
12
  --enable-auto-tool-choice \
13
  --tool-call-parser llama3_json \
14
- --chat-template examples/tool_chat_template_llama3.1_json.jinja \
15
- --quantization bitsandbytes \
16
- --load-format bitsandbytes \
17
- --gpu_memory_utilization 0.9 \
18
- --enforce-eager &
19
 
20
  # Wait to ensure the vLLM server is fully started (adjust if needed)
21
  sleep 10
 
11
  vllm serve unsloth/llama-3-70b-Instruct-bnb-4bit \
12
  --enable-auto-tool-choice \
13
  --tool-call-parser llama3_json \
14
+ --chat-template examples/tool_chat_template_llama3.1_json.jinja &
 
 
 
 
15
 
16
  # Wait to ensure the vLLM server is fully started (adjust if needed)
17
  sleep 10