Sumkh committed on
Commit
004f73b
·
verified ·
1 Parent(s): 6201226

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +5 -2
start.sh CHANGED
@@ -12,10 +12,13 @@ vllm serve unsloth/llama-3-8b-Instruct-bnb-4bit \
12
  --enable-auto-tool-choice \
13
  --tool-call-parser llama3_json \
14
  --chat-template examples/tool_chat_template_llama3.1_json.jinja \
15
- --dtype half &
 
 
 
16
 
17
  # Wait to ensure the vLLM server is fully started (adjust if needed)
18
  sleep 10
19
 
20
  # Start the Gradio application using python3
21
- python3 app.py
 
12
  --enable-auto-tool-choice \
13
  --tool-call-parser llama3_json \
14
  --chat-template examples/tool_chat_template_llama3.1_json.jinja \
15
+ --quantization bitsandbytes \
16
+ --load-format bitsandbytes \
17
+ --dtype half \
18
+ --enforce-eager &
19
 
20
  # Wait to ensure the vLLM server is fully started (adjust if needed)
21
  sleep 10
22
 
23
  # Start the Gradio application using python3
24
+ python3 app.py