Moses25 committed on
Commit
3ea2a7d
1 Parent(s): 2f1aee7

Create run.sh

Browse files
Files changed (1) hide show
  1. run.sh +8 -0
run.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
#!/bin/bash
#
# run.sh - fetch the Mistral-7B-Instruct-32K-AWQ checkpoint and serve it with
# vLLM's OpenAI-compatible API server on 0.0.0.0:7777 under the model name
# "dewu-chat".
#
# Usage: ./run.sh
#   Run from the directory that should contain the model checkout. The chat
#   template path below is relative to that same working directory.

# Abort on the first failing command or unset variable, so the server is
# never started against a checkout that failed to download.
set -euo pipefail

readonly MODEL_REPO="https://huggingface.co/Moses25/Mistral-7B-Instruct-32K-AWQ"
# Directory name git derives from the URL (its last path component).
readonly MODEL_DIR="${MODEL_REPO##*/}"

# `git clone` refuses to write into an existing non-empty directory, so only
# clone when the checkout is missing; this keeps re-runs working.
# NOTE(review): Hugging Face stores large weight files via git-lfs; presumably
# git-lfs must be installed for the clone to fetch real weights - confirm.
if [[ ! -d "${MODEL_DIR}" ]]; then
  git clone "${MODEL_REPO}" "${MODEL_DIR}"
fi

# Server flags, kept in an array so each group can be documented and is passed
# to python exactly as written (no word-splitting surprises).
server_args=(
  # Serve the local checkout rather than a hub model id.
  --model="${MODEL_DIR}"
  --trust-remote-code
  # Listen on all interfaces, port 7777.
  --host 0.0.0.0 --port 7777
  --gpu-memory-utilization 0.8
  --enforce-eager
  # NOTE(review): the template file is resolved relative to the current
  # working directory - confirm it is present there.
  --max-model-len 8192 --chat-template llama2-chat-template.jinja
  # Single GPU; clients address the model as "dewu-chat".
  --tensor-parallel-size 1 --served-model-name dewu-chat
)

python -m vllm.entrypoints.openai.api_server "${server_args[@]}"