yusufs committed on
Commit
0f3cd25
·
1 Parent(s): 0345d26

feat(sailorchat): using sailor chat model

Browse files
Files changed (2) hide show
  1. Dockerfile +1 -1
  2. run-sailor.sh +1 -1
Dockerfile CHANGED
@@ -32,4 +32,4 @@ EXPOSE 7860
32
  RUN chmod +x /app/run-llama.sh
33
  RUN chmod +x /app/run-sailor.sh
34
 
35
- CMD ["/app/run-llama.sh"]
 
32
  RUN chmod +x /app/run-llama.sh
33
  RUN chmod +x /app/run-sailor.sh
34
 
35
+ CMD ["/app/run-sailor.sh"]
run-sailor.sh CHANGED
@@ -27,4 +27,4 @@ python -u /app/openai_compatible_api_server.py \
27
  --max-model-len 32768 \
28
  --dtype float16 \
29
  --enforce-eager \
30
- --gpu-memory-utilization 0.9
 
27
  --max-model-len 32768 \
28
  --dtype float16 \
29
  --enforce-eager \
30
+ --gpu-memory-utilization 0.85