yusufs committed on
Commit
c0cde8e
·
1 Parent(s): 8c5a84b

feat(runner.sh): enable only prefix caching (drop chunked prefill) and disable request logging

Browse files
Files changed (1) hide show
  1. runner.sh +2 -2
runner.sh CHANGED
@@ -53,5 +53,5 @@ python -u /app/openai_compatible_api_server.py \
53
  --dtype float16 \
54
  --enforce-eager \
55
  --gpu-memory-utilization 0.9 \
56
- --enable-chunked-prefill \
57
- --enable-prefix-caching
 
53
  --dtype float16 \
54
  --enforce-eager \
55
  --gpu-memory-utilization 0.9 \
56
+ --enable-prefix-caching \
57
+ --disable-log-requests