Spaces:
Paused
Paused
feat(runner.sh): only enable prefix caching and disable log request
Browse files
runner.sh
CHANGED
@@ -53,5 +53,5 @@ python -u /app/openai_compatible_api_server.py \
53 |   --dtype float16 \
54 |   --enforce-eager \
55 |   --gpu-memory-utilization 0.9 \
56 | - --enable-
57 | - --

53 |   --dtype float16 \
54 |   --enforce-eager \
55 |   --gpu-memory-utilization 0.9 \
56 | + --enable-prefix-caching \
57 | + --disable-log-requests