Spaces:
Sleeping
Sleeping
Damien Benveniste
committed on
Commit
·
a8f0134
1
Parent(s):
596dacb
modified
Browse files
- Dockerfile +1 -1
- entrypoint.sh +2 -5
Dockerfile
CHANGED
@@ -10,7 +10,7 @@ ENV OUTLINES_CACHE_DIR="/tmp/outlines_cache"
|
|
10 |
ENV XDG_CONFIG_HOME="/.config"
|
11 |
ENV VLLM_USE_MODELSCOPE="false"
|
12 |
ENV VLLM_DISABLE_USAGE_STATS="true"
|
13 |
-
ENV VLLM_API_BASE_PATH="/v1"
|
14 |
|
15 |
# Ensure PATH includes common Python locations
|
16 |
ENV PATH="/usr/local/bin:/usr/bin:/bin:/usr/local/sbin:/usr/sbin:/sbin:$PATH"
|
|
|
10 |
ENV XDG_CONFIG_HOME="/.config"
|
11 |
ENV VLLM_USE_MODELSCOPE="false"
|
12 |
ENV VLLM_DISABLE_USAGE_STATS="true"
|
13 |
+
# ENV VLLM_API_BASE_PATH="/v1"
|
14 |
|
15 |
# Ensure PATH includes common Python locations
|
16 |
ENV PATH="/usr/local/bin:/usr/bin:/bin:/usr/local/sbin:/usr/sbin:/sbin:$PATH"
|
entrypoint.sh
CHANGED
@@ -1,7 +1,8 @@
|
|
1 |
#!/bin/bash
|
2 |
|
3 |
# Default values
|
4 |
-
MODEL=${MODEL:-"microsoft/Phi-3-mini-4k-instruct"}
|
|
|
5 |
DTYPE=${DTYPE:-"half"}
|
6 |
MAX_NUM_BATCHED_TOKENS=${MAX_NUM_BATCHED_TOKENS:-512}
|
7 |
MAX_NUM_SEQS=${MAX_NUM_SEQS:-16}
|
@@ -41,10 +42,6 @@ if [ "$ENFORCE_EAGER" = "true" ]; then
|
|
41 |
CMD="$CMD --enforce-eager"
|
42 |
fi
|
43 |
|
44 |
-
# Add base path if set
|
45 |
-
if [ -n "$VLLM_API_BASE_PATH" ]; then
|
46 |
-
CMD="$CMD --api-base-path $VLLM_API_BASE_PATH"
|
47 |
-
fi
|
48 |
|
49 |
# Execute the command
|
50 |
echo "Running command: $CMD"
|
|
|
1 |
#!/bin/bash
|
2 |
|
3 |
# Default values
|
4 |
+
# MODEL=${MODEL:-"microsoft/Phi-3-mini-4k-instruct"}
|
5 |
+
MODEL=${MODEL:-"EleutherAI/pythia-70m"}
|
6 |
DTYPE=${DTYPE:-"half"}
|
7 |
MAX_NUM_BATCHED_TOKENS=${MAX_NUM_BATCHED_TOKENS:-512}
|
8 |
MAX_NUM_SEQS=${MAX_NUM_SEQS:-16}
|
|
|
42 |
CMD="$CMD --enforce-eager"
|
43 |
fi
|
44 |
|
|
|
|
|
|
|
|
|
45 |
|
46 |
# Execute the command
|
47 |
echo "Running command: $CMD"
|