# vllm-inference / Dockerfile
FROM python:3.12
# Declare build-time variables with the ARG instruction (unlike ENV, they are not persisted in the final image)
ARG HF_TOKEN
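# The token can be supplied at build time (usage sketch):
#   docker build --build-arg HF_TOKEN=<your token> -t vllm-inference .
# ARG values are visible to RUN steps in this stage, so download_model.py
# below can read HF_TOKEN from the environment during the build.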
RUN useradd -m -u 1000 user
USER user
ENV PATH="/home/user/.local/bin:$PATH"
WORKDIR /app
COPY --chown=user ./requirements.txt requirements.txt
RUN pip install --no-cache-dir -r requirements.txt --extra-index-url https://download.pytorch.org/whl/cu113
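# Note: the cu113 extra index serves CUDA 11.3 wheels; if no cp312 builds
# exist there, pip silently falls back to the default PyPI wheels. The tag
# should match the CUDA runtime of the target GPU host.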
COPY --chown=user . /app
# Download the model at build time, so that after a restart the container
# only waits for the docker pull, not for the download from HF.
RUN python /app/download_model.py
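# download_model.py is not shown in this file; a minimal, hypothetical sketch
# of what it likely does, assuming huggingface_hub comes in via
# requirements.txt and the model repo id is hard-coded in the script:
#   import os
#   from huggingface_hub import snapshot_download
#   snapshot_download(repo_id="<model repo id>", token=os.environ.get("HF_TOKEN"))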
EXPOSE 7860
#CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]
RUN chmod +x /app/run.sh
CMD ["/app/run.sh"]