# llama-gpt/api/13B.Dockerfile
#
# 26 lines
# 647 B
# Docker

# Model artifact settings; both can be overridden with --build-arg.
#   MODEL_DOWNLOAD_URL - where the weights are fetched from during the build
#   MODEL_FILE         - file name the weights are stored under in /models
# NOTE(review): the default file name says "llama-2-13b-chat" while the default
# URL points at Nous-Hermes-Llama2 13B (q4_0) weights -- confirm this is intended.
ARG MODEL_DOWNLOAD_URL=https://huggingface.co/TheBloke/Nous-Hermes-Llama2-GGML/resolve/main/nous-hermes-llama2-13b.ggmlv3.q4_0.bin
ARG MODEL_FILE=llama-2-13b-chat.bin
# Base image to build on top of; override with --build-arg IMAGE=<ref>.
# NOTE(review): the default follows the mutable `latest` tag, so rebuilds are
# not reproducible unless a pinned tag or digest is supplied.
ARG IMAGE=ghcr.io/abetlen/llama-cpp-python:latest
FROM $IMAGE
# ARGs declared before FROM are only visible to FROM itself; re-declaring them
# without a value brings the defaults above into this build stage.
ARG MODEL_DOWNLOAD_URL
ARG MODEL_FILE
# Download the model file to /models/${MODEL_FILE} at build time.
# - ca-certificates is listed explicitly because --no-install-recommends would
#   otherwise skip it, and the download is over HTTPS.
# - The apt package lists are removed in the same layer so they do not end up
#   in the image.
# - curl --fail makes an HTTP error (e.g. 404) abort the build instead of
#   silently saving the error page as the model file.
# - Both variables are quoted so characters such as '&', '?' or spaces in an
#   overridden URL or file name are not interpreted by the shell.
RUN apt-get update -y && \
    apt-get install --yes --no-install-recommends \
        ca-certificates \
        curl && \
    rm -rf /var/lib/apt/lists/* && \
    mkdir -p /models && \
    curl --fail -L -o "/models/${MODEL_FILE}" "${MODEL_DOWNLOAD_URL}"
# Declare the container port (EXPOSE is documentation only; it does not publish
# the port). Presumably this is the port the server started by run.sh listens
# on -- confirm against run.sh.
EXPOSE 8000
# Copy the whole build context into /app and make it the working directory.
WORKDIR /app
COPY . /app/
# Start the server through the launch script; run.sh is expected to come from
# the build context copied above.
CMD ["/bin/sh", "/app/run.sh"]