# llama-gpt/docker-compose-13b.yml
# (file-viewer listing: 27 lines, 684 B, YAML)

# Compose stack for the 13B model variant: one API container built locally
# from ./api, plus the prebuilt web UI that talks to it.
version: '3.6'

services:
  # Model API service, built from ./api using 13B.Dockerfile.
  llama-gpt-api-13b:
    # Prebuilt alternative to the local build below (left disabled):
    # image: 'ghcr.io/getumbrel/llama-gpt-api-llama-2-13b-chat:latest'
    build:
      context: ./api
      dockerfile: 13B.Dockerfile
    restart: on-failure
    environment:
      # Path of the model file inside the container.
      MODEL: '/models/llama-2-13b-chat.bin'
      # Quoted so the value is passed as the string "1" rather than a YAML int.
      # NOTE(review): presumably asks the server to mlock the model in RAM,
      # which is why IPC_LOCK is granted below -- confirm against the API image.
      USE_MLOCK: '1'
    cap_add:
      # Linux capability that permits locking memory (mlock).
      - IPC_LOCK

  # Web front end; published on host port 3000.
  llama-gpt-ui:
    image: 'ghcr.io/getumbrel/llama-gpt-ui:latest'
    ports:
      # Quoted: digit-and-colon scalars can be mis-typed by YAML 1.1 parsers.
      - '3000:3000'
    restart: on-failure
    environment:
      # Placeholder key value; the UI is pointed at the local API service below.
      - 'OPENAI_API_KEY=sk-XXXXXXXXXXXXXXXXXXXX'
      - 'OPENAI_API_HOST=http://llama-gpt-api-13b:8000'
      # Same path as MODEL on the API service.
      - 'DEFAULT_MODEL=/models/llama-2-13b-chat.bin'
      # NOTE(review): presumably makes the UI wait (up to WAIT_TIMEOUT seconds)
      # for the API port before starting -- confirm against the UI image.
      - 'WAIT_HOSTS=llama-gpt-api-13b:8000'
      - 'WAIT_TIMEOUT=600'