File size: 600 Bytes
3f7cfab |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 |
# Docker Compose stack that builds and runs the h2o-llm service with
# NVIDIA GPU devices reserved for the container.
version: '3'

services:
  h2o-llm:
    # Build the image from the Dockerfile in this directory.
    build:
      context: ./
      dockerfile: Dockerfile
      args:
        BUILDKIT_INLINE_CACHE: "0"
    image: h2o-llm
    shm_size: '64gb'
    command: generate.py --load_8bit True --base_model 'EleutherAI/gpt-j-6B'
    restart: unless-stopped
    volumes:
      # Location where downloaded weights will be stored
      - h2o-llm:/root/.cache
    ports:
      # Quoted so the HOST:CONTAINER mapping is always read as a string.
      - '7860:7860'
    deploy:
      resources:
        reservations:
          # Request all devices exposed by the nvidia driver with the
          # gpu capability.
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]

# Named volume mounted at /root/.cache by the h2o-llm service.
volumes:
  h2o-llm:
    name: h2o-llm
|