From 75b9c50e7bd62a2a6a4bf80ec1023ce2e7cdff43 Mon Sep 17 00:00:00 2001
From: kyy
Date: Tue, 14 Jan 2025 14:33:35 +0900
Subject: [PATCH] Initial commit

---
 docker-compose.yml | 87 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 87 insertions(+)
 create mode 100644 docker-compose.yml

diff --git a/docker-compose.yml b/docker-compose.yml
new file mode 100644
index 0000000..4371ae5
--- /dev/null
+++ b/docker-compose.yml
@@ -0,0 +1,87 @@
+# Compose stack: a uvicorn API container, a Redis container and two worker
+# containers, all attached to the llm-network bridge network.
+version: "3.8"
+
+services:
+  # API service: serves main:app with uvicorn on port 8000.
+  llm-asyncio:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    # NOTE(review): 1000gb of shared memory looks like an "effectively
+    # unlimited" placeholder - confirm the intended size.
+    shm_size: "1000gb"
+    volumes:
+      - ./workspace:/opt/workspace/
+      - ./cache:/root/.cache/
+      - ../model:/opt/model/
+    environment:
+      PYTORCH_CUDA_ALLOC_CONF: "expandable_segments:True"
+      PYTHONPATH: /opt/workspace/
+    deploy:
+      resources:
+        reservations:
+          devices:
+            # Reserve every NVIDIA GPU on the host for this container.
+            - driver: nvidia
+              count: "all"
+              capabilities: [gpu]
+    container_name: llm-asyncio
+    ports:
+      - "8000:8000"
+    networks:
+      - llm-network
+    # --reload makes uvicorn restart when source files change.
+    entrypoint: >
+      /bin/bash -c "
+      uvicorn main:app --reload --host 0.0.0.0 --port 8000
+      "
+    tty: true
+
+  redis:
+    # NOTE(review): "latest" is a floating tag; consider pinning a version.
+    image: redis:latest
+    container_name: redis-server
+    ports:
+      # Host port 6380 -> container port 6379, the port redis-server
+      # listens on by default (nothing in this file reconfigures it).
+      - "6380:6379"
+    restart: always
+    networks:
+      - llm-network
+
+  # Background workers: same build, mounts, environment and GPU reservation
+  # as llm-asyncio, but running worker.py; two containers are started.
+  worker:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    shm_size: "1000gb"
+    volumes:
+      - ./workspace:/opt/workspace/
+      - ./cache:/root/.cache/
+      - ../model:/opt/model/
+    environment:
+      PYTORCH_CUDA_ALLOC_CONF: "expandable_segments:True"
+      PYTHONPATH: /opt/workspace/
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: "all"
+              capabilities: [gpu]
+    networks:
+      - llm-network
+    entrypoint: >
+      /bin/bash -c "
+      python /opt/workspace/worker.py
+      "
+    restart: always
+    tty: true
+    # No container_name here: a fixed name would clash across replicas.
+    scale: 2
+
+networks:
+  llm-network:
+    driver: bridge