# Spaces: Runtime error
# Docker Compose stack with three services that all use the same
# `fastchat:latest` image, built from ./Dockerfile:
#   - fastchat-controller    (port 21001, published to the host)
#   - fastchat-model-worker  (port 21002, not published to the host)
#   - fastchat-api-server    (port 8000, published to the host)
version: "3.9"

services:
  # Runs the `fastchat.serve.controller` module, bound to all interfaces.
  fastchat-controller:
    build:
      context: .
      dockerfile: Dockerfile
    image: fastchat:latest
    ports:
      - "21001:21001"
    entrypoint:
      - "python3.9"
      - "-m"
      - "fastchat.serve.controller"
      - "--host"
      - "0.0.0.0"
      - "--port"
      - "21001"

  # Runs the `fastchat.serve.model_worker` module. It is given the controller
  # address and its own address using Compose service names as hostnames.
  fastchat-model-worker:
    build:
      context: .
      dockerfile: Dockerfile
    volumes:
      # Named volume mounted over the Hugging Face cache directory —
      # presumably so downloaded model files survive container re-creation.
      - huggingface:/root/.cache/huggingface
    image: fastchat:latest
    deploy:
      resources:
        reservations:
          # Reserve one NVIDIA device with the `gpu` capability.
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]
    # Model name and path come from the FASTCHAT_WORKER_MODEL_NAMES and
    # FASTCHAT_WORKER_MODEL_PATH environment variables; the `:-` form falls
    # back to the vicuna-7b-v1.5 defaults when a variable is unset or empty.
    entrypoint:
      - "python3.9"
      - "-m"
      - "fastchat.serve.model_worker"
      - "--model-names"
      - "${FASTCHAT_WORKER_MODEL_NAMES:-vicuna-7b-v1.5}"
      - "--model-path"
      - "${FASTCHAT_WORKER_MODEL_PATH:-lmsys/vicuna-7b-v1.5}"
      - "--worker-address"
      - "http://fastchat-model-worker:21002"
      - "--controller-address"
      - "http://fastchat-controller:21001"
      - "--host"
      - "0.0.0.0"
      - "--port"
      - "21002"

  # Runs the `fastchat.serve.openai_api_server` module, pointed at the
  # controller service and published on host port 8000.
  fastchat-api-server:
    build:
      context: .
      dockerfile: Dockerfile
    image: fastchat:latest
    ports:
      - "8000:8000"
    entrypoint:
      - "python3.9"
      - "-m"
      - "fastchat.serve.openai_api_server"
      - "--controller-address"
      - "http://fastchat-controller:21001"
      - "--host"
      - "0.0.0.0"
      - "--port"
      - "8000"

volumes:
  # Named volume with default settings; mounted by fastchat-model-worker.
  huggingface: {}