mirror of
https://github.com/fauxpilot/fauxpilot.git
synced 2025-08-21 13:54:29 -07:00
Initial commit
This commit is contained in:
commit
a23a1478f7
65 changed files with 157042 additions and 0 deletions
24
docker-compose.yaml
Normal file
24
docker-compose.yaml
Normal file
|
@ -0,0 +1,24 @@
|
|||
# Compose definition for two services: the `triton` inference server and the
# `copilot_proxy` Flask front end.
#
# Two variables are interpolated by Compose and must be set in the shell
# environment or in a `.env` file next to this file:
#   GPUS       - value assigned to CUDA_VISIBLE_DEVICES inside the triton
#                container
#   MODEL_DIR  - host directory bind-mounted at /model and passed to
#                tritonserver as its --model-repository
version: '3.3'
services:
  triton:
    image: moyix/triton_with_ft:22.06
    # Launches a single tritonserver process under mpirun (-n 1);
    # --allow-run-as-root is passed because mpirun is started from `bash -c`
    # inside the container (presumably as root - confirm against the image).
    command: bash -c "CUDA_VISIBLE_DEVICES=${GPUS} mpirun -n 1 --allow-run-as-root /opt/tritonserver/bin/tritonserver --model-repository=/model"
    shm_size: '2gb'
    volumes:
      - ${MODEL_DIR}:/model
    # Published 1:1 on the host. NOTE(review): these look like Triton's
    # default HTTP / gRPC / metrics ports - confirm against the Triton docs.
    ports:
      - "8000:8000"
      - "8001:8001"
      - "8002:8002"
    # Reserve every NVIDIA GPU on the host for this container; the GPUS
    # variable above then controls which of them the process actually sees.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]
  copilot_proxy:
    # NOTE(review): `latest` is a floating tag; pin a version if
    # reproducible deployments are required.
    image: moyix/copilot_proxy:latest
    # Flask listens on all interfaces so the published port below is reachable
    # from outside the container.
    command: python3 -m flask run --host=0.0.0.0 --port=5000
    ports:
      - "5000:5000"
|
Loading…
Add table
Add a link
Reference in a new issue