Spaces:
Running
Running
services: | |
MPT-7B: | |
container_name: worker0 | |
image: mlenergy/tgi:v1.0.0 | |
command: ["--model-id", "mosaicml/mpt-7b-chat", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"] | |
shm_size: 1g | |
networks: | |
- leaderboard | |
volumes: | |
- /data/leaderboard/tgi-data:/data | |
deploy: | |
restart_policy: | |
condition: any | |
resources: | |
reservations: | |
devices: | |
- driver: nvidia | |
device_ids: ["0"] | |
capabilities: [gpu] | |
Llama2-7B: | |
container_name: worker1 | |
image: mlenergy/tgi:v1.0.0 | |
command: ["--model-id", "/weights/metaai/Llama-2-7b-chat-hf", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"] | |
shm_size: 1g | |
networks: | |
- leaderboard | |
volumes: | |
- /data/leaderboard/tgi-data:/data | |
- /data/leaderboard/weights:/weights | |
deploy: | |
restart_policy: | |
condition: any | |
resources: | |
reservations: | |
devices: | |
- driver: nvidia | |
device_ids: ["1"] | |
capabilities: [gpu] | |
Vicuna-13B: | |
container_name: worker2 | |
image: mlenergy/tgi:v1.0.0 | |
command: ["--model-id", "lmsys/vicuna-13b-v1.5", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"] | |
shm_size: 1g | |
networks: | |
- leaderboard | |
volumes: | |
- /data/leaderboard/tgi-data:/data | |
deploy: | |
restart_policy: | |
condition: any | |
resources: | |
reservations: | |
devices: | |
- driver: nvidia | |
device_ids: ["2"] | |
capabilities: [gpu] | |
Llama2-13B: | |
container_name: worker3 | |
image: mlenergy/tgi:v1.0.0 | |
command: ["--model-id", "/weights/metaai/Llama-2-13b-chat-hf", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"] | |
shm_size: 1g | |
networks: | |
- leaderboard | |
volumes: | |
- /data/leaderboard/tgi-data:/data | |
- /data/leaderboard/weights:/weights | |
deploy: | |
restart_policy: | |
condition: any | |
resources: | |
reservations: | |
devices: | |
- driver: nvidia | |
device_ids: ["3"] | |
capabilities: [gpu] | |
networks: | |
leaderboard: | |
name: leaderboard | |
external: true | |