Commit b3e31f5 · Jae-Won Chung committed
1 Parent(s): e795d0f

Update docker-compose files
deployment/docker-compose-0.yaml
CHANGED

@@ -1,7 +1,7 @@
 services:
   MPT-7B:
     container_name: worker0
-    image: mlenergy/tgi:
+    image: mlenergy/tgi:v1.0.0
     command: ["--model-id", "mosaicml/mpt-7b-chat", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"]
     shm_size: 1g
     networks:
@@ -19,7 +19,7 @@ services:
              capabilities: [gpu]
   Llama2-7B:
     container_name: worker1
-    image: mlenergy/tgi:
+    image: mlenergy/tgi:v1.0.0
     command: ["--model-id", "/weights/metaai/Llama-2-7b-chat-hf", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"]
     shm_size: 1g
     networks:
@@ -38,7 +38,7 @@ services:
              capabilities: [gpu]
   Vicuna-13B:
     container_name: worker2
-    image: mlenergy/tgi:
+    image: mlenergy/tgi:v1.0.0
     command: ["--model-id", "lmsys/vicuna-13b-v1.5", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"]
     shm_size: 1g
     networks:
@@ -56,7 +56,7 @@ services:
              capabilities: [gpu]
   Llama2-13B:
     container_name: worker3
-    image: mlenergy/tgi:
+    image: mlenergy/tgi:v1.0.0
     command: ["--model-id", "/weights/metaai/Llama-2-13b-chat-hf", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"]
     shm_size: 1g
     networks:
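For context, every worker service in this file follows the same shape, and only the image tag changes in this commit. Below is a minimal sketch of one service with the newly pinned tag; the deploy/GPU-reservation layout, device id, and network name are illustrative assumptions (only the image, command, shm_size, networks, and capabilities: [gpu] lines actually appear in the hunks above):

services:
  MPT-7B:
    container_name: worker0
    image: mlenergy/tgi:v1.0.0
    command: ["--model-id", "mosaicml/mpt-7b-chat", "--num-shard", "1", "--otlp-endpoint", "http://jaeger:4317"]
    shm_size: 1g
    networks:
      - default                      # placeholder network name, not taken from this diff
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia         # assumed GPU reservation layout
              device_ids: ["0"]      # placeholder device id
              capabilities: [gpu]    # matches the context line in the hunks above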
deployment/docker-compose-1.yaml
CHANGED

@@ -1,7 +1,7 @@
 services:
   Llama2-70B-INT8:
     container_name: worker4
-    image: mlenergy/tgi:
+    image: mlenergy/tgi:v1.0.0
     command: ["--model-id", "meta-llama/Llama-2-70b-chat-hf", "--num-shard", "2", "--otlp-endpoint", "http://jaeger:4317", "--quantize", "bitsandbytes"]
     shm_size: 1g
     environment:
@@ -21,7 +21,7 @@ services:
              capabilities: [gpu]
   MPT-30B:
     container_name: worker5
-    image: mlenergy/tgi:
+    image: mlenergy/tgi:v1.0.0
     command: ["--model-id", "mosaicml/mpt-30b-chat", "--num-shard", "2", "--otlp-endpoint", "http://jaeger:4317"]
     shm_size: 1g
     networks:
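The 70B worker in docker-compose-1.yaml differs from the single-GPU workers: it shards across two GPUs and quantizes with bitsandbytes, and it declares an environment: block whose contents are not part of this diff. A minimal sketch of that service with the pinned tag, assuming the environment block carries a Hugging Face access token for the gated meta-llama weights (an assumption, not shown in this commit):

services:
  Llama2-70B-INT8:
    container_name: worker4
    image: mlenergy/tgi:v1.0.0
    command: ["--model-id", "meta-llama/Llama-2-70b-chat-hf", "--num-shard", "2", "--otlp-endpoint", "http://jaeger:4317", "--quantize", "bitsandbytes"]
    shm_size: 1g
    environment:
      HUGGING_FACE_HUB_TOKEN: ${HF_TOKEN}   # assumed placeholder; the real environment block is not shown in this diff

Pinning all six workers to an explicit mlenergy/tgi:v1.0.0 tag keeps them on the same TGI build across pulls; the stacks can then be started as usual, e.g. docker compose -f deployment/docker-compose-0.yaml up -d.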