dh-mc committed on
Commit
b05a046
1 Parent(s): bf1e59b

update tgi.sh

Browse files
Files changed (1) hide show
  1. tgi.sh +13 -4
tgi.sh CHANGED
@@ -1,9 +1,18 @@
1
  #!/bin/sh
2
 
3
- export HUGGINGFACE_MODEL_NAME_OR_PATH="meta-llama/Llama-2-7b-chat-hf"
 
 
 
4
 
5
- echo Running $HUGGINGFACE_MODEL_NAME_OR_PATH with TGI
6
 
7
- volume=$PWD/data # share a volume with the Docker container to avoid downloading weights every run
 
8
 
9
- docker run -e HUGGING_FACE_HUB_TOKEN=$HUGGINGFACE_AUTH_TOKEN --shm-size 1g -p 8081:80 -v $volume:/data ghcr.io/huggingface/text-generation-inference:1.0.0 --model-id $HUGGINGFACE_MODEL_NAME_OR_PATH
 
 
 
 
 
 
1
  #!/bin/sh
2
 
3
+ BASEDIR=$(dirname "$0")
4
+ cd "$BASEDIR"
5
+ echo Current Directory:
6
+ pwd
7
 
8
+ uname -a
9
 
10
+ # for $NGROK_AUTHTOKEN and $NGROK_EDGE
11
+ . env/ngrok.conf
12
 
13
+ export MODEL_ID="meta-llama/Llama-2-7b-chat-hf"
14
+ export QUANTIZE="--quantize bitsandbytes-fp4"
15
+
16
+ echo Running $MODEL_ID with TGI
17
+
18
+ text-generation-launcher --model-id $MODEL_ID --port $PORT --max-input-length 2048 --max-total-tokens 4096 --ngrok --ngrok-authtoken $NGROK_AUTHTOKEN --ngrok-edge $NGROK_EDGE $QUANTIZE