hafidhsoekma committed on
Commit
9c40bcd
1 Parent(s): 6d2193e

Update entrypoint.sh.template

Browse files
Files changed (1) hide show
  1. entrypoint.sh.template +1 -3
entrypoint.sh.template CHANGED
@@ -5,9 +5,7 @@ mongod &
5
 
6
  # Start the text-generation-inference process
7
  pip3 install -U transformers && pip install -U transformers
8
- # mkdir /data/model_gptq
9
- # text-generation-server quantize ${MODEL_NAME} /data/model_gptq
10
- text-generation-launcher --model-id TheBloke/Llama-2-7B-GPTQ --quantize gptq --num-shard 1 --port 8080 &
11
 
12
  # Wait for text-generation-inference to start
13
  curl --retry 60 --retry-delay 10 --retry-connrefused http://127.0.0.1:8080/health
 
5
 
6
  # Start the text-generation-inference process
7
  pip3 install -U transformers && pip install -U transformers
8
+ text-generation-launcher --model-id ${MODEL_NAME} --quantize bitsandbytes-nf4 --num-shard 1 --port 8080 --trust-remote-code &
 
 
9
 
10
  # Wait for text-generation-inference to start
11
  curl --retry 60 --retry-delay 10 --retry-connrefused http://127.0.0.1:8080/health