Spaces:
Runtime error
Runtime error
Update entrypoint.sh.template
Browse files
- entrypoint.sh.template +2 -2
entrypoint.sh.template
CHANGED
@@ -3,14 +3,14 @@
|
|
3 |
if [[ "$QUANTIZATION" == "false" ]]; then
|
4 |
text-generation-launcher --model-id $MODEL_NAME \
|
5 |
--num-shard 1 --port 8080 --trust-remote-code \
|
6 |
-
--max-concurrent-
|
7 |
--max-top-n-tokens $MAX_INPUT_LENGTH \
|
8 |
--max-input-length $MAX_TOTAL_TOKENS \
|
9 |
&
|
10 |
else
|
11 |
text-generation-launcher --model-id $MODEL_NAME \
|
12 |
--num-shard 1 --port 8080 --trust-remote-code \
|
13 |
-
--max-concurrent-
|
14 |
--max-top-n-tokens $MAX_INPUT_LENGTH \
|
15 |
--max-input-length $MAX_TOTAL_TOKENS \
|
16 |
--quantize $QUANTIZATION \
|
|
|
3 |
if [[ "$QUANTIZATION" == "false" ]]; then
|
4 |
text-generation-launcher --model-id $MODEL_NAME \
|
5 |
--num-shard 1 --port 8080 --trust-remote-code \
|
6 |
+
--max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
|
7 |
--max-top-n-tokens $MAX_INPUT_LENGTH \
|
8 |
--max-input-length $MAX_TOTAL_TOKENS \
|
9 |
&
|
10 |
else
|
11 |
text-generation-launcher --model-id $MODEL_NAME \
|
12 |
--num-shard 1 --port 8080 --trust-remote-code \
|
13 |
+
--max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
|
14 |
--max-top-n-tokens $MAX_INPUT_LENGTH \
|
15 |
--max-input-length $MAX_TOTAL_TOKENS \
|
16 |
--quantize $QUANTIZATION \
|