chansung committed on
Commit
73f0ed3
1 Parent(s): 6892c67

Update entrypoint.sh.template

Browse files
Files changed (1) hide show
  1. entrypoint.sh.template +2 -2
entrypoint.sh.template CHANGED
@@ -3,14 +3,14 @@
3
  if [[ "$QUANTIZATION" == "false" ]]; then
4
  text-generation-launcher --model-id $MODEL_NAME \
5
  --num-shard 1 --port 8080 --trust-remote-code \
6
- --max-concurrent-request $MAX_CONCURRENT_REQUESTS \
7
  --max-top-n-tokens $MAX_INPUT_LENGTH \
8
  --max-input-length $MAX_TOTAL_TOKENS \
9
  &
10
  else
11
  text-generation-launcher --model-id $MODEL_NAME \
12
  --num-shard 1 --port 8080 --trust-remote-code \
13
- --max-concurrent-request $MAX_CONCURRENT_REQUESTS \
14
  --max-top-n-tokens $MAX_INPUT_LENGTH \
15
  --max-input-length $MAX_TOTAL_TOKENS \
16
  --quantize $QUANTIZATION \
 
3
  if [[ "$QUANTIZATION" == "false" ]]; then
4
  text-generation-launcher --model-id $MODEL_NAME \
5
  --num-shard 1 --port 8080 --trust-remote-code \
6
+ --max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
7
  --max-top-n-tokens $MAX_INPUT_LENGTH \
8
  --max-input-length $MAX_TOTAL_TOKENS \
9
  &
10
  else
11
  text-generation-launcher --model-id $MODEL_NAME \
12
  --num-shard 1 --port 8080 --trust-remote-code \
13
+ --max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
14
  --max-top-n-tokens $MAX_INPUT_LENGTH \
15
  --max-input-length $MAX_TOTAL_TOKENS \
16
  --quantize $QUANTIZATION \