chansung committed on
Commit
8385e49
1 Parent(s): 491b3b6
Files changed (1) hide show
  1. entrypoint.sh.template +4 -4
entrypoint.sh.template CHANGED
@@ -4,15 +4,15 @@ if [[ "$QUANTIZATION" == "false" ]]; then
4
  text-generation-launcher --model-id $MODEL_NAME \
5
  --num-shard 1 --port 8080 --trust-remote-code \
6
  --max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
7
- --max-top-n-tokens $MAX_INPUT_LENGTH \
8
- --max-input-length $MAX_TOTAL_TOKENS \
9
  &
10
  else
11
  text-generation-launcher --model-id $MODEL_NAME \
12
  --num-shard 1 --port 8080 --trust-remote-code \
13
  --max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
14
- --max-top-n-tokens $MAX_INPUT_LENGTH \
15
- --max-input-length $MAX_TOTAL_TOKENS \
16
  --quantize $QUANTIZATION \
17
  &
18
  fi
 
4
  text-generation-launcher --model-id $MODEL_NAME \
5
  --num-shard 1 --port 8080 --trust-remote-code \
6
  --max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
7
+ --max-input-length $MAX_INPUT_LENGTH \
8
+ --max-total-tokens $MAX_TOTAL_TOKENS \
9
  &
10
  else
11
  text-generation-launcher --model-id $MODEL_NAME \
12
  --num-shard 1 --port 8080 --trust-remote-code \
13
  --max-concurrent-requests $MAX_CONCURRENT_REQUESTS \
14
+ --max-input-length $MAX_INPUT_LENGTH \
15
+ --max-total-tokens $MAX_TOTAL_TOKENS \
16
  --quantize $QUANTIZATION \
17
  &
18
  fi