File size: 594 Bytes
433b752
 
 
d276b79
97dc701
6dee22b
 
bac467e
433b752
 
e11772a
433b752
6dee22b
94641ea
433b752
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
#!/bin/bash
#
# Launch script: starts text-generation-launcher in the background, polls its
# health endpoint, then starts the Gradio app (app/main.py) in the background,
# and exits with the status of whichever background process exits first.
#
# Environment:
#   MODEL_NAME  (required) value passed to --model-id.
#   QUANTIZE    (optional) value passed to --quantize. When unset, empty, or
#               "false", the launcher is started without --quantize.

# Fail fast with a clear message rather than handing the launcher a
# --model-id flag with no value (which would swallow the next flag).
: "${MODEL_NAME:?MODEL_NAME must be set to the model id to serve}"

# Build the command line as an array so each value stays a single argument
# regardless of whitespace or glob characters.
launcher_args=(
  --model-id "${MODEL_NAME}"
  --num-shard 1
  --port 8080
  --trust-remote-code
)

# Treat an unset/empty QUANTIZE like "false"; otherwise --quantize would be
# emitted without a value.
quantize="${QUANTIZE:-false}"
if [[ "${quantize}" != "false" ]]; then
  launcher_args+=(--quantize "${quantize}")
fi

# Start the text-generation-inference process
text-generation-launcher "${launcher_args[@]}" &

# Wait for text-generation-inference to start (up to 60 retries, 10s apart,
# retrying while the port still refuses connections).
if ! curl --retry 60 --retry-delay 10 --retry-connrefused http://127.0.0.1:8080/health; then
  # Keep going: the server may still come up later, so starting the app
  # remains best-effort, but make the failed check visible in the logs.
  printf 'warning: text-generation-inference health check did not succeed; starting app anyway\n' >&2
fi

# Start the gradio
python app/main.py &

# Wait for any process to exit (wait -n needs bash 4.3+)
wait -n

# Exit with status of process that exited first
exit $?