Spaces:

chansung
/

gradio_together_tgi

Sleeping

File size: 1,112 Bytes

433b752
 
2faeeb9
 
6cb335f
 
a47da2f
597f529
a47da2f
6cb335f
597f529
cd75e75
6cb335f
cd75e75
 
 
597f529
cd75e75
 
 
 
 
597f529
4e7d56d
cfffe9e
a47da2f
4e7d56d
597f529
bac467e
433b752
 
e11772a
433b752
6dee22b
f28f0b8
433b752

#!/bin/bash

#######################################
# Strip leading and trailing whitespace from a string.
# Arguments: $1 - the string to trim (may be empty)
# Outputs:   the trimmed string on stdout, without a trailing newline
#######################################
trim_whitespace() {
  local value=${1-}
  # Remove the longest all-whitespace prefix, then the longest
  # all-whitespace suffix. The inner expansions are quoted so their
  # result is matched literally rather than as a glob pattern.
  value="${value#"${value%%[![:space:]]*}"}"
  value="${value%"${value##*[![:space:]]}"}"
  printf '%s' "$value"
}

# Normalise the configuration taken from the environment. Values are
# quoted throughout so they are never word-split or glob-expanded.
MODEL_NAME=$(trim_whitespace "${MODEL_NAME:-}")
QUANTIZATION=$(trim_whitespace "${QUANTIZATION:-}")
GRADIO_PORT=$(trim_whitespace "${GRADIO_PORT:-}")

# The rest of the script reads QUANTIZATION; QUANTIZE is accepted as a
# fallback name only when QUANTIZATION is empty.
# NOTE(review): confirm which of the two names the deployment actually sets.
if [[ -z "$QUANTIZATION" ]]; then
  QUANTIZATION=$(trim_whitespace "${QUANTIZE:-}")
fi

# Log the effective (trimmed) values that the following steps will use.
echo "MODEL_NAME: $MODEL_NAME"
echo "QUANTIZATION: $QUANTIZATION"
echo "GRADIO_PORT: $GRADIO_PORT"

#######################################
# Build the argument list for text-generation-launcher.
# Globals:   launcher_args (written) - array holding the arguments
# Arguments: $1 - model id
#            $2 - quantization scheme; "false" or empty means none
#######################################
build_launcher_args() {
  local model_id=${1-}
  local quantization=${2-}

  launcher_args=(--model-id "$model_id" --num-shard 1 --port 8080 --trust-remote-code)

  # An empty value is handled like "false": otherwise --quantize would be
  # passed without any scheme following it.
  if [[ -n "$quantization" && "$quantization" != "false" ]]; then
    launcher_args+=(--quantize "$quantization")
  fi
}

build_launcher_args "${MODEL_NAME:-}" "${QUANTIZATION:-}"

# Start text-generation-inference in the background; the array keeps every
# argument as a single word regardless of its content.
echo "Starting text-generation-launcher ${launcher_args[*]}"
text-generation-launcher "${launcher_args[@]}" &

# Wait for text-generation-inference to start: curl retries the health
# endpoint up to 60 times, 10 seconds apart, including when the connection
# is refused. A failure is reported but does not stop the script, so the
# gradio app is still started if the server needs longer than the retry
# window to come up.
if ! curl --retry 60 --retry-delay 10 --retry-connrefused http://127.0.0.1:8080/health; then
  echo "warning: health check on http://127.0.0.1:8080/health did not succeed" >&2
fi

# Start the gradio app in the background
python app/main.py --port "$GRADIO_PORT" &

# Wait for any background process to exit
wait -n

# Exit with status of process that exited first
exit "$?"