File size: 2,677 Bytes
8333668
653bb2f
46a86c9
 
653bb2f
 
 
 
71b2874
52494dd
387fdbf
bc2999d
 
 
 
d3d1749
 
 
c10e90a
 
07a246c
4f68ff6
d3d1749
c7977b2
a87320f
062a3e1
21ed67c
 
 
 
 
 
 
 
062a3e1
fbe0301
062a3e1
8e20bcd
21ed67c
062a3e1
8e20bcd
 
 
48ade90
35dbef9
4f68ff6
fbe0301
 
21ed67c
fbe0301
 
 
 
 
4d27f4c
8e20bcd
fbe0301
 
21ed67c
fbe0301
 
 
 
 
4f68ff6
46a86c9
157fd87
092b6ff
a2ea222
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
#!/bin/bash
#
# Environment setup: points the Hugging Face cache at /data, writes the access
# token to .hf_token, starts a periodic GPU monitor and prints a CUDA sanity
# check before any server is launched.

export HF_HOME="/data/.huggingface"

echo "PWD: $(pwd)"

# Write the token with owner-only permissions; the subshell keeps the stricter
# umask from leaking into the rest of the script. The expansion is quoted so
# the value is written verbatim (no word splitting or globbing).
if [[ -z "${HF_TOKEN:-}" ]]; then
  echo "warning: HF_TOKEN is not set; .hf_token will be empty" >&2
fi
(
  umask 077
  printf '%s\n' "${HF_TOKEN:-}" > .hf_token
)
# umask only affects newly created files; tighten a pre-existing one as well.
chmod 600 .hf_token

echo "LS: $(ls -als)"

# Print GPU status every 10 minutes in the background.
while true; do nvidia-smi; sleep 600; done &

# CUDA sanity check. A quoted heredoc avoids escaping every double quote.
# NOTE(review): current_device() is expected to raise when CUDA is unavailable,
# so it is only queried when is_available() is true — confirm against PyTorch docs.
python3 - <<'PY'
import torch

print(f"is available = {torch.cuda.is_available()}")
print(f"device count = {torch.cuda.device_count()}")
if torch.cuda.is_available():
    print(f"current device = {torch.cuda.current_device()}")
else:
    print("current device = none (CUDA is not available)")
PY


# Start the controller on port 10000 and block until uvicorn reports it is up.
COMPONENT="serve.controller"
CONTROLLER_LOG="serve.controller.log"
echo "Starting $COMPONENT"

# Start from an empty log: this guarantees the file exists before the first
# grep and that a readiness line left over from a previous run cannot match.
: > "$CONTROLLER_LOG"

# stderr is merged into the log because the readiness line is searched there.
nohup python3 -m serve.controller --host 0.0.0.0 --port 10000 2>&1 | tee "$CONTROLLER_LOG" &
# $! is the PID of the last pipeline stage (tee); tee exits once the Python
# process closes its end of the pipe, so it doubles as a liveness probe.
CONTROLLER_PIPE_PID=$!

until grep -qF -- "Uvicorn running on" "$CONTROLLER_LOG"; do
  if ! kill -0 "$CONTROLLER_PIPE_PID" 2>/dev/null; then
    # Fail fast instead of polling forever for a process that is gone.
    echo "$COMPONENT exited before it was ready; see $CONTROLLER_LOG" >&2
    exit 1
  fi
  sleep 2s
  echo "waiting for $COMPONENT to be running"
done
echo "$COMPONENT is running."

# Disabled: startup gets stuck after downloading config.json
# COMPONENT="interactive_demo prism-dinosiglip+13b"
# echo "Starting $COMPONENT"
# nohup python3 -m interactive_demo --port 40000 --model_id prism-dinosiglip+13b | tee prism-dinosiglip_13b.log &
# while [ `grep -c "loaded prismatic prism-dinosiglip+13b" prism-dinosiglip_13b.log` -eq '0' ];do
#         sleep 10s;
#         echo "waiting for $COMPONENT to be running"
# done
# echo "$COMPONENT is running"

# works!
# Worker for prism-dinosiglip+7b: restricted to CUDA device 0, listening on
# port 40001. Blocks until the worker logs that the model has been loaded.
COMPONENT="interactive_demo prism-dinosiglip_7b"
WORKER_LOG="prism-dinosiglip_7b.log"
echo "Starting $COMPONENT"

# Start from an empty log: this guarantees the file exists before the first
# grep and that a "loaded" line left over from a previous run cannot match.
: > "$WORKER_LOG"

CUDA_VISIBLE_DEVICES=0 nohup python3 -m interactive_demo --port 40001 --model_id prism-dinosiglip+7b | tee "$WORKER_LOG" &
# $! is the PID of the last pipeline stage (tee); tee exits once the Python
# process closes its end of the pipe, so it doubles as a liveness probe.
WORKER_PIPE_PID=$!

# -F matches the text literally, so the "+" in the model id is never treated
# as a regex operator.
until grep -qF -- "loaded prismatic prism-dinosiglip+7b" "$WORKER_LOG"; do
  if ! kill -0 "$WORKER_PIPE_PID" 2>/dev/null; then
    # Fail fast instead of polling forever for a process that is gone.
    echo "$COMPONENT exited before it finished loading; check the output above" >&2
    exit 1
  fi
  sleep 10s
  echo "waiting for $COMPONENT to be running"
done
echo "$COMPONENT is running."

# works!
# Worker for prism-dinosiglip-controlled+7b: restricted to CUDA device 1,
# listening on port 40002. Blocks until the worker logs that the model has
# been loaded.
COMPONENT="interactive_demo prism-dinosiglip-controlled+7b"
WORKER_LOG="prism-dinosiglip-controlled_7b.log"
echo "Starting $COMPONENT"

# Start from an empty log: this guarantees the file exists before the first
# grep and that a "loaded" line left over from a previous run cannot match.
: > "$WORKER_LOG"

CUDA_VISIBLE_DEVICES=1 nohup python3 -m interactive_demo --port 40002 --model_id prism-dinosiglip-controlled+7b | tee "$WORKER_LOG" &
# $! is the PID of the last pipeline stage (tee); tee exits once the Python
# process closes its end of the pipe, so it doubles as a liveness probe.
WORKER_PIPE_PID=$!

# -F matches the text literally, so the "+" in the model id is never treated
# as a regex operator.
until grep -qF -- "loaded prismatic prism-dinosiglip-controlled+7b" "$WORKER_LOG"; do
  if ! kill -0 "$WORKER_PIPE_PID" 2>/dev/null; then
    # Fail fast instead of polling forever for a process that is gone.
    echo "$COMPONENT exited before it finished loading; check the output above" >&2
    exit 1
  fi
  sleep 10s
  echo "waiting for $COMPONENT to be running"
done
echo "$COMPONENT is running"

# works!
# Worker for llava-v1.5-7b (model family llava-v15, weights from
# liuhaotian/llava-v1.5-7b): restricted to CUDA device 2, listening on port
# 40003. Blocks until the worker logs that the model has been loaded.
COMPONENT="interactive_demo llava-v1.5-7b"
WORKER_LOG="llava-v1.5-7b.log"
echo "Starting $COMPONENT"

# Start from an empty log: this guarantees the file exists before the first
# grep and that a "loaded" line left over from a previous run cannot match.
: > "$WORKER_LOG"

CUDA_VISIBLE_DEVICES=2 nohup python3 -m interactive_demo --port 40003 --model_family llava-v15 --model_id llava-v1.5-7b --model_dir liuhaotian/llava-v1.5-7b | tee "$WORKER_LOG" &
# $! is the PID of the last pipeline stage (tee); tee exits once the Python
# process closes its end of the pipe, so it doubles as a liveness probe.
WORKER_PIPE_PID=$!

# -F matches the text literally, so the "." in "v1.5" cannot match an
# arbitrary character.
until grep -qF -- "loaded llava llava-v1.5-7b" "$WORKER_LOG"; do
  if ! kill -0 "$WORKER_PIPE_PID" 2>/dev/null; then
    # Fail fast instead of polling forever for a process that is gone.
    echo "$COMPONENT exited before it finished loading; check the output above" >&2
    exit 1
  fi
  sleep 10s
  echo "waiting for $COMPONENT to be running"
done
echo "$COMPONENT is running"

# Show the contents of the directory HF_HOME points to, then a size tree of it.
# The expansion is quoted so the path is always passed as a single argument.
ls -als "$HF_HOME"
if command -v tree >/dev/null 2>&1; then
  tree --du -h "$HF_HOME"
else
  # The size tree is purely informational; do not let a missing tool add noise.
  echo "tree is not installed; skipping size tree of $HF_HOME" >&2
fi

# Run the web UI in the foreground, pointed at the local controller on port
# 10000. The script blocks here until the server exits.
echo "Starting serve.gradio_web_server"
python3 -m serve.gradio_web_server --controller http://127.0.0.1:10000 --model-list-mode reload # --share