File size: 2,479 Bytes
8333668 653bb2f 46a86c9 653bb2f 71b2874 52494dd 387fdbf bc2999d e5c817a a87320f 8333668 98c0fb0 4d836a9 98c0fb0 dbc88c0 4d836a9 e5c817a dbc88c0 78242ba dbc88c0 78242ba 52494dd 4d836a9 4d27f4c 46a86c9 157fd87 092b6ff 4d27f4c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 |
#!/bin/bash
# Launch script: sets up the Hugging Face environment, prints some
# diagnostics about the working directory and the GPUs, and starts a
# periodic GPU monitor in the background.

export HF_HOME="/data/.huggingface"

echo "PWD: $(pwd)"

# Write the token to .hf_token in the current directory.
# - The expansion is quoted so the value is written verbatim (no word
#   splitting or globbing); printf avoids echo's option parsing.
# - The subshell keeps the restrictive umask local, so a newly created token
#   file is readable by the owner only.
(
  umask 077
  printf '%s\n' "${HF_TOKEN:-}" > .hf_token
)

echo "LS: $(ls -als)"

# Print the GPU status every 10 minutes for as long as the script lives.
while true; do
  nvidia-smi
  sleep 600
done &

# One-off CUDA sanity check. The quoted heredoc delimiter keeps the shell from
# expanding anything inside the Python snippet.
python3 - <<'PY'
import torch

cuda_ok = torch.cuda.is_available()
print(f"is availeble = {cuda_ok}")
print(f"device count = {torch.cuda.device_count()}")
# current_device() raises when CUDA cannot be initialised, so only query it
# when a device is actually available.
print(f"current device = {torch.cuda.current_device() if cuda_ok else None}")
PY
#######################################
# Start a component in the background and block until its log shows that it
# is ready.
# Globals:
#   RUN_AND_WAIT_POLL_INTERVAL (read, optional) - seconds to sleep between
#     two checks of the log; defaults to 1.
# Arguments:
#   $1 - the component name, e.g. "serve.controller"; the component's output
#        is written to "$1.log" in the current directory
#   $2 - the command to execute, as one string
#   $3 - the log entry (fixed text) that indicates the component is ready
# Outputs:
#   Progress messages and the component's own output (through tee) on stdout.
# Returns:
#   0 once the ready text was found in the log,
#   1 if the command finished without ever printing it,
#   2 if fewer than three arguments were given.
#######################################
RUN_AND_WAIT() {
  if (( $# < 3 )); then
    echo "usage: RUN_AND_WAIT <component> <command> <ready-log-text>" >&2
    return 2
  fi

  local component=$1
  local command=$2
  local ready_text=$3
  local log_file="${component}.log"
  local poll_interval=${RUN_AND_WAIT_POLL_INTERVAL:-1}
  local tee_pid

  echo "Starting $component"

  # Create/empty the log up front so grep never sees a missing file or a
  # stale "ready" line left over from an earlier run.
  : > "$log_file"

  # nohup needs a real executable; `eval` is a shell builtin, so the command
  # string is handed to a child bash instead.
  nohup bash -c "$command" 2>&1 | tee "$log_file" &
  tee_pid=$! # PID of tee, which exits once the command closes its output

  # -F: the ready text is matched literally; --: it may start with a dash.
  while ! grep -qF -- "$ready_text" "$log_file"; do
    if ! kill -0 "$tee_pid" 2>/dev/null; then
      # The pipeline is gone. Look one last time in case the ready line was
      # written between the previous check and the exit.
      if grep -qF -- "$ready_text" "$log_file"; then
        break
      fi
      echo "$component exited before becoming ready (see $log_file)" >&2
      return 1
    fi
    sleep "$poll_interval"
    echo "wait $component to be running"
  done

  echo "$component is running"
}
# Start the controller and block until READY_LOG shows up in its log.
COMPONENT="serve.controller"
# The whole command line must be quoted: unquoted, the shell reads
# `COMMAND=python3` as a temporary environment assignment and tries to run
# `-m` as a program, leaving COMMAND unset.
COMMAND="python3 -m $COMPONENT --host 0.0.0.0 --port 10000"
READY_LOG="Uvicorn running on"
# Quoted so that each value reaches RUN_AND_WAIT as exactly one parameter.
RUN_AND_WAIT "$COMPONENT" "$COMMAND" "$READY_LOG"
# COMPONENT="serve.controller"
# echo "Starting $COMPONENT"
# nohup python3 -m $COMPONENT --host 0.0.0.0 --port 10000 2>&1 | tee "$COMPONENT.log" &
# while [ `grep -c "Uvicorn running on" "$COMPONENT.log"` -eq '0' ];do
# sleep 1s;
# echo "wait $COMPONENT to be running"
# done
# echo "$COMPONENT is running"
# sleep 30
# echo "Starting prism-dinosiglip+13b"
# python3 -m interactive_demo --port 40000 --model_id prism-dinosiglip+13b &
# P4=$!
# echo "Starting prism-dinosiglip+7b"
# python3 -m interactive_demo --port 40000 --model_id prism-dinosiglip+7b &
# Start the interactive demo worker and block until READY_LOG shows up in
# its log.
COMPONENT="interactive_demo"
# Quoted so the full command line is stored in COMMAND (unquoted, the shell
# would try to run `-m` with COMMAND=python3 in its environment).
# The model id is "prism-dinosiglip+7b", matching the text READY_LOG waits for.
COMMAND="python3 -m $COMPONENT --port 40000 --model_id prism-dinosiglip+7b"
READY_LOG="loaded prismatic prism-dinosiglip+7b"
# Quoted so that each value reaches RUN_AND_WAIT as exactly one parameter.
RUN_AND_WAIT "$COMPONENT" "$COMMAND" "$READY_LOG"
# echo "Starting $COMPONENT"
# nohup | tee "$COMPONENT.log" &
# while [ `grep -c "loaded prismatic prism-dinosiglip+7b" "$COMPONENT.log"` -eq '0' ];do
# sleep 1s;
# echo "wait $COMPONENT to be running"
# done
# echo "$COMPONENT is running"
# python3 -m interactive_demo --port 40002 --model_id prism-dinosiglip-controlled+7b &
# P6=$!
# python3 -m interactive_demo --port 40003 --model_id llava-v1.5-7b &
# P7=$!
# Fixed pause before the web server is started.
# NOTE(review): presumably gives the previously started components time to
# settle - confirm whether 30 s is still needed.
sleep 30

echo "Starting serve.gradio_web_server"
python3 -m serve.gradio_web_server --controller http://127.0.0.1:10000 --model-list-mode reload & # --share
P_WEB=$!

sleep 30

# Show what ended up in the Hugging Face cache directory.
ls -als "$HF_HOME"
if command -v tree >/dev/null 2>&1; then
  tree --du -h "$HF_HOME"
else
  # tree is an optional tool; its absence should not look like a failure.
  echo "tree is not installed; skipping the directory tree listing" >&2
fi

# Keep the script alive while the web server runs. P_CON and P_P7B are not
# assigned anywhere in the visible script, so they are only passed to wait
# when they happen to be set.
wait ${P_CON:+"$P_CON"} "$P_WEB" ${P_P7B:+"$P_P7B"} # $P5 $P6 $P7