#!/bin/bash
# CI driver script: prepares the environment, starts the FastDeploy
# OpenAI-compatible API server, waits for it to become healthy, runs the
# inference test and reports its exit status.

# Absolute path of the directory that contains this script.
DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
echo "Current directory: ${DIR}"

# Clean up the environment.
# Every process whose command line contains "python" is force-killed so that
# leftovers from a previous run cannot interfere with this one.
# pgrep exits non-zero when nothing matches; that is not an error here.
mapfile -t fastdeploy_python_pids < <(pgrep -f "python" || true)
echo "Process to clear:"
echo "${fastdeploy_python_pids[*]}"
for in_pid in "${fastdeploy_python_pids[@]}"; do
    # Never kill this script itself, even if its own path matches.
    [[ "${in_pid}" == "$$" ]] && continue
    # The process may already have exited; keep going regardless.
    kill -9 "${in_pid}" || true
done
echo "Clear done."

# Location of the model to serve. Fail immediately when MODEL_PATH is missing:
# otherwise the path silently becomes "/ERNIE-4.5-21B-A3B-Paddle" and the
# problem only shows up after the server health check times out.
: "${MODEL_PATH:?MODEL_PATH must be set to the directory containing ERNIE-4.5-21B-A3B-Paddle}"
export model_path="${MODEL_PATH}/ERNIE-4.5-21B-A3B-Paddle"

# requirements.txt and build.sh are resolved relative to the current
# working directory.
echo "pip install requirements"
python -m pip install -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple

# Replace any preinstalled paddlepaddle / paddle-custom-gcu with the pinned
# versions below.
echo "uninstall org"
python -m pip uninstall paddlepaddle -y
python -m pip uninstall paddle-custom-gcu -y
python -m pip install paddlepaddle==3.1.0a0 -i https://www.paddlepaddle.org.cn/packages/stable/cpu/
python -m pip install --pre paddle-custom-gcu==3.0.0.dev20250801 -i https://www.paddlepaddle.org.cn/packages/nightly/gcu/

# A failed build aborts the whole run.
echo "build whl"
bash build.sh 1 || exit 1

# Drop proxy settings before the server is started.
unset http_proxy https_proxy no_proxy

# Remove logs and core dumps left in the working directory by earlier runs.
rm -rf log/*
rm -f core*

# Empty the message queue
ipcrm --all=msg
echo "Start server..."
31
36
python -m fastdeploy.entrypoints.openai.api_server \
32
37
--model ${model_path} \
33
38
--port 8188 \
@@ -38,21 +43,23 @@ python -m fastdeploy.entrypoints.openai.api_server \
38
43
--max-num-seqs 8 \
39
44
--quantization wint4 > server.log 2>&1 &

# Fixed warm-up before polling starts. Kept in one variable so the sleep and
# the total time reported on success cannot drift apart.
WARMUP_SECONDS=90
echo "Waiting ${WARMUP_SECONDS} seconds..."
sleep "${WARMUP_SECONDS}"

# Health check: poll the endpoint every INTERVAL seconds until it answers
# HTTP 200 or TIMEOUT seconds of polling have elapsed.
TIMEOUT=$(( 11 * 60 ))
INTERVAL=10  # Check interval (seconds)
ENDPOINT="http://0.0.0.0:8188/health"
START_TIME=$(date +%s)  # Record the start timestamp (taken after the warm-up)
echo "Start the server health check, maximum waiting time: ${TIMEOUT} seconds..."
while true; do
    # Time spent polling so far (excludes the warm-up sleep)
    CURRENT_TIME=$(date +%s)
    ELAPSED=$(( CURRENT_TIME - START_TIME ))

    # Timeout: dump the server and worker logs, then fail the run
    if (( ELAPSED >= TIMEOUT )); then
        echo -e "\nServer start timeout: After $(( TIMEOUT / 60 )) minutes, the service still doesn't start!"
        cat server.log
        cat log/workerlog.0
        exit 1
    fi

    # "|| true" keeps a refused connection from being treated as a failure;
    # curl is limited to 2 seconds per attempt.
    HTTP_CODE=$(curl -s -o /dev/null -w "%{http_code}" -m 2 "$ENDPOINT" || true)

    if [ "$HTTP_CODE" = "200" ]; then
        # Total start-up time = warm-up sleep + time spent polling.
        echo -e "\nThe server was successfully launched! Totally takes $(( ELAPSED + WARMUP_SECONDS )) seconds."
        break
    else
        sleep "$INTERVAL"
    fi
done

# Show the server start-up log before running the test.
cat server.log
echo -e "\n"

# Run the inference test and remember its status; the server is stopped
# before that status is acted upon.
echo "Start inference..."
python test/ci_use/GCU/run_ernie.py
exit_code=$?
echo -e "exit_code is ${exit_code}.\n"

# Stop the server by force-killing every process whose command line contains
# "python". pgrep exits non-zero when nothing matches; that is not an error.
echo "Stop server..."
mapfile -t fastdeploy_python_pids < <(pgrep -f "python" || true)
echo "Process to stop:"
echo "${fastdeploy_python_pids[*]}"
for in_pid in "${fastdeploy_python_pids[@]}"; do
    # Never kill this script itself, even if its own path matches.
    [[ "${in_pid}" == "$$" ]] && continue
    # The process may already have exited; keep going regardless.
    kill -9 "${in_pid}" || true
done
echo "Stop server done."

# Propagate an inference failure, printing the worker log for diagnosis.
if [ "${exit_code}" -ne 0 ]; then
    echo "Exit with error, please refer to log/workerlog.0"
    cat log/workerlog.0
    exit 1
fi