-
Notifications
You must be signed in to change notification settings - Fork 83
Expand file tree
/
Copy pathlaunch_sglang_server.sh
More file actions
110 lines (96 loc) · 3.43 KB
/
launch_sglang_server.sh
File metadata and controls
110 lines (96 loc) · 3.43 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
#!/bin/bash
###############################################################################
# SGLang Server Launcher
###############################################################################
export RING_DEGREE=2
export ULYSSES_DEGREE=4
export TP_SIZE=1
export PORT=30000
# 模型路径(用于判断模型类型)。请通过环境变量 MOVA_MODEL_PATH 设置,例如:
# export MOVA_MODEL_PATH="/path/to/your/MOVA-360p-hf"
# 若不设置,需在下方 DEFAULT_MODEL_PATH 中填写你的模型目录。
DEFAULT_MODEL_PATH="${MOVA_MODEL_PATH:-}"
if [ -z "$DEFAULT_MODEL_PATH" ]; then
echo "Error: MOVA_MODEL_PATH is not set. Please set it to your MOVA checkpoint directory (e.g. .../MOVA-360p-hf)." >&2
exit 1
fi
MODEL_PATH="$DEFAULT_MODEL_PATH"
# 根据模型路径判断模型类型
if [[ "$MODEL_PATH" == *"360p"* ]]; then
MODEL_KEY="mova-360p"
elif [[ "$MODEL_PATH" == *"720p"* ]]; then
MODEL_KEY="mova-720p"
else
MODEL_KEY="mova-360p" # 默认
echo "Warning: Could not determine model type from path, defaulting to mova-360p" >&2
fi
# 获取脚本目录
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
# 切换到脚本目录,确保相对路径正确
cd "$SCRIPT_DIR"
# 统一输出目录:如果环境变量 SG_OUTPUT_DIR 未设置,使用相对路径 outputs/sglang_output
if [ -z "$SG_OUTPUT_DIR" ]; then
# 使用相对路径,相对于脚本目录
SG_OUTPUT_DIR="${SCRIPT_DIR}/outputs/sglang_output"
fi
# 确保目录存在
mkdir -p "$SG_OUTPUT_DIR"
# Colors
GREEN='\033[0;32m'
BLUE='\033[0;34m'
YELLOW='\033[1;33m'
NC='\033[0m' # No Color
echo -e "${BLUE}========================================${NC}"
echo -e "${BLUE}SGLang Server Launcher${NC}"
echo -e "${BLUE}========================================${NC}"
echo ""
echo -e "${GREEN}Configuration:${NC}"
echo -e " Model: ${MODEL_KEY}"
echo -e " Port: ${PORT}"
echo -e " GPUs: $((RING_DEGREE*ULYSSES_DEGREE*TP_SIZE))"
echo -e " Output Directory: ${SG_OUTPUT_DIR}"
echo ""
# 启动服务器(后台运行)
echo -e "${GREEN}Starting SGLang server...${NC}"
sglang serve \
--host 0.0.0.0 \
--port ${PORT} \
--model-path "${MODEL_PATH}" \
--adjust_frames 'false' \
--num-gpus $((RING_DEGREE*ULYSSES_DEGREE*TP_SIZE)) \
--ring-degree ${RING_DEGREE} \
--ulysses-degree ${ULYSSES_DEGREE} \
--tp ${TP_SIZE} \
--enable-torch-compile \
--save-output \
--output-path "$SG_OUTPUT_DIR" &
SERVER_PID=$!
# 等待服务器启动
echo -e "${YELLOW}Waiting for server to start...${NC}"
for i in {1..30}; do
if curl -s "http://localhost:${PORT}/health" > /dev/null 2>&1 || \
curl -s "http://localhost:${PORT}/v1/models" > /dev/null 2>&1 || \
netstat -tuln 2>/dev/null | grep -q ":${PORT}" || \
ss -tuln 2>/dev/null | grep -q ":${PORT}"; then
echo -e "${GREEN}✓ Server is ready!${NC}"
break
fi
sleep 2
echo -n "."
done
echo ""
# 显示访问信息
echo -e "${BLUE}========================================${NC}"
echo -e "${GREEN}Server Access Information:${NC}"
echo -e "${BLUE}========================================${NC}"
echo ""
echo -e "Local URL:"
echo -e " ${GREEN}http://localhost:${PORT}${NC}"
echo -e " ${GREEN}http://127.0.0.1:${PORT}${NC}"
echo ""
echo -e "${YELLOW}Server PID: ${SERVER_PID}${NC}"
echo -e "${YELLOW}To stop the server, run: kill ${SERVER_PID}${NC}"
echo ""
echo -e "${BLUE}========================================${NC}"
# 保持脚本运行(等待服务器进程)
wait $SERVER_PID