Skip to content

Commit 68a2c9e

Browse files
authored
Create deploy.sh
1 parent 7bde195 commit 68a2c9e

File tree

1 file changed

+142
-0
lines changed
  • llm-localization/ascend/mindie/docker

1 file changed

+142
-0
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,142 @@
1+
#!/bin/bash
2+
3+
# Log the raw command-line arguments exactly as they were received.
echo "入参:" "$@"

#######################################
# Parse "--key=value" style options into global variables.
# Unrecognized arguments are ignored. When an option is repeated, the last
# occurrence wins. Everything after the first "=" is taken as the value, so
# values may themselves contain "=", whitespace or glob characters.
# Globals (written only when the matching option is present):
#   model_name, model_weight_path, world_size, npu_mem_size
# Arguments:
#   The script's command-line arguments.
#######################################
parse_args() {
  local arg
  for arg in "$@"; do
    case "$arg" in
      --model_name=*)
        model_name=${arg#*=}
        ;;
      --model_weight_path=*)
        model_weight_path=${arg#*=}
        ;;
      --world_size=*)
        world_size=${arg#*=}
        ;;
      --npu_mem_size=*)
        npu_mem_size=${arg#*=}
        ;;
    esac
  done
}

parse_args "$@"
20+
21+
# Fall back to built-in defaults for every option that was not supplied
# (or was supplied with an empty value).
model_name=${model_name:-default}
model_weight_path=${model_weight_path:-/workspace/models}
world_size=${world_size:-4}
npu_mem_size=${npu_mem_size:-8}

#######################################
# Succeed only when the argument is a base-10 integer >= 1 without a sign
# or leading zero.
# Arguments:
#   $1 - value to check
# Returns:
#   0 if the value is a positive integer, 1 otherwise
#######################################
is_positive_int() {
  [[ $1 =~ ^[1-9][0-9]*$ ]]
}

# world_size is later evaluated in shell arithmetic and written unquoted into
# the JSON config, so reject anything that is not a plain positive integer
# instead of silently generating a broken configuration.
if ! is_positive_int "$world_size"; then
  echo "error: --world_size must be a positive integer, got: $world_size" >&2
  exit 1
fi

echo "平台入参: model_name: $model_name, model_weight_path: $model_weight_path , world_size: $world_size , npu_mem_size: $npu_mem_size"
38+
39+
40+
# Build the comma-separated device id list "0,1,...,world_size-1" in npuids.
npuids=""
# Highest device index; the loop below is skipped entirely when it is negative.
card_num=$(($world_size - 1))
for ((idx = 0; idx <= card_num; idx++)); do
  # Emit a separating comma only once the list already holds an id, so the
  # result never carries a leading or trailing comma.
  npuids+="${npuids:+,}${idx}"
done

echo "$npuids"
54+
55+
56+
# Destination of the generated service configuration. The original
# development path stays the default; export DEPLOYMENT_CONF_PATH before
# running the script to write somewhere else.
DEPLOYMENT_CONF_PATH="${DEPLOYMENT_CONF_PATH:-/home/guodong.li/workspace/config.json}"

# DEPLOYMENT_CONF_PATH="/usr/local/Ascend/mindie/latest/mindie-service/conf/config.json"

#######################################
# Escape a string so it can be placed between double quotes in JSON.
# Handles backslash, double quote, newline, tab and carriage return.
# Arguments:
#   $1 - raw string
# Outputs:
#   The escaped string on stdout (no trailing newline).
#######################################
json_escape() {
  local s=$1
  # Backslashes must be doubled first so later escapes are not re-escaped.
  s=${s//\\/\\\\}
  s=${s//\"/\\\"}
  s=${s//$'\n'/\\n}
  s=${s//$'\t'/\\t}
  s=${s//$'\r'/\\r}
  printf '%s' "$s"
}

# Free-form string parameters are escaped before being embedded in the JSON;
# npuids, world_size and npu_mem_size are inserted as bare JSON numbers.
model_name_json=$(json_escape "$model_name")
model_weight_path_json=$(json_escape "$model_weight_path")

cat <<EOF > "$DEPLOYMENT_CONF_PATH"
{
    "OtherParam":
    {
        "ResourceParam" :
        {
            "cacheBlockSize" : 128,
            "preAllocBlocks" : 4
        },
        "LogParam" :
        {
            "logLevel" : "Info",
            "logPath" : "/logs/mindservice.log"
        },
        "ServeParam" :
        {
            "ipAddress" : "0.0.0.0",
            "port" : 1025,
            "maxLinkNum" : 300,
            "httpsEnabled" : false,
            "tlsCaPath" : "security/ca/",
            "tlsCaFile" : ["ca.pem"],
            "tlsCert" : "security/certs/server.pem",
            "tlsPk" : "security/keys/server.key.pem",
            "tlsPkPwd" : "security/pass/mindie_server_key_pwd.txt",
            "kmcKsfMaster" : "tools/pmt/master/ksfa",
            "kmcKsfStandby" : "tools/pmt/standby/ksfb",
            "tlsCrl" : "security/certs/server_crl.pem"
        }
    },
    "WorkFlowParam":
    {
        "TemplateParam" :
        {
            "templateType": "Standard",
            "templateName" : "Standard_llama",
            "pipelineNumber" : 1
        }
    },
    "ModelDeployParam":
    {
        "maxSeqLen" : 2560,
        "npuDeviceIds" : [[$npuids]],
        "ModelParam" : [
            {
                "modelInstanceType": "Standard",
                "modelName" : "$model_name_json",
                "modelWeightPath" : "$model_weight_path_json",
                "worldSize" : $world_size,
                "cpuMemSize" : 5,
                "npuMemSize" : $npu_mem_size,
                "backendType": "atb"
            }
        ]
    },
    "ScheduleParam":
    {
        "maxPrefillBatchSize" : 50,
        "maxPrefillTokens" : 8192,
        "prefillTimeMsPerReq" : 150,
        "prefillPolicyType" : 0,
        "decodeTimeMsPerReq" : 50,
        "decodePolicyType" : 0,
        "maxBatchSize" : 200,
        "maxIterTimes" : 512,
        "maxPreemptCount" : 200,
        "supportSelectBatch" : false,
        "maxQueueDelayMicroseconds" : 5000
    }
}
EOF

# Show where the configuration was written and dump it for the operator.
echo "部署参数,$DEPLOYMENT_CONF_PATH"
cat "$DEPLOYMENT_CONF_PATH"
134+
135+
# source /usr/local/Ascend/ascend-toolkit/set_env.sh
136+
# source /usr/local/Ascend/mindie/set_env.sh
137+
# source /usr/local/Ascend/llm_model/set_env.sh
138+
139+
# export PYTHONPATH=/usr/local/Ascend/llm_model:$PYTHONPATH
140+
# cd /usr/local/Ascend/mindie/latest/mindie-service/bin
141+
142+
# ./mindieservice_daemon

0 commit comments

Comments
 (0)