-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcluster_2x4.sh
48 lines (40 loc) · 1.38 KB
/
cluster_2x4.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
#!/bin/bash
# Configuration for a single-node PaddlePaddle Fluid cluster: parameter
# servers and trainers all run on the loopback address of this machine.
echo "WARNING: This script only for run PaddlePaddle Fluid on one node..."
echo "WARNING: You must to modify train.py manual..."
echo ""

# Append /usr/local/lib to the loader search path. The ${VAR:+...} form avoids
# a leading ':' when LD_LIBRARY_PATH is unset or empty; an empty path entry
# would make the dynamic loader search the current working directory.
export LD_LIBRARY_PATH="${LD_LIBRARY_PATH:+${LD_LIBRARY_PATH}:}/usr/local/lib"

# Parameter-server ports: the single source of truth. The comma-separated
# port list and the server count below are derived from this array so the
# three values cannot drift apart. Bash cannot pass arrays through the
# environment, so this stays a plain shell variable used by this script only.
PADDLE_PSERVER_PORT_ARRAY=(36001 36002)
# Single-pserver alternative:
#PADDLE_PSERVER_PORT_ARRAY=(36001)

# Comma-joined port list, e.g. "36001,36002" (IFS is changed only inside the
# command substitution's subshell).
PADDLE_PSERVER_PORTS=$(IFS=,; printf '%s' "${PADDLE_PSERVER_PORT_ARRAY[*]}")
export PADDLE_PSERVER_PORTS
export PADDLE_PSERVERS=${#PADDLE_PSERVER_PORT_ARRAY[@]}

export PADDLE_IP=127.0.0.1
export PADDLE_TRAINERS=4
export PADDLE_SYNC_MODE="TRUE"
export CPU_NUM=4

# Directory that receives the per-process log files.
export BASE=/accuracy/
# The launch commands below reference train_high_api.py by relative path, so
# they must run from this directory. Abort instead of silently starting every
# process from the wrong working directory when it is missing.
cd /accuracy/text_classification/ || {
  echo "ERROR: cannot cd to /accuracy/text_classification/" >&2
  exit 1
}
# Parameter-server mode (first argument "ps"): start PADDLE_PSERVERS
# background pserver processes, one per configured port. Each process gets
# its port in CUR_PORT and its index in PADDLE_TRAINER_ID, and writes
# stdout+stderr to $BASE/pserver.<index>.log.
if [[ "${1:-}" == "ps" ]]; then
  export PADDLE_TRAINING_ROLE=PSERVER
  export GLOG_v=0
  export GLOG_logtostderr=1

  # The server count and the port array are separate settings; verify they
  # agree before launching anything, so no pserver starts with an empty port.
  if ((PADDLE_PSERVERS > ${#PADDLE_PSERVER_PORT_ARRAY[@]})); then
    echo "ERROR: PADDLE_PSERVERS=${PADDLE_PSERVERS} but only ${#PADDLE_PSERVER_PORT_ARRAY[@]} port(s) configured" >&2
    exit 1
  fi

  for ((i = 0; i < PADDLE_PSERVERS; i++)); do
    cur_port=${PADDLE_PSERVER_PORT_ARRAY[i]}
    echo "PADDLE WILL START PSERVER ${cur_port}"
    # stdbuf -oL line-buffers stdout so the log file is updated line by line.
    CUR_PORT="$cur_port" PADDLE_TRAINER_ID="$i" \
      stdbuf -oL python train_high_api.py \
      --dict_path /root/.cache/paddle/dataset/imdb/imdb.vocab \
      --local 0 &> "${BASE}/pserver.${i}.log" &
  done
fi
# Trainer mode (first argument "tr"): start PADDLE_TRAINERS background
# trainer processes. Each one receives its index in PADDLE_TRAINER_ID and
# sends stdout+stderr to $BASE/trainer.<index>.log.
case "$1" in
  tr)
    export PADDLE_TRAINING_ROLE=TRAINER
    export GLOG_v=0
    export GLOG_logtostderr=1

    # Command line shared by every trainer; only the environment differs.
    trainer_cmd=(
      stdbuf -oL python train_high_api.py
      --dict_path /root/.cache/paddle/dataset/imdb/imdb.vocab
      --local 0
    )

    for ((trainer_id = 0; trainer_id < PADDLE_TRAINERS; trainer_id++)); do
      echo "PADDLE WILL START Trainer ${trainer_id}"
      PADDLE_TRAINER_ID=$trainer_id "${trainer_cmd[@]}" \
        > "${BASE}/trainer.${trainer_id}.log" 2>&1 &
    done
    ;;
esac