@@ -7,28 +7,27 @@ mkdir -p $TARGET_DIR
7
7
rsync -ruC --exclude pre_computed --exclude processed_data --exclude *.pyc $SOURCE/ $TARGET_DIR
8
8
9
9
work_dir=$TARGET_DIR/
10
- log_dir=/mount/biglm_data/ELI5/logs/
11
- output_dir=/mount/biglm_data/ELI5/processed_data
10
+ log_dir=/mount/biglm_data/ELI5/logs_docs/
12
11
mkdir -p $log_dir
13
12
14
- export WORLD_SIZE=9
13
+ export WORLD_SIZE=16
15
14
nodes=$(python -c "for i in range(1,$WORLD_SIZE): print(i)")
16
15
node_ids=($(python -c "for i in range(0,$WORLD_SIZE): print(i)"))
17
- years=($(python -c "for i in range(2011,2011+$WORLD_SIZE): print(i)"))
16
+ # years=($(python -c "for i in range(2011,2011+$WORLD_SIZE): print(i)"))
18
17
# master=$(ssh -x -o LogLevel=ERROR worker-1 "echo \$hostname" )
19
18
for i in $nodes ; do
20
19
worker=worker-${node_ids[$i]}
21
20
sy=${years[$i]}
22
- kill -9 $( ps -x | grep " download_reddit_qalist.py " | grep -v grep | awk -F ' ' ' {print $1} ' )
21
+ rank=$i
23
22
ssh -x -o LogLevel=ERROR $worker "mkdir -p $TARGET_DIR"
24
23
rsync -ruC --exclude pre_computed --exclude processed_data -e "ssh -o StrictHostKeyChecking=no -o UserKnownHostsFile=/dev/null -o LogLevel=ERROR" $TARGET_DIR/ $worker:$TARGET_DIR
25
- ssh -x -o LogLevel=ERROR $worker "mkdir -p $log_dir; cd $work_dir; nohup ./download_qa.sh $sy > ${log_dir}/nohup_${i}.std 2> ${log_dir}/nohup_${i}.err &"
24
+ ssh -x -o LogLevel=ERROR $worker "mkdir -p $log_dir; cd $work_dir; nohup ./download_docs.sh $rank > ${log_dir}/nohup_${i}.std 2> ${log_dir}/nohup_${i}.err &"
26
25
done
27
26
28
27
i=0
28
+ rank=$i
29
29
worker=worker-${node_ids[$i]}
30
30
sy=${years[$i]}
31
- kill -9 $( ps -x | grep " download_reddit_qalist.py" | grep -v grep| awk -F' ' ' {print $1}' )
32
31
ssh -x -o LogLevel=ERROR $worker "mkdir -p $TARGET_DIR"
33
32
rsync -ruC --exclude pre_computed --exclude processed_data -e "ssh -o StrictHostKeyChecking=no -o UserKnownHostsFile=/dev/null -o LogLevel=ERROR" $TARGET_DIR/ $worker:$TARGET_DIR
34
- ssh -x -o LogLevel=ERROR $worker "mkdir -p $log_dir; cd $work_dir; ./download_qa.sh $sy"
33
+ ssh -x -o LogLevel=ERROR $worker "mkdir -p $log_dir; cd $work_dir; ./download_docs.sh $rank"
0 commit comments