forked from LeoWood/bert
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Sbatch_Data_128_pre_rest.sbatch
33 lines (31 loc) · 1.79 KB
/
Sbatch_Data_128_pre_rest.sbatch
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
#!/bin/bash
#SBATCH -p normal
#SBATCH -N 1
#SBATCH --exclusive
#SBATCH -J data_128
#SBATCH -o data_128_rest.out
#
# Slurm batch job: run create_pretraining_data.py once per raw-text shard
# (TP, TQ, TS, TU, TV) with --max_seq_length 128, writing one .tfrecord
# file per shard.
#
# Every shard is attempted even if an earlier one fails, but the job exits
# non-zero when any shard failed so the scheduler does not record a
# partially failed run as successful.
#
# NOTE(review): create_pretraining_data.py is referenced by relative path,
# so the job presumably has to be submitted from the directory that
# contains it -- confirm.

readonly VOCAB_FILE=/public/home/zzx6320/lh/Projects/bert/models/chinese_L-12_H-768_A-12/chinese_L-12_H-768_A-12/vocab.txt
readonly INPUT_DIR=/work1/zzx6320/lh/Projects/Data/Pretraining_Raw_New
readonly OUTPUT_DIR=/work1/zzx6320/lh/Projects/bert/data/cscd_pre
readonly MAX_SEQ_LENGTH=128
readonly SHARDS=(TP TQ TS TU TV)

# Names of the shards whose conversion returned a non-zero status.
failed=()

for shard in "${SHARDS[@]}"; do
  if ! python create_pretraining_data.py \
    --vocab_file "${VOCAB_FILE}" \
    --output_file "${OUTPUT_DIR}/pre_training_${shard}_${MAX_SEQ_LENGTH}.tfrecord" \
    --input_file "${INPUT_DIR}/${shard}.txt" \
    --max_seq_length "${MAX_SEQ_LENGTH}"; then
    printf 'error: create_pretraining_data.py failed for shard %s\n' "${shard}" >&2
    failed+=("${shard}")
  fi
done

# Surface any failure through the job's exit status instead of letting the
# last command's status decide it alone.
if (( ${#failed[@]} > 0 )); then
  printf 'error: %d shard(s) failed: %s\n' "${#failed[@]}" "${failed[*]}" >&2
  exit 1
fi