forked from google-research/bert
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Data_419_cscd_all_ernie.sh
124 lines (122 loc) · 8.04 KB
/
Data_419_cscd_all_ernie.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
#!/usr/bin/env bash
#
# Build pre-training TFRecord files from the CSCD raw-text shards.
# (Original author's note, translated: "CSCD medical-domain data,
# max_seq 128, wwm".)
#
# For every shard NAME in SHARDS, create_ernie_pretraining_data.py is run
# once, in the listed order, with:
#   --vocab_file      ${VOCAB_FILE}
#   --input_file      ${RAW_DIR}/NAME.txt
#   --output_file     ${OUT_DIR}/pre_training_NAME_cscd_128_wwm_cmesh.tfrecord
#   --max_seq_length  ${MAX_SEQ_LENGTH}
#
# Usage:
#   Run from the directory that contains create_ernie_pretraining_data.py;
#   the Python script is invoked by relative path.
#
# Exit status:
#   0 if every shard was processed successfully, 1 if at least one shard
#   failed. A failing shard does NOT stop the remaining shards from being
#   attempted; each failure is reported on stderr.

# Catch typos in variable names instead of silently expanding to "".
set -u

readonly VOCAB_FILE=/public/home/zzx6320/lh/Projects/bert/models/chinese_L-12_H-768_A-12/vocab.txt
readonly RAW_DIR=/work1/zzx6320/lh/Projects/Data/Pretraining_Raw
readonly OUT_DIR=/work1/zzx6320/lh/Projects/bert/data/cscd_all_wwm
readonly MAX_SEQ_LENGTH=128

# Shard names; each corresponds to one raw text file ${RAW_DIR}/<name>.txt.
# NOTE(review): the names look like library-classification category codes;
# confirm against the data source before adding or removing entries.
readonly -a SHARDS=(
  O P Q R S U V X
  TB TD TE TF TG TH TJ TK TL TM TN TP TQ TS TU TV
)

failures=0
failed_shards=""

for shard in "${SHARDS[@]}"; do
  if ! python create_ernie_pretraining_data.py \
    --vocab_file "${VOCAB_FILE}" \
    --output_file "${OUT_DIR}/pre_training_${shard}_cscd_${MAX_SEQ_LENGTH}_wwm_cmesh.tfrecord" \
    --input_file "${RAW_DIR}/${shard}.txt" \
    --max_seq_length "${MAX_SEQ_LENGTH}"; then
    # Keep going so one bad shard does not block the rest, but remember it
    # so the overall exit status reflects the failure.
    printf 'error: create_ernie_pretraining_data.py failed for shard %s\n' \
      "${shard}" >&2
    failures=$((failures + 1))
    failed_shards="${failed_shards} ${shard}"
  fi
done

if ((failures > 0)); then
  printf 'error: %d of %d shards failed:%s\n' \
    "${failures}" "${#SHARDS[@]}" "${failed_shards}" >&2
  exit 1
fi