# preprocess_data.sh
#
# Invokes preprocess.py on the train/dev/test .tsv files: once with no
# control token, then once per control token in gold mode, and once per
# control token in pred mode (dev and test only).
# No control token: invoke preprocess.py once per split with
# --control_token none. Input is <split>.tsv; the output path is the same
# path without the .tsv extension.
for split in train dev test; do
  split_prefix="/home/ba63/codafication/data/${split}/${split}"
  python preprocess.py \
    --input_file "${split_prefix}.tsv" \
    --control_token none \
    --output_file "${split_prefix}"
done
# Gold control tokens: for every split, invoke preprocess.py once per
# control token with --mode gold. Each run writes to
# <split>_<token>_gold next to the input .tsv file.
for split in train dev test; do
  split_dir="/home/ba63/codafication/data/${split}"
  for token in msa_phrase da_phrase city digit; do
    python preprocess.py \
      --input_file "${split_dir}/${split}.tsv" \
      --control_token "${token}" \
      --mode gold \
      --output_file "${split_dir}/${split}_${token}_gold"
  done
done
# Pred control tokens: for the dev and test splits (train is not part of
# this loop), invoke preprocess.py once per control token with --mode pred.
# Each run writes to <split>_<token>_pred next to the input .tsv file.
for split in dev test; do
  split_dir="/home/ba63/codafication/data/${split}"
  for token in msa_phrase da_phrase city digit; do
    # The last argument must NOT end with a line-continuation backslash:
    # that would join the following `done` onto the python command line
    # and leave the outer loop unterminated (a syntax error).
    python preprocess.py \
      --input_file "${split_dir}/${split}.tsv" \
      --control_token "${token}" \
      --mode pred \
      --output_file "${split_dir}/${split}_${token}_pred"
  done
done