-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathalign.sh
31 lines (25 loc) · 826 Bytes
/
align.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
#!/usr/bin/env bash
#
# align.sh - build forward/backward word alignments for the training and
# validation splits.
#
# Usage: bash align.sh
#   Run from the directory that contains config.sh and scripts/.
#
# Required variables (expected to be set by ./config.sh):
#   DATA        directory holding the data files
#   TRAIN_PREF  file-name prefix of the training split
#   VALID_PREF  file-name prefix of the validation split
#
# Optional environment overrides:
#   FAST_ALIGN_DIR    directory passed as --fast_align_dir
#   MOSESDECODER_DIR  directory passed as --mosesdecoder_dir
#
# For each split, scripts/build_sym_alignment.py is run on <prefix>.src and
# <prefix>.tgt; the align.forward / align.backward files found in the scratch
# directory afterwards are copied to <prefix>.forward / <prefix>.backward.

die() {
  printf 'align.sh: %s\n' "$*" >&2
  exit 1
}

[[ -r ./config.sh ]] || die "cannot read ./config.sh (run from the project directory)"
# shellcheck source=/dev/null
source ./config.sh

# Strict mode is switched on only after sourcing, so config.sh itself is
# evaluated exactly as before.
set -euo pipefail

: "${DATA:?DATA must be set (normally by config.sh)}"
: "${TRAIN_PREF:?TRAIN_PREF must be set (normally by config.sh)}"
: "${VALID_PREF:?VALID_PREF must be set (normally by config.sh)}"

readonly work_dir='data_align'
readonly trainpref="${DATA}/${TRAIN_PREF}"
readonly validpref="${DATA}/${VALID_PREF}"
readonly fast_align_dir="${FAST_ALIGN_DIR:-/lab/ogawa/tools/fast_align/build/}"
readonly mosesdecoder_dir="${MOSESDECODER_DIR:-/lab/ogawa/tools/mosesdecoder/}"

#######################################
# Align one data split and store the results next to its inputs.
# Globals:   fast_align_dir, mosesdecoder_dir, work_dir (read)
# Arguments: $1 - path prefix of the split; $1.src and $1.tgt must exist
# Outputs:   writes $1.forward and $1.backward
# Returns:   does not return on failure; the script exits non-zero
#######################################
align_split() {
  local prefix=$1
  local ext

  for ext in src tgt; do
    [[ -r "${prefix}.${ext}" ]] || die "missing input file: ${prefix}.${ext}"
  done

  # The scratch directory is shared between splits: remove the previous
  # split's results so they can never be copied as if they were fresh.
  rm -f -- "${work_dir}/align.forward" "${work_dir}/align.backward"

  python scripts/build_sym_alignment.py \
    --fast_align_dir "$fast_align_dir" \
    --mosesdecoder_dir "$mosesdecoder_dir" \
    --source_file "${prefix}.src" \
    --target_file "${prefix}.tgt" \
    --output_dir "$work_dir"

  cp -- "${work_dir}/align.forward" "${prefix}.forward"
  cp -- "${work_dir}/align.backward" "${prefix}.backward"
}

# Remove the scratch directory on every exit path, including failures.
trap 'rm -rf -- "${work_dir:?}"' EXIT
mkdir -p -- "$work_dir"

# train
align_split "$trainpref"
# valid
align_split "$validpref"