Skip to content

Commit 56a8a89

Browse files
committed
Update Adapt Models
1 parent 9f0f495 commit 56a8a89

File tree

3 files changed

+76
-1
lines changed

3 files changed

+76
-1
lines changed

scripts/openNMT-py/Adapt.sh

+69
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,69 @@
#!/bin/bash
#
# Adapt an existing OpenNMT-py model to a single training corpus.
#
# Usage: Adapt.sh <input> <name> <corpus> [size]
#   input   directory under /data/ containing train/ and valid/
#   name    model name; reads /model/<name>/model.pt and
#           /model/<name>/train.dict, writes
#           /model/<name>/model.adapt.<corpus>.pt
#   corpus  basename of /data/<input>/train/<corpus>.s and .t
#   size    value passed as -rnn_size and -word_vec_size (default: 512)
#
# Scratch files are kept in /tmp/<name>/ and removed when the script exits.

set -euo pipefail

die() {
  printf '%s\n' "$*" >&2
  exit 1
}

if (( $# < 3 )); then
  printf 'Usage: %s <input> <name> <corpus> [size]\n' "${0##*/}" >&2
  exit 2
fi

input=$1
name=$2
corpus=$3
size=${4:-512}

# An empty name would turn the scratch directory into /tmp/ itself, which the
# cleanup below would then delete wholesale.
[[ -n "$input" && -n "$name" && -n "$corpus" ]] \
  || die "input, name and corpus must be non-empty"

readonly data_dir="/data/${input}"
readonly work_dir="/tmp/${name}"
readonly model_dir="/model/${name}"

mkdir -p -- "$work_dir" "$model_dir"

cleanup() {
  rm -rf -- "${work_dir:?}"
}
trap cleanup EXIT

# Concatenate all validation files per side (s = source, t = target) into one
# file each. The output is truncated first, without seeding it with a blank
# line, so no empty sentence pair is added to the validation set.
for lang in s t; do
  parts=("${data_dir}/valid/"*."${lang}")
  [[ -e "${parts[0]}" ]] \
    || die "no validation files match ${data_dir}/valid/*.${lang}"
  cat -- "${parts[@]}" > "${work_dir}/valid.${lang}"
done

python /opt/OpenNMT-py/preprocess.py \
  -train_src "${data_dir}/train/${corpus}.s" \
  -train_tgt "${data_dir}/train/${corpus}.t" \
  -valid_src "${work_dir}/valid.s" \
  -valid_tgt "${work_dir}/valid.t" \
  -save_data "${work_dir}/train.${corpus}" \
  -vocab "${model_dir}/train.dict" \
  -src_langs s \
  -tgt_langs t

python -u /opt/OpenNMT-py/train.py \
  -data "${work_dir}/train.${corpus}.train.pt" \
  -save_model "${work_dir}/adapt.${corpus}.model" \
  -brnn \
  -rnn_size "$size" \
  -word_vec_size "$size" \
  -batch_size 128 \
  -max_generator_batches 16 \
  -optim adam \
  -dropout 0.2 \
  -epochs 5 \
  -learning_rate 0.000125 \
  -train_from_state_dict "${model_dir}/model.pt" \
  -gpus 0

# Checkpoint names are expected to look like
#   adapt.<corpus>.model_ppl_<ppl>_e<N>.pt
# (as implied by the glob and the suffix pattern below); keep the one with the
# numerically smallest <ppl>.
checkpoints=("${work_dir}/adapt.${corpus}.model_ppl_"*.pt)
[[ -e "${checkpoints[0]}" ]] \
  || die "training produced no checkpoint in ${work_dir}"

best=$(
  printf '%s\n' "${checkpoints[@]}" \
    | awk '
        {
          ppl = $0
          sub(/^.*model_ppl_/, "", ppl)
          sub(/_e[0-9]+\.pt$/, "", ppl)
          if (NR == 1 || ppl + 0 < min + 0) { min = ppl; best = $0 }
        }
        END { print best }
      '
)
[[ -n "$best" ]] || die "could not determine the best checkpoint"

printf '%s\n' "$best"
cp -- "$best" "${model_dir}/model.adapt.${corpus}.pt"

scripts/openNMT-py/Train.sh

+4
Original file line numberDiff line numberDiff line change
@@ -51,6 +51,8 @@ python -u /opt/OpenNMT-py/train.py -data /tmp/${name}/train.train.pt \
5151
-learning_rate 0.001 \
5252
-gpus 0
5353

54+
echo -n "" > /tmp/${name}/list
55+
5456
for f in /tmp/${name}/model_ppl_*.pt
5557
do
5658
echo $f >> /tmp/${name}/list ;
@@ -74,6 +76,8 @@ python -u /opt/OpenNMT-py/train.py -data /tmp/${name}/train.train.pt \
7476
-gpus 0
7577

7678

79+
echo -n "" > /tmp/${name}/list.cont
80+
7781
for f in /tmp/${name}/cont.model_ppl_*.pt
7882
do
7983
echo $f >> /tmp/${name}/list.cont ;

systems/midSize/Train.sh

+3-1
Original file line numberDiff line numberDiff line change
@@ -11,10 +11,12 @@
1111

1212
#Train NMT
1313
/opt/SLT.KIT/scripts/openNMT-py/Train.sh prepro mt 1024
14+
/opt/SLT.KIT/scripts/openNMT-py/Adapt.sh prepro mt TED 1024
1415

1516

1617
#Preprocess for Punctuation
1718
/opt/SLT.KIT/scripts/monoTranslationData/Train.sh prepro monoTransPrepro
1819

1920
#monoTranslationSystem
20-
/opt/SLT.KIT/scripts/openNMT-py/Train.sh monoTransPrepro monTrans
21+
/opt/SLT.KIT/scripts/openNMT-py/Train.sh monoTransPrepro monTrans 1024
22+
/opt/SLT.KIT/scripts/openNMT-py/Adapt.sh monoTransPrepro monTrans TED 1024

0 commit comments

Comments
 (0)