-
Notifications
You must be signed in to change notification settings - Fork 12
/
Copy pathtrain_crosent.sh
executable file
·58 lines (44 loc) · 1.6 KB
/
train_crosent.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#!/bin/bash
# Usage: <script> <seedval> <optional-gpu-num>
#
# -x traces every command as it runs; -e aborts on the first failing command.
set -x
set -e

# The seed value is mandatory: print the usage line and stop when it is absent.
if [[ $# -lt 1 ]]; then
  # "$0" is quoted so a script path containing whitespace still yields the
  # correct name; the usage line is a diagnostic, so it goes to stderr.
  printf '%s <seedval> <optional-gpu-num>\n' "$(basename -- "$0")" >&2
  exit 1
fi
## setting paths
################
# The first positional argument is the seed; it also names the model directory.
SEED=$1
EXP_NAME=crosent
OUT_DIR="training/${EXP_NAME}"
MODEL_DIR="${OUT_DIR}/models/model${SEED}/"
# Quoted so that a seed containing whitespace or glob characters cannot be
# split into several mkdir arguments.
mkdir -p "$MODEL_DIR"

FAIRSEQPY=fairseq
# NOTE(review): APPLYBPE and BPE_MODEL are assigned but not read anywhere in
# the visible script -- kept as-is; confirm whether they can be dropped.
APPLYBPE=scripts/apply_bpe.py
BPE_MODEL=models/bpe/mlconvgec_aaai18_bpe.model
DATA_DIR=data/processed
EMBED_PATH=models/embed/model.vec
# Anchored to the directory the script is launched from ($PWD); the other
# paths above are left relative.
DECODER_INIT_PATH="${PWD}/models/decoder/lm.pt"
## training
############
# Under `set -e` alone, a pipeline's exit status is that of its last command
# (tee here), so a failed train.py run would still reach "END TIME" and the
# script would exit 0. pipefail makes the pipeline report train.py's failure,
# which then aborts the script.
set -o pipefail

# GPU selection: the second positional argument when supplied, otherwise 0.
if [[ $# -eq 1 ]]; then
  DEVICE=0
else
  DEVICE=$2
fi

# Every message below is shown on the terminal and appended to this log.
TRAIN_LOG="${MODEL_DIR}/train.log.txt"
echo "MACHINE: $(hostname) | GPU: $DEVICE" | tee -a "$TRAIN_LOG"
echo "START TIME: $(date)" | tee -a "$TRAIN_LOG"

# Run train.py from the fairseq checkout with that checkout prepended to
# PYTHONPATH and only the chosen device exposed through CUDA_VISIBLE_DEVICES.
# The option values are passed through unchanged; only the variable
# expansions are quoted so that paths cannot be word-split.
PYTHONPATH="$FAIRSEQPY:$PYTHONPATH" CUDA_VISIBLE_DEVICES="$DEVICE" \
  python3 -u "$FAIRSEQPY/train.py" \
  --encoder-layers '[(1024,3)] * 7' --decoder-layers '[(1024,3)] * 7' \
  --encoder-embed-dim 500 --decoder-embed-dim 500 --decoder-out-embed-dim 500 \
  --encoder-embed-path "$EMBED_PATH" --decoder-embed-path "$EMBED_PATH" \
  --arch fconv_dualenc_gec_gatedaux --auxencoder-embed-dim 500 \
  --auxencoder-embed-path "$EMBED_PATH" --auxencoder-layers '[(1024,3)] * 3' \
  --task translation_ctx \
  --dropout 0.2 --clip-norm 0.1 --lr 0.25 --min-lr 1e-4 \
  --momentum 0.99 --max-epoch 100 --batch-size 48 --update-freq 2 \
  --no-progress-bar --seed "$SEED" --no-epoch-checkpoints \
  --criterion label_smoothed_cross_entropy --label-smoothing 0.1 \
  --source-token-dropout 0.2 \
  --restore-file "$DECODER_INIT_PATH" \
  --raw-text \
  --save-dir "$MODEL_DIR" "$DATA_DIR" \
  | tee -a "$TRAIN_LOG"

echo "END TIME: $(date)" | tee -a "$TRAIN_LOG"