mt_train.py
Less than 1 minute
mt_train.py
Train a neural machine translation (NMT) model on a single CPU, or on one or more GPUs.
usage: mt_train.py [-h] [--config CONFIG] [--config2 CONFIG2]
[--config3 CONFIG3] [--ngpu NGPU]
[--train-dtype {float16,float32,float64,O0,O1,O2,O3}]
[--backend {chainer,pytorch}] --outdir OUTDIR
[--debugmode DEBUGMODE] --dict DICT [--seed SEED]
[--debugdir DEBUGDIR] [--resume [RESUME]]
[--minibatches MINIBATCHES] [--verbose VERBOSE]
[--tensorboard-dir [TENSORBOARD_DIR]]
[--report-interval-iters REPORT_INTERVAL_ITERS]
[--save-interval-iters SAVE_INTERVAL_ITERS]
[--train-json TRAIN_JSON] [--valid-json VALID_JSON]
[--model-module MODEL_MODULE] [--lsm-weight LSM_WEIGHT]
[--report-bleu] [--nbest NBEST] [--beam-size BEAM_SIZE]
[--penalty PENALTY] [--maxlenratio MAXLENRATIO]
[--minlenratio MINLENRATIO] [--rnnlm RNNLM]
[--rnnlm-conf RNNLM_CONF] [--lm-weight LM_WEIGHT]
[--sym-space SYM_SPACE] [--sym-blank SYM_BLANK]
[--sortagrad [SORTAGRAD]]
[--batch-count {auto,seq,bin,frame}]
[--batch-size BATCH_SIZE] [--batch-bins BATCH_BINS]
[--batch-frames-in BATCH_FRAMES_IN]
[--batch-frames-out BATCH_FRAMES_OUT]
[--batch-frames-inout BATCH_FRAMES_INOUT] [--maxlen-in ML]
[--maxlen-out ML] [--n-iter-processes N_ITER_PROCESSES]
[--opt {adadelta,adam,noam}] [--accum-grad ACCUM_GRAD]
[--eps EPS] [--eps-decay EPS_DECAY] [--lr LR]
[--lr-decay LR_DECAY] [--weight-decay WEIGHT_DECAY]
[--criterion {loss,acc}] [--threshold THRESHOLD]
[--epochs EPOCHS]
[--early-stop-criterion [EARLY_STOP_CRITERION]]
[--patience [PATIENCE]] [--grad-clip GRAD_CLIP]
[--num-save-attention NUM_SAVE_ATTENTION]
[--context-residual [CONTEXT_RESIDUAL]]
[--tie-src-tgt-embedding [TIE_SRC_TGT_EMBEDDING]]
[--tie-classifier [TIE_CLASSIFIER]] [--enc-init [ENC_INIT]]
[--enc-init-mods ENC_INIT_MODS] [--dec-init [DEC_INIT]]
[--dec-init-mods DEC_INIT_MODS]
[--multilingual MULTILINGUAL] [--replace-sos REPLACE_SOS]