{"step-count": "-1", "teacher-path": "./results/checkpoints/WMT16enro_distill_CMLM_benchmark/imputer_best.pt", "embed-loss-factor": "0.0", "lr": "1e-3", "max-tokens": "2048", "max-tokens-valid": "4096", "dataset": "/storage/sajad/data-bin/wmt16_enro_distill", "source-lang": "en", "target-lang": "ro", "distill-loss-factor": "1", "noise": "random_mask", "teacher-iterative-steps": "2", "ctc-distill": true, "criterion": "ctc", "mask-policy": "block", "teacher-random-unmask": false, "distill-on-valid": false, "patience": 10, "valid-per-epoch": "5", "label-smoothing": "0.0", "teacher-temp": "1", "valid-subset": "test", "align-noise": true, "unsupervised": false, "teacher-ema": false, "teacher-ema-decay": "0.9992"}
