{
	"step-count": "-1",
	"arch": "cmlm_transformer",
	"criterion": "ctc",
	"teacher-path": "./results/checkpoints/IWSLTdeen_distill_CMLM_benchmark/checkpoint_best.pt",
	"dataset": "data-bin/iwslt14_deen_jointdict/",
	"embed-loss-factor": ".2",
	"cross-attn-loss-factor": ".0",
	"self-attn-loss-factor": ".0",
	"orig-loss-factor": ".0",
	"max-tokens": "1024",
	"distill-on-valid": true,
	"insertCausalSelfAttn": true,
	"no-scale-embedding": true,
	"decoder-ffn-embed-dim": 1024,
	"encoder-ffn-embed-dim": 1024,
	"teacher-ema": true,
	"teacher-ema-decay": "0.997",
	"keep-best-checkpoints": "1"
}

