{
	"arch": "cmlmc_transformer",
	"step-count": "-1",
	"teacher-path": "./results/checkpoints/IWSLTdeen_distill_CMLMC_benchmark/IWSLTdeen_distill_CMLMC.pt",
	"dataset": "data-bin/iwslt14_deen_jointdict/",
	"embed-loss-factor": ".2",
	"cross-attn-loss-factor": ".0",
	"self-attn-loss-factor": ".0",
	"orig-loss-factor": ".0",
	"max-tokens": "1024",
	"distill-on-valid": true,
	"insertCausalSelfAttn": true,
	"no-scale-embedding": true,
	"decoder-ffn-embed-dim": 1024,
	"encoder-ffn-embed-dim": 1024,
	"teacher-ema": true,
	"teacher-ema-decay": "0.997",
	"keep-best-checkpoints": "1",
	"layer-prediction-loss-factor": "0.5",
	"concat-prediction": true
}

