{
  "train_datasets": {
    "1438": "data/train-1438.json",
    "500": "data/train-500.json"
  },
  "val_dataset": "data/val.json",
  "test_dataset": "data/test.json",
  "training_sets": [
    {
      "structures": 100,
      "rules": 1438
    },
    {
      "structures": 1000,
      "rules": 1438
    },
    {
      "structures": 10000,
      "rules": 1438
    },
    {
      "structures": 100,
      "rules": 500
    },
    {
      "structures": 1000,
      "rules": 500
    },
    {
      "structures": 10000,
      "rules": 500
    }
  ],
  "model_args": {
    "empiricist_rules": {
      "structure_length": 6,
      "ninp": 256,
      "nhid": 256,
      "nhead": 8,
      "nlayers": 4,
      "dropout": 0.1,
      "learning_rate": 3e-4
    },
    "empiricist_labels": {
      "structure_length": 6,
      "ninp": 256,
      "nhid": 256,
      "nhead": 8,
      "nlayers": 4,
      "dropout": 0.1,
      "learning_rate": 3e-4
    },
    "empiricist_conscious": {
      "structure_length": 6,
      "ninp": 256,
      "nhid": 256,
      "nhead": 8,
      "nlayers": 4,
      "dropout": 0.1,
      "learning_rate": 3e-4,
      "rule_reg_coeff": 100
    },
    "interpreter": {
      "ninp": 128,
      "nhid": 128,
      "nhead": 8,
      "nlayers": 4,
      "dropout": 0.1,
      "learning_rate": 3e-4
    }
  },
  "num_beams": 300
}