{
    "s2p_encoder": {
        "type": "ConformerNet",
        "kwargs": {
            "num_cells": 14,
            "idim": 80,
            "hdim": 512,
            "conv": "vgg2l",
            "num_heads": 4,
            "kernel_size": 15,
            "n_classes": 37
        }
    },
    "beamDecoder": {
        "type": "CTCBeamDecoder",
        "n_classes": 37,
        "beam_width": 16,
        "log_probs_input": true,
        "num_processes": 2
    },
    "sampler": {
        "n_samples": 10,
        "cache_enabled": true,
        "add_supervised": false
    },
    "p2g_encoder": {
        "type": "TransformerDecoder",
        "kwargs": {
            "num_layers": 8,
            "num_emb": 37,
            "hdim": 512,
            "num_heads": 4,
            "intermediate_size": 1024,
            "max_position_embeddings": 512,
            "num_classes": 500,
            "with_head": true
        }
    },
    "g2p_encoder": {
        "type": "TransformerDecoder",
        "kwargs": {
            "num_layers": 8,
            "num_emb": 37,
            "hdim": 512,
            "num_heads": 4,
            "intermediate_size": 1024,
            "n_classes": 37,
            "with_head": true
        }
    },
    "scheduler": {
        "type": "SchedulerEarlyStop",
        "kwargs": {
            "min_step": 20000,
            "n_tol": 10,
            "gamma": 0.5,
            "stop_lr": 1e-06
        },
        "optimizer": {
            "type": "Adam",
            "kwargs": {
                "lr": 3e-05,
                "betas": [
                    0.9,
                    0.98
                ],
                "weight_decay": 1e-06
            }
        }
    }
}