# --- Run control -----------------------------------------------------------
# Runner implementation, presumably resolved by name by the consuming
# framework — verify against its runner registry.
runner: "mt_episode"
# Upper bound on the run length. NOTE(review): the unit (environment steps
# vs. learner updates) is not visible in this file — confirm.
t_max: 30000

# Periodic intervals; all of them currently share the value 500.
test_interval: 500
log_interval: 500
learner_log_interval: 500

# Checkpointing is switched off. save_model_interval presumably only takes
# effect when save_model is True — verify against the training loop.
save_model: False
save_model_interval: 500
# --- Action selection ------------------------------------------------------
action_selector: "epsilon_greedy"
# Epsilon bounds and annealing horizon for the selector above.
# NOTE(review): epsilon_anneal_time (50000) is larger than t_max (30000)
# in this file; if both are measured in the same unit, epsilon never reaches
# epsilon_finish during a run — confirm this is intended.
epsilon_start: 1.0
epsilon_finish: 0.05
epsilon_anneal_time: 50000
# --- Learner ---------------------------------------------------------------
learner: "bikt_learner"
agent_output_type: "q"
double_q: True
# NOTE(review): unit of target_update_interval (episodes vs. steps) is not
# visible here — confirm against the learner.
target_update_interval: 80

# --- Mixer -----------------------------------------------------------------
mixer: "mt_qattn"
mixing_embed_dim: 32
# Hypernetwork sizing; presumably consumed by the mixer selected above —
# verify.
hypernet_layers: 2
hypernet_embed: 64
# --- Algorithm identity ----------------------------------------------------
name: "bikt"
agent: "mt_bikt"
mac: "mt_bikt_mac"

# --- Network sizing --------------------------------------------------------
entity_embed_dim: 64
attn_embed_dim: 8
# NOTE(review): head/depth look like attention head count and layer depth,
# but that cannot be confirmed from this file alone.
head: 1
depth: 1
id_length: 4
max_agent: 15

# --- Loss coefficients and schedule ----------------------------------------
# Meanings are defined by the learner; only the values are visible here.
c_step: 1
beta: 0.001
coef_conservative: 5.0
coef_dist: 5.0
pretrain_steps: 15000

# --- Mode switches (all off) -----------------------------------------------
debug: False
pretrain_vae: False
pretrain: False
# Folder name used when saving data for the VAE stage (going by the key
# name — verify against the code that reads it).
offline_data_folder_4_save_vae: "dataset_skill"

# --- DT training -----------------------------------------------------------
# NOTE(review): "DT" together with dt_agent "gpt" suggests a
# Decision-Transformer-style model, but that is an inference from the key
# names — confirm.
train_DT: False
dt_agent: "gpt"
model_type: "rtgs_state_action"

# Optimisation
optim_type: "adam"
dt_lr: 0.0002
mini_batch_size: 16
grad_norm_clip: 0.5

# Model sizing
n_layer: 2
n_embd: 64
n_head: 2
block_size: 1
step_block_size: 10
action_dim: 10

# Dropout probabilities, both set to 0.
attn_pdrop: 0
resid_pdrop: 0

# Skill selection switches (both off).
skill_softmax: False
skill_max: False
# --- Evaluation and runner logging -----------------------------------------
test_greedy: True
test_nepisode: 32
# log_interval is intentionally NOT repeated here: it is already defined
# near the top of this file with the same value (500). Duplicate mapping keys
# are invalid YAML and are only tolerated by loaders that silently keep the
# last occurrence.
runner_log_interval: 500
# --- Offline dataset -------------------------------------------------------
# This key used to be defined twice in this stanza ("dataset", then
# "dataset_skill"). Duplicate keys are invalid YAML; loaders that tolerate
# them keep the last occurrence, so "dataset_skill" is the value that was
# actually in effect and is the one kept here.
# NOTE(review): if "dataset" was the intended folder, change it here.
offline_data_folder: "dataset_skill"
offline_data_name: ""
offline_data_quality: "expert"
offline_data_size: 2000
offline_data_shuffle: False

# --- Dataset collection / generation ---------------------------------------
num_episodes_collected: 2000
obs_last_skill: True
gen_dataset_ac_ad: False
offline_data_ac_ad_folder: "dataset_ac_ad"
# --- VQ-VAE ----------------------------------------------------------------
vqvae_agent: "vqvae_agent"
pretrain_vqvae: False
vqvae_lr: 0.0005
vqvae_beta: 1.0
codebook_alpha: 0.01
# NOTE(review): vqvae_K / vqvae_D presumably are the codebook size and the
# code dimension, and z_e_dim the encoder output width — confirm against
# the agent.
vqvae_K: 16
vqvae_D: 64
z_e_dim: 64

# --- Dataset export and follow-up training ---------------------------------
save_dataset_interval: 300
offline_data_folder4_gl_skill: "dataset_skill_w_vqvae"
train_DT_w_glsk: False
train_steps_per_batch: 1




