# Backend, experiment logging and rendering settings.
dl_toolbox: "torch"
project_name: "XuanCe_Benchmark"
logger: "tensorboard"
# Placeholder value; presumably only consulted when logging to
# Weights & Biases instead of TensorBoard - confirm before relying on it.
wandb_user_name: "your_user_name"
render: false
render_mode: "rgb_array"
fps: 5
test_mode: false
device: "cuda:0"

# Agent, learner, policy and environment identifiers.
# These are lookup names; they have to match what the consuming framework
# registers, so keep the spelling and case exactly as written.
agent: "MAPPO"
learner: "MAPPO_Clip_Learner"
# NOTE(review): `use_global_state` is defined separately further down this
# file with the same value; confirm which of the two keys is actually read.
global_state: true
env_name: "MultiAgentRNAEnv"
env_id: "RNAEnv-v0.1"
vectorize: "SubprocVecMultiAgentEnv_RNA"
policy: "Categorical_MAAC_Policy"
runner: "MARL"

# Actor / critic head settings.
gain: 0.01
# Two hidden layers each (128 then 64 units).
actor_hidden_size: [128, 64]
critic_hidden_size: [128, 64]
activation: "relu"
activation_action: "relu"

# Convolutional representation settings.
use_conv: true
representation: "Basic_CNN"
# The three lists below have one entry per convolution layer and must stay
# the same length as each other.
filters: [32, 64, 64]
kernels: [8, 4, 3]
strides: [4, 2, 1]
# Seeding, rollout sizing and PPO loss hyperparameters.
seed: 100
parallels: 2
# NOTE(review): how `buffer_size` relates to `horizon_size` and `parallels`
# is decided by the consumer and is not visible here - confirm when changing
# any of the three.
buffer_size: 8192
horizon_size: 256
n_epochs: 10
n_minibatch: 16
learning_rate: 0.00001
weight_decay: 0
vf_coef: 0.5
ent_coef: 0.02
target_kl: 0.25
clip_range: 0.2
clip_type: 1
gamma: 0.99

# Optimisation switches, each followed by the value it presumably governs.
# NOTE(review): linear LR decay is disabled, so `end_factor_lr_decay` is
# presumably ignored - confirm against the learner.
use_linear_lr_decay: false
end_factor_lr_decay: 0.5
# NOTE(review): `global_state` is set independently earlier in this file
# with the same value; confirm which key is read and keep them in sync.
use_global_state: true
use_grad_clip: true
grad_clip_norm: 10.0
use_value_clip: true
value_clip_range: 0.2
use_value_norm: true
use_huber_loss: true
huber_delta: 10.0
use_advnorm: true
use_gae: true
gae_lambda: 0.95
# Training / evaluation schedule.
start_training: 1
running_steps: 25000000
training_frequency: 1
test_steps: 1000
eval_interval: 200000
test_episode: 20
# Output locations.
# NOTE(review): `log_dir` is relative to the parent directory ("../") while
# `model_dir` is relative to the current one ("./") - confirm the two
# different bases are intentional.
log_dir: "../logs/mappo/"
model_dir: "./saved_models/mappo/"

# Parameter sharing and RNA task settings.
use_parameter_sharing: false
input_file: true
# NOTE(review): the key is named "*_dir" but the value is a file path.
dot_brackets_dir: "../data/train.txt"
state_radius: 30
state_radius_action: 15
mutation_threshold: 0
reward_exponent: 1.0
use_embedding: true
diversity_loss: false
# NOTE(review): 900 equals state_radius * state_radius (30 * 30); presumably
# the two must change together - confirm.
state_dim: 900
# NOTE(review): YAML has no tuple syntax, so this plain scalar loads as the
# string "(1,)" rather than a tuple. Confirm the consumer converts it (or
# never reads it) before changing the spelling.
rew_shape: (1,)
max_episode_steps: 400
tolerance: 0.0
search_radius: 0

