---
# Task name; the same string is used as the key of the `JointTrainAgent`
# settings section in this file.
Task: 'JointTrainAgent'

# Run-wide settings.
BasicSettings:
  Seed: 0
  ImageSize: 64
  # Canonical lowercase boolean; resolves to the same value under both
  # YAML 1.1 and YAML 1.2 loaders.
  ReplayBufferOnGPU: true

# Settings section whose key matches the value of the top-level `Task` key.
JointTrainAgent:
  SampleMaxSteps: 102000
  BufferMaxLength: 100000
  BufferWarmUp: 1024
  WarmupSteps: 5000
  NumEnvs: 1
  BatchSize: 16
  DemonstrationBatchSize: 4
  BatchLength: 64
  ImagineBatchSize: 512
  ImagineDemonstrationBatchSize: 256
  ImagineContextLength: 16
  ImagineBatchLength: 16
  TrainDynamicsEverySteps: 1
  TrainAgentEverySteps: 1
  # NOTE(review): demonstrations are switched off here, so
  # DemonstrationBatchSize and ImagineDemonstrationBatchSize are presumably
  # unused in this configuration - confirm against the training code.
  UseDemonstration: false
  SaveEverySteps: 5000

# Hyperparameters grouped per model: `WorldModel` and `Agent`.
Models:
  WorldModel:
    # NOTE(review): the snake_case keys in this section (if_harmony,
    # n_experts, n_clusters, n_activate_experts) differ from the PascalCase
    # used by every other key in the file. They are kept unchanged because
    # the consumer presumably looks them up by these exact names.
    if_harmony: true
    InChannels: 3
    StochDim: 32
    # Same value as JointTrainAgent.BatchLength (64).
    TransformerMaxLength: 64
    TransformerHiddenDim: 512
    TransformerNumLayers: 2
    ExpertNumLayers: 2
    TransformerNumHeads: 8
    TaskDim: 96
    n_experts: 12
    n_clusters: 12
    n_activate_experts: 3

  Agent:
    NumLayers: 3
    HiddenDim: 512
    Gamma: 0.985
    Lambda: 0.95
    # Written with an explicit decimal point: YAML 1.1 loaders such as
    # PyYAML only resolve exponent notation to a float when the mantissa
    # contains a ".", so a bare `3E-4` would load as the string "3E-4".
    EntropyCoef: 3.0e-4