# Dataset and data-loading options (interpreted by the consuming code).
dataset: 'bridge'
sequence_interval: 1
val_start_frame_interval: 16
cam_ids: [0]
accumulate_action: false
pre_encode: true
normalize: true
raw_video: false
# NOTE(review): presumably selects the run/split mode; confirm the accepted
# values against the code that reads this key.
mode: 'val'

# Run annotation plus debug/evaluation switches.
anno: 'bridge_frame_ada'
debug: false
do_evaluate: false
final_frame_ada: false
evaluate_checkpoint: false

# Model configuration.
model: 'WM-XL/2'
num_frames: 16
video_size: [256, 320]
learn_sigma: false
# Allowed values are 3 or 5:
#   3 = frame-level condition
#   5 = video-level condition
extras: 3
mask_frame_num: 1

# Training hyperparameters and logging/checkpoint/validation intervals.
#
# The learning rate is written with an explicit decimal point in the mantissa:
# YAML 1.1 loaders (e.g. PyYAML) only resolve exponent notation as a float
# when the mantissa contains a '.', so a bare `1e-4` would load as the string
# '1e-4' instead of the number 0.0001.
learning_rate: 1.0e-4
ckpt_every: 10000
clip_max_norm: 0.1
start_clip_iter: 0
local_batch_size: 1
local_val_batch_size: 1
max_train_steps: 300000
global_seed: 3407
num_workers: 11
log_every: 100
val_every: 10000
gradient_accumulation_steps: 2
attention_mode: 'math'

# NOTE(review): presumably identifies the run/checkpoint to resume from;
# confirm how the consuming code resolves this value.
resume_from_checkpoint: '06/16/bridge_frame_ada'