# ===================== Model =====================
model: snn_ocr_optimized
norm: gn
gn_max_groups: 32
gn_nocast: true

height_pool_mode: attn_gate
height_pool_mix: 0.75

dual_res_down_mode: mix
dual_res_down_mix_init: 0.8

use_mem_residual: true
mem_residual_init: 0.0

use_abs_pos: true
use_conv_pos: true
conv_pos_k: 7
pos_allow_interp: true

temporal_max_T: 4
temporal_fp32_reduce: true
use_checkpoint: false

time_step: 2
layer: 7
dim: 768
mlp_ratio: 4.0
seq_block_layout: auto
ssm_kernel: 31
ssm_expand_ratio: 2.0

temporal_fuse: gate
temporal_gate: scalar
temporal_eps: 1.0e-6
temporal_fuse_pre: gate
temporal_fuse_final: wg

use_aux_ctc: true
aux_ctc_weight: 0.2
aux_temporal_fuse: gate

consistency_kl_weight: 0.05
consistency_kl_temp: 1.0
consistency_kl_symmetric: true

use_temporal_coding: true
use_xaxis_rectifier: true
use_dual_res_fusion: true
use_token_merge: true

token_min_keep_ratio: 0.7
token_blank_thresh: 0.88
token_merge_k: 3
xrect_max_disp: 0.12

# ===================== Dataset (READ2016) =====================
dataset: read2016
data_path: /workspace/data/OCR/READ2016

train_split: train
val_split: valid
test_split: test

img_height: 64
img_max_width: 512
crop_pad: 2
allow_empty: false
cache_size: 8

# Text normalization
text_norm: true
text_norm_form: NFKC
text_collapse_ws: true
text_drop_chars: ""
max_label_len: 0
oov: error
add_unk: false
charset_from: trainval

# Image normalize / width estimation
normalize: half
estimate_valid_w: true
bg_thresh: 250

# ===================== Augmentation =====================
aug_affine_p: 0.15
aug_degrees: 2.5
aug_translate: 0.015
aug_shear: 2.5

aug_stroke_p: 0.25
aug_stroke_kmin: 3
aug_stroke_kmax: 5

aug_sharpen_p: 0.10
aug_invert_p: 0.0

aug_noise_p: 0.20
aug_noise_std: 0.03

aug_wstretch_p: 0.30
aug_wstretch_min: 0.7
aug_wstretch_max: 1.3

# ===================== Train =====================
initial_checkpoint: ""
resume: ""
no_resume_opt: false

batch_size: 4
val_batch_size: 4
workers: 4

opt: adamw
weight_decay: 0.05
momentum: 0.9
opt_eps: null
opt_betas: null

clip_grad: 1.0
clip_mode: norm

sched: cosine
sched_on_updates: null
lr: 3.0e-4
warmup_lr: 1.0e-5
min_lr: 1.0e-6
epochs: 210
warmup_epochs: 5
cooldown_epochs: 10
decay_epochs: 30
decay_rate: 0.1

drop: 0.1
drop_path: 0.2
seq_nhead: 12
seq_layers: 6
max_seq_len: 512

accum_steps: 1

amp: false
apex_amp: false
native_amp: true
amp_dtype: fp16

channels_last: false
pin_mem: true
no_prefetcher: false
tf32: true
matmul_precision: high

seed: 340
log_interval: 50
checkpoint_hist: 1

output: ./output/read_snn_ocr
experiment: read_spike_htr
eval_metric: cer
save_images: false
log_wandb: false

model_ema: true
model_ema_force_cpu: false
model_ema_decay: 0.9998

find_unused_parameters: false
dist_bn: ""

# ===================== CTC safety =====================
force_no_store_v: false
strict_ctc_lengths: true
ctc_len_violation: clamp
dump_on_ctc_violation: false
logit_clip: 0.0
