"""
KSKT Model Configuration File
"""
model:
  name: "KSKT"
  base_model: "Qwen3-4B-Thinking-2507"
  vocab_size: 152064
  hidden_size: 3584
  intermediate_size: 18944
  num_hidden_layers: 32
  num_attention_heads: 28
  max_position_embeddings: 32768
  rms_norm_eps: 1e-6

kskt_specific:
  dual_stream_attention:
    enabled: true
    fusion_init_method: "xavier_uniform"
    attention_bias_init_std: 0.02
  
  bipolar_reasoning:
    enabled: true
    num_thinking_layers: 2
    gate_hidden_size: 3584
  
  mutual_understanding_pe:
    enabled: true
    temperature: 0.5
  
  self_awareness_moe:
    enabled: true
    num_experts: 4  # P, K, E, C
    expert_names: ["personality", "knowledge", "emotional", "capability"]
    load_balance_weight: 0.01
    temperature_init: 1.0

training:
  # Phase 1: Self-understanding
  phase1:
    name: "self_understanding"
    epochs: 2
    learning_rate: 2e-5
    lambda_consistency: 0.2
    lambda_understanding: 0.0
    lambda_balance: 0.01
  
  # Phase 2: Other-understanding  
  phase2:
    name: "other_understanding"
    epochs: 1
    learning_rate: 1e-5
    lambda_consistency: 0.1
    lambda_understanding: 0.3
    lambda_balance: 0.01
  
  # Phase 3: Mutual understanding
  phase3:
    name: "mutual_understanding"  
    epochs: 1
    learning_rate: 5e-6
    lambda_consistency: 0.1
    lambda_understanding: 0.2
    lambda_balance: 0.01

  # General settings
  batch_size: 8
  gradient_accumulation_steps: 4
  max_grad_norm: 1.0
  weight_decay: 0.01
  warmup_steps: 500
  max_sequence_length: 2048
  save_steps: 1000
  logging_steps: 100
  evaluation_steps: 500

data:
  train_data_paths:
    - "data/character_profiles.json"
    - "data/instruction_following.json" 
    - "data/role_conversations.json"
  
  val_data_paths:
    - "data/character_bench_dev.json"
    - "data/conflict_scenarios_dev.json"
  
  test_data_paths:
    - "data/character_bench_test.json"
    - "data/conflict_scenarios_test.json"

evaluation:
  character_bench:
    enabled: true
    metrics: ["Memory", "Knowledge_FA", "Knowledge_BC_K", "Persona_AC_b", 
              "Persona_AC_h", "Persona_BC_b_P", "Persona_BC_h_P", 
              "Emotion_ES", "Emotion_ER", "Morality_MS", "Morality_MR", 
              "Believability_HL", "Believability_EG"]
  
  dual_perspective:
    enabled: true
    conflict_scenarios: ["knowledge_boundary", "value_system_conflict", 
                        "emotional_support", "expertise_boundary"]

