# Dataset selection. How these values are turned into on-disk paths is decided
# by the loading code, which is not part of this file.
dataset_alias: "FNSPID/ver_gen1"
# Alternative dataset version, currently disabled:
# dataset_version: "ver_turn1_final"
dataset_version: "ver_gen1"
dataset_root: "dataset/FNSPID"

# Data preprocessing / modality control
use_multimodal: true           # text news is enabled by default
use_text_news: true            # explicitly controls whether news text is returned
use_news_embedding: true       # also load embeddings; the model may use them as needed
# use_news_embedding: false
use_llm_hidden: false          # optionally load pre-encoded LLM hidden states
# NOTE(review): the embedding paths below start with "/" and point at
# "ver_camf", while dataset_version in this file is "ver_gen1" — confirm how
# the loader resolves these paths and that the version difference is intended.
# The "::<name>" suffix presumably selects an entry inside the .pt file;
# verify against the loader.
train_news_embed_file: "/ver_camf/embedding_qwen/all_embeddings.pt::train_news"
vali_news_embed_file: "/ver_camf/embedding_qwen/all_embeddings.pt::vali_news"
test_news_embed_file: "/ver_camf/embedding_qwen/all_embeddings.pt::test_news"
# Hidden-state files are unset (null); use_llm_hidden is also false above.
train_news_hidden_file: null
vali_news_hidden_file: null
test_news_hidden_file: null

# Time series parameters
# NOTE(review): seq_len, pred_len and patch_len are all 5 here; whether they
# must stay in sync depends on the model code — confirm before changing one.
seq_len: 5      # historical sequence length
pred_len: 5     # prediction length
label_len: 0    # label length for Informer
batch_size: 32  # batch size for training
patch_len: 5    # patch length for PatchTST
stride: 1       # stride for sliding window
epochs: 25     # reduced for testing

# Availability-lag configuration
news_lag:
  max_lag: 0             # aligned by default; can be overridden in experiment scripts
  min_lag: 0             # coupled with max_lag; when max_lag > 0, a value >= 0 is recommended
  mode: "uniform"        # uniform / geometric
  geometric_p: 0.4       # parameter of the truncated geometric distribution
  drop_border: false     # whether samples that fall outside the border are dropped outright
  clamp_border: true     # if drop=false, clamp to the earliest visible news
  seed: null             # optional random seed; reuses the seed from overall.yaml

# Sweep ranges (read by scripts)
availability_lag_eval_ns: [0, 1, 2, 3]
impact_lag_eval_ls: [0, 1, 2, 3]
