


# train_file: "/train.json"
# vali_file: "/vali.json"
# test_file: "/test.json"
# # First-generation (ver0) news + md (meta_domain) embeddings
# # train_news_file: "/ver0/llama_embeddings/train_news.npy"
# # vali_news_file: "/ver0/llama_embeddings/vali_news.npy"
# # test_news_file: "/ver0/llama_embeddings/test_news.npy"
# # train_meta_file: "/ver0/llama_embeddings/train_meta_domain.npy"
# # vali_meta_file: "/ver0/llama_embeddings/vali_meta_domain.npy"
# # test_meta_file: "/ver0/llama_embeddings/test_meta_domain.npy"

# # Second-generation (ver1) news + md (meta_domain) embeddings
# train_news_file: "/ver1/llama_embeddings/train_news.npy"
# vali_news_file: "/ver1/llama_embeddings/vali_news.npy"
# test_news_file: "/ver1/llama_embeddings/test_news.npy"
# train_meta_file: "/ver1/llama_embeddings/train_meta_domain.npy"
# vali_meta_file: "/ver1/llama_embeddings/vali_meta_domain.npy"
# test_meta_file: "/ver1/llama_embeddings/test_meta_domain.npy"
# # # No ct data is available, so the md (meta_domain) embeddings are reused as ct1
# # train_ct1_file: "/ver0/llama_embeddings/train_meta_domain.npy"
# # vali_ct1_file: "/ver0/llama_embeddings/vali_meta_domain.npy"
# # test_ct1_file: "/ver0/llama_embeddings/test_meta_domain.npy"

# enc_in: 1
# seq_len: 7
# pred_len: 7
# label_len: 0
# batch_size: 16
# patch_len: 4
# stride: 1
# epochs: 30

# content: "Air quality indicators are key indicators for detecting the degree of air pollution in a region."
# hyper_parameters: []

# Dataset identity. How the loader combines alias, version and root is not
# visible in this file — TODO confirm against the data-loading code.
dataset_alias: 'Environment/ver_gen1'
# Previously used version, kept disabled for reference:
# dataset_version: 'ver_turn1_final'
dataset_version: 'ver_gen1'
dataset_root: 'dataset/Environment'

# Data preprocessing / modality control
# Text news is enabled by default.
use_multimodal: true
# Explicitly controls whether the news text is returned.
use_text_news: true
# Also load the news embeddings; the model may use them as needed.
use_news_embedding: true
# use_news_embedding: false
# Optionally load pre-encoded LLM hidden states.
use_llm_hidden: false
# News-embedding source for each split.
# NOTE(review): the "::<name>" suffix presumably selects an entry inside the
# .pt file — confirm against the loader.
train_news_embed_file: '/ver_camf/embedding_qwen/all_embeddings.pt::train_news'
vali_news_embed_file: '/ver_camf/embedding_qwen/all_embeddings.pt::vali_news'
test_news_embed_file: '/ver_camf/embedding_qwen/all_embeddings.pt::test_news'
# No pre-encoded hidden-state files are configured (use_llm_hidden is false).
train_news_hidden_file: null
vali_news_hidden_file: null
test_news_hidden_file: null

# time series parameters
# NOTE(review): patch_len equals seq_len here, so with stride 1 a 7-step
# window presumably yields a single patch — confirm this is intended.
seq_len: 7      # historical sequence length
pred_len: 7     # prediction length
label_len: 0    # label length for Informer
batch_size: 32  # batch size for training
patch_len: 7    # patch length for PatchTST
stride: 1       # stride for sliding window
epochs: 25     # reduced for testing

# Availability-lag configuration
news_lag:
  # Aligned by default (no lag); can be overridden in experiment scripts.
  max_lag: 0
  # Coupled with max_lag; when max_lag > 0 it is recommended to set this >= 0.
  min_lag: 0
  # Lag sampling mode: uniform / geometric.
  mode: 'uniform'
  # Parameter of the truncated geometric distribution.
  geometric_p: 0.4
  # Whether samples that fall outside the border are dropped outright.
  drop_border: false
  # If drop is false, clamp to the earliest visible news instead.
  clamp_border: true
  # Optional random seed; falls back to the seed from overall.yaml.
  seed: null

# Sweep ranges (read by scripts)
# NOTE(review): presumably the lag values iterated over by the evaluation
# scripts; the consumers are not visible in this file — confirm.
availability_lag_eval_ns: [0, 1, 2, 3]
impact_lag_eval_ls: [0, 1, 2, 3]
