
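# MultiModal Baseline with Dynamic Dropout and BERT Transformer
# Based on MultiModal_Baseline_Dynamic_Dropout, with a BERT Transformer replacing average pooling.
# Supports token-level text input and learnable dropout of important tokens.
# Uses the BERT Transformer for contextual encoding and CLS extraction instead of simple average pooling.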

# Keys holding a list here are also named under `hyper_parameters`;
# presumably each list enumerates the candidate values for the search
# (verify against the config loader).

# Single-value alternative: learning_rate: [0.005]
learning_rate: [0.001, 0.005, 0.01]

requires_news_embedding: true

# Single-value alternative: embedding_size: 512
embedding_size: [256, 512, 1024]

# Searchable alternative: depth: [5, 10, 15]
depth: 10

# List-form alternative: num_envs: [10]
num_envs: 10

# Dropout settings. `meta_drop` is fixed; the other three are lists.
# Single-value alternative: dropout: 0.1
dropout: [0.1, 0.2, 0.3]
meta_drop: 0.1
# Single-value alternative: sudden_drop: 0.1
sudden_drop: [0.1, 0.2, 0.3]
# Single-value alternative: fuse_drop: 0.1
fuse_drop: [0.1, 0.2, 0.3]

# Fixed (non-searched) model settings.
# NOTE(review): the names resemble Informer-style encoder/decoder options;
# confirm their exact meaning against the model code.
e_layers: 1
d_layers: 1
factor: 3
enc_in: 1
dec_in: 1
c_out: 1
# NOTE(review): the key is spelled `embedd`; confirm the loader reads this
# exact name (and not `embed`) before renaming anything.
embedd: timeF
# Booleans are written in canonical lowercase so every YAML loader and
# linter (yamllint `truthy`) treats them identically.
use_multimodal: true
inverse: false
text_emb_dim: 4096

# BERT Transformer configuration (optional)
# bert_model_name: bert-base-uncased  # default value; can be overridden in the config
# bert_model_path: /path/to/local/bert/model  # local BERT model path (use this when the Hugging Face Hub is unreachable)
# NOTE(review): absolute, machine-specific path; confirm it exists on the
# host that runs this config.
bert_model_path: '/public/home/maoyaoxin/llh/MMTSF/hf_home/bert-base-uncased'

# Loss weights for dynamic dropout
beta1: 0.2
beta2: 0.2
# Word-embedding loss weight: supervises the post-dropout embeddings so
# they stay close to the ideal embeddings.
beta3: 0.1
# Reconstruction loss weight (reserved for future use).
beta4: 0.05

# DataLoader configuration
# - 0: single-process loading; slightly slower but stable. Recommended when
#   several training jobs run at once, to avoid exhausting thread resources.
# - 2-4: faster data loading; suitable when only one training job is running.
# NOTE(review): the current value assumes a single training job; drop it to 0
# before launching concurrent runs.
num_workers: 2

# Hyperparameter search space: names of the keys above whose values are lists.
hyper_parameters:
  - learning_rate
  - embedding_size
  - dropout
  - sudden_drop
  - fuse_drop

