name: "tinyRSNN-attention"

#seq_forward: False
seq_forward: True
spike_after_dynamic: False
multiSyn_LIF: False
adaptive_bn: False
Rep_Linear: False
separate_brain_area: False
firingRate_Decoder: False

BatchNorm: True
#output_BN: True
output_BN: False
multi_BN: False
#multi_BN: True
Layer_init: True
area_wise: False
#no_MLP: True
no_MLP: False
readout_MLP: False
pretrain_forze: False
reshape_num: 4
#reshape_num: 8

output_feedback: False
output_crossAttention: False
output_feedback_timestep: 16
#deefback_hidden_size: 96
self_and_crossAttention: False
feedback_max_epoch_ratio: 0.75
feedback_teacher_forcing_ratio_start: 0.8
feedback_teacher_forcing_ratio_end: 0
step_training: False
step_num: 3


multi_hidden: False
hidden_shortcut: False
# block1：Linear Hidden layers
nb_linear_hidden: 0
linear_hidden_size: [192]
linear_hidden_dim: [1]
linear_hidden_recurrent: [True]
# block1：conv Hidden layers
nb_conv_hidden: 0
conv_hidden_stride: [2]
conv_hidden_recurrent: [True]
conv_hidden_kernel_size: [5]
conv_hidden_nb_filters: [6]
# block1：linear Hidden encoder
linear_encode_size: [4, 256]

# block2：Attention Hidden layers
forward_shortcut: False
nb_Attention_hidden: 1
nb_Attention_embed: [4] #
nb_Attention_head: [4]
Attention_parameter_scale: 1
Attention_qkv_mix: False
#Attention_qkv_mix: True
#Attention_qkv: linear #linear or conv
#Attention_qkv: conv #linear or conv
Attention_qkv: conv_linear #linear or conv
Attention_hidden_recurrent_qkv: [False]
#Attention_hidden_recurrent_qkv: [True]
# for linear
commom_linear: False
Attention_hidden_size: [48]
Linear_bias: False
# for conv:
Attention_kernel_size: [3]
Attention_conv_stride: [1]
#Repconv: "LayerNorm"
Repconv: True
Attention_recurrent: [True]
# MLP
shortcut: True
shortcut_opFlag: False
shortcut_Linear: True
#MLP_size: [192]
MLP_size: [512]
MLP_id_map: False
#shortcut_Linear: False
Attention_hidden_recurrent_MLP: [True]
#connection_class: Connection_withBatchNorm

# no attention
nb_hidden: 1
#hidden_size: [64]
hidden_size: [1024]
recurrent: [True]


# Neuron parameters
tau_mem: 20e-3
tau_syn: 10e-3

# Stochastic
stochastic: False

# Dropout
dropout_p: 0.3

# Heterogenous time constants
het_timescales: True
het_timescales_readout: True

learn_timescales: True
learn_timescales_readout: True

# Delta synapses
delta_synapses: False

# half precision
is_half: False

# Readout
multiple_readouts: True
#multiple_readouts: False

tau_mem_readout: 50e-3
tau_syn_readout: 10e-3

readouts:
  ro1:
    type: default
  ro2:
    type: default
    tau_syn: 5e-3
    tau_mem: 20e-3
  ro3:
    type: default
    tau_syn: 20e-3
    tau_mem: 20e-3
  ro4:
    type: default
    tau_syn: 10e-3
    tau_mem: 30e-3
  ro5:
    type: default
    tau_syn: 30e-3
    tau_mem: 100e-3