# Pretrained model to load (presumably a checkpoint path — confirm against the
# loader). Zero-shot evaluation needs a pretrained model, so set this before
# running; it is explicitly null (unset) here.
pretrain: null
# Seed value (presumably for RNG initialisation — confirm against the caller).
seed: 1024
# Settings grouped under `data`: dataset identity, frame sampling, batching,
# and the list files that are read.
data:
    dataset: kinetics700
    modality: RGB
    num_segments: 8
    seg_length: 1
    split: 1
    batch_size: 64
    workers: 16
    # NOTE(review): 322 classes while `dataset` is kinetics700 — presumably a
    # subset of the label set; confirm against label_list.
    num_classes: 322
    # Quoted because the value starts with `{`, which would otherwise be read
    # as the start of a YAML flow mapping.
    image_tmpl: '{:06d}.jpg'
    val_list: 'lists/kinetics_700_val_frames.txt'
    label_list: 'lists/kinetics_700_labels.csv'
    index_bias: 1
    input_size: 224
    random_shift: false
# Settings grouped under `network`: backbone choice, dropout, and the
# similarity header.
network:
    arch: ViT-B/16  # alternatives noted by the author: ViT-B/32, ViT-B/16
    init: true
    tsm: false
    drop_out: 0.0  # probability of an element being zeroed
    emb_dropout: 0.0  # probability of an embedding being zeroed
    type: clip_k700
    # Options noted by the author: Transf, meanP, LSTM, Conv_1D, Transf_cls
    sim_header: 'Transf'
    joint: false
    # Explicitly unset; a bare `describe:` parses to the same null value.
    describe: null
    ratio: 1
    f_ratio: 10
# Reporting cadence. Units are not stated in this file — presumably
# iterations for print_freq and epochs for eval_freq; confirm against the
# consumer.
logging:
    eval_freq: 1
    print_freq: 10
# NOTE(review): this section key is upper-case, unlike the other sections.
# It is presumably looked up by this exact name, so the casing is kept.
DENOISER:
    corpus: './en.json'
    top_k: 10
    num_beams: 1
    num_iter: 10
    percentage: 100
    temp: 'linear'  # options noted by the author: linear, log
    # Output path template with two positional `{:}` placeholders.
    result: './new_textlist_beam{:}_{:}.list'
    idx_sim: 1
    intra: true
    inter: true
    Q_style: 'mean'  # options noted by the author: max, mean