# Seed value; presumably feeds the random-number generators for reproducibility
# (confirm against the code that consumes this config).
seed: 1024
data:
    # Dataset identity and input modality.
    dataset: 'k400'
    modality: 'video'
    # NOTE(review): presumably the number of labels in label_list (the
    # "novel" split of the B2N lists below) - confirm before changing.
    num_classes: 200

    # Sampling and input geometry.
    # NOTE(review): presumably 8 segments of 1 frame each per clip, with a
    # 224-pixel input - confirm against the data loader.
    num_segments: 8
    seg_length: 1
    input_size: 224

    # Loader settings.
    batch_size: 4
    workers: 8

    # Validation inputs. val_root is an absolute local path and has to be
    # adjusted per machine; the two list paths are relative.
    val_root: '/media/h/Lenovo/DATASET/k400/videos_256/val_256/'
    val_list: 'lists/k400/B2N/k400_novel_vallist.txt'
    label_list: 'lists/k400/B2N/k400_novel_labels.csv'

    # Frame filename template (Python str.format style, 5-digit zero-padded).
    # NOTE(review): index_bias is presumably the first frame index - confirm.
    image_tmpl: 'img_{:05d}.jpg'
    index_bias: 1
network:
    # Backbone architecture identifier. Noted alternative: ViT-L/14.
    arch: 'ViT-B/16'
    # Canonical lowercase boolean (same value as the former `True`).
    init: true
    # Dropout rates, both set to 0.0.
    drop_out: 0.0
    emb_dropout: 0.0
    # Quoted on purpose: a plain None in YAML is the *string* "None", not
    # null. Quoting keeps the loaded value identical and makes that explicit.
    # NOTE(review): if the consumer actually expects null, write `null` here.
    sim_header: 'None'
    # Interaction mode. Noted options: DP, VCS.
    interaction: 'DP'
    temporal_layer: 4
logging:
    # Reporting cadence. The units (iterations vs. epochs) are not stated in
    # this file - confirm against the code that consumes these values.
    print_freq: 10
    eval_freq: 1