{
    "train_data": [
        {
            "type": "hfds",
            "prefix": "amazon_reviews_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 16.4678276174]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/amazon_reviews_full/train"
        },
        {
            "type": "hfds",
            "prefix": "paq_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 22.5417926692]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/paq_full/train"
        },
        {
            "type": "hfds",
            "prefix": "s2orc_citation_title_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 3.2310768452]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/s2orc_citation_title_full/train"
        },
        {
            "type": "hfds",
            "prefix": "s2orc_title_abstract_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 15.08443898395]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/s2orc_title_abstract_full/train"
        },
        {
            "type": "hfds",
            "prefix": "s2orc_abstract_citation_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 3.1966268373]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/s2orc_abstract_citation_full/train"
        },
        {
            "type": "hfds",
            "prefix": "s2orc_abstract_body_index_filtered",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 2.7407833792]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/s2orc_abstract_body_index_filtered/train"
        },
        {
            "type": "hfds",
            "prefix": "wikianswers_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 4.2207391483]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/wikianswers_full/train"
        },
        {
            "type": "hfds",
            "prefix": "wiki_title_body_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 2.5933422827]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/wiki_title_body_full/train"
        },
        {
            "type": "hfds",
            "prefix": "gooaq_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.5360443819]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/gooaq_full/train"
        },
        {
            "type": "hfds",
            "prefix": "codesearch_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.3615181776]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/codesearch_full/train"
        },
        {
            "type": "hfds",
            "prefix": "yahoo_title_answer_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.1157856668]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/yahoo_title_answer_full/train"
        },
        {
            "type": "hfds",
            "prefix": "agnews_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.1758538278]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/agnews_full/train"
        },
        {
            "type": "hfds",
            "prefix": "amazon_qa_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.09461858785]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/amazon_qa_full/train"
        },
        {
            "type": "hfds",
            "prefix": "yahoo_qa_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.06003259585]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/yahoo_qa_full/train"
        },
        {
            "type": "hfds",
            "prefix": "yahoo_title_question_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.08925579255]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/yahoo_title_question_full/train"
        },
        {
            "type": "hfds",
            "prefix": "ccnews_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.147980012]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/ccnews_full/train"
        },
        {
            "type": "hfds",
            "prefix": "npr_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.1527520086]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/npr_full/train"
        },
        {
            "type": "hfds",
            "prefix": "eli5_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.04467852421]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/eli5_full/train"
        },
        {
            "type": "hfds",
            "prefix": "cnn_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.1228129078]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/cnn_full/train"
        },
        {
            "type": "hfds",
            "prefix": "stackexchange_question_question_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.03063199218]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/stackexchange_question_question_full/train"
        },
        {
            "type": "hfds",
            "prefix": "stackexchange_title_body_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.03376381108]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/stackexchange_title_body_full/train"
        },
        {
            "type": "hfds",
            "prefix": "stackexchange_body_body_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.02748511043]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/stackexchange_body_body_full/train"
        },
        {
            "type": "hfds",
            "prefix": "sentence_compression_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.07263811462]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/sentence_compression_full/train"
        },
        {
            "type": "hfds",
            "prefix": "wikihow_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.04017975109]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/wikihow_full/train"
        },
        {
            "type": "hfds",
            "prefix": "altlex_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.0463216308]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/altlex_full/train"
        },
        {
            "type": "hfds",
            "prefix": "quora_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.01878045307]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/quora_full/train"
        },
        {
            "type": "hfds",
            "prefix": "simplewiki_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.04088603169]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/simplewiki_full/train"
        },
        {
            "type": "hfds",
            "prefix": "squad_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 0.01050927124]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/squad_full/train"
        },
        {
            "type": "hfds",
            "prefix": "reddit_full",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "max_epoch": 1, 
            "scheduler": [
            [0, ["const", 27.7008435877]]
            ],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_src_split/reddit_full/train"
        },
        {
            "type": "hfds",
            "prefix": "train_nomic_positive_only_combined",
            "data_signature": {"keys":["query", "document"], "format_fn": "pass_retrieval_pair"},
            "weight": 0,
            "scheduler": ["base-renorm"],
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/nomic_positive_only_combined/train"
        }

    ],
    "val_data": [
        {
            "type": "hfds",
            "prefix": "train_alpaca",
            "data_signature": {"keys":["question", "response"], "format_fn": "pass_retrieval_pair"},
            "weight": 1,
            "data_dir": "/XXXX-30/XXXX-29/XXXX-31/proj-shared/language_datasets/processed/alpaca_subset/train"
        }
    ]
}