LICENSE
MANIFEST.in
README.md
pyproject.toml
setup.py
open_lm/__init__.py
open_lm/attention.py
open_lm/data.py
open_lm/distributed.py
open_lm/evaluate.py
open_lm/file_utils.py
open_lm/logger.py
open_lm/losses.py
open_lm/main.py
open_lm/meters.py
open_lm/model.py
open_lm/norms.py
open_lm/params.py
open_lm/precision.py
open_lm/scheduler.py
open_lm/train.py
open_lm.egg-info/PKG-INFO
open_lm.egg-info/SOURCES.txt
open_lm.egg-info/dependency_links.txt
open_lm.egg-info/requires.txt
open_lm.egg-info/top_level.txt
open_lm/datapreprocess/__init__.py
open_lm/datapreprocess/make_2048.py
open_lm/datapreprocess/make_assistant_data.py
open_lm/datapreprocess/wiki_download.py
open_lm/datapreprocess/ray/__init__.py
open_lm/datapreprocess/ray/token_counter.py
open_lm/datapreprocess/ray/tokenize_shuffle.py
open_lm/model_configs/__init__.py
open_lm/model_configs/ant_neox.json
open_lm/model_configs/aphid_neox.json
open_lm/model_configs/atom_neox.json
open_lm/model_configs/g3b_neox.json
open_lm/model_configs/l7b_neox.json
open_lm/model_configs/llama2_7b.json
open_lm/model_configs/m1b_neox.json
open_lm/model_configs/m1b_tiktoken.json
open_lm/model_configs/mamba_130m.json
open_lm/model_configs/mamba_1b.json
open_lm/model_configs/mamba_7b.json
open_lm/model_configs/marmot_neox.json
open_lm/model_configs/open_lm_11m.json
open_lm/model_configs/open_lm_11m_v2.json
open_lm/model_configs/open_lm_154m_v2.json
open_lm/model_configs/open_lm_160m.json
open_lm/model_configs/open_lm_1b.json
open_lm/model_configs/open_lm_1b_old.json
open_lm/model_configs/open_lm_25m.json
open_lm/model_configs/open_lm_3b.json
open_lm/model_configs/open_lm_410m.json
open_lm/model_configs/open_lm_411m_v2.json
open_lm/model_configs/open_lm_41m.json
open_lm/model_configs/open_lm_79m_v2.json
open_lm/model_configs/open_lm_7b.json
open_lm/model_configs/open_lm_830m.json
open_lm/model_configs/open_lm_87m.json
open_lm/model_configs/open_lm_test_tiny.json
open_lm/model_configs/potato_neox.json
open_lm/model_configs/quark_neox.json
open_lm/positional_embedding/__init__.py
open_lm/positional_embedding/head_rotary.py
open_lm/positional_embedding/llama_rotary.py
open_lm/positional_embedding/none.py
open_lm/positional_embedding/rotary.py
open_lm/utils/__init__.py
open_lm/utils/averaging_utils.py
open_lm/utils/convert_llama.py
open_lm/utils/llm_foundry_wrapper.py
open_lm/utils/make_wds_manifest.py
open_lm/utils/update_manifest.py
open_lm/utils/transformers/__init__.py
open_lm/utils/transformers/convert_to_hf.py
open_lm/utils/transformers/generation.py
open_lm/utils/transformers/hf_config.py
open_lm/utils/transformers/hf_model.py
open_lm/utils/transformers/hf_wrapper.py
tests/__init__.py
tests/shared.py
tests/test_attention_masking.py
tests/test_custom_attention.py
tests/test_dataset_basic.py
tests/test_dataset_deterministic.py
tests/test_dataset_no_resample.py
tests/test_file_utils.py
tests/test_generate_kv_cache_time.py
tests/test_generate_load_kv_cache_equal.py
tests/test_grad_accum.py
tests/test_loss_masking.py
tests/test_make_wds_manifest.py
tests/test_param_parsing.py
tests/test_save_load.py
tests/test_save_load_from_main.py
tests/test_tiny_generate_kv_cache_equal.py
tests/test_tokenize_shuffle.py
tests/test_training_simple.py
tests/test_training_tokens.py
tests/utils.py