LICENSE
README.md
pyproject.toml
setup.cfg
setup.py
examples/__init__.py
examples/architext.py
examples/ilql_sentiments.py
examples/ilql_sentiments_t5.py
examples/nemo_ilql_inference.py
examples/nemo_ilql_sentiments.py
examples/nemo_sft_sentiments.py
examples/ppo_sentiments.py
examples/ppo_sentiments_llama.py
examples/ppo_sentiments_t5.py
examples/ppo_translation_t5.py
examples/sft_sentiments.py
examples/simulacra.py
examples/randomwalks/__init__.py
examples/randomwalks/ilql_randomwalks.py
examples/randomwalks/ppo_randomwalks.py
examples/randomwalks/randomwalks.py
examples/summarize_daily_cnn/__init__.py
examples/summarize_daily_cnn/t5_summarize_daily_cnn.py
tests/test_configs.py
tests/test_minibatch.py
tests/test_models.py
tests/test_pipelines.py
tests/test_trainers.py
tests/test_utils.py
trlx/__init__.py
trlx/reference.py
trlx/sweep.py
trlx/trlx.py
trlx.egg-info/PKG-INFO
trlx.egg-info/SOURCES.txt
trlx.egg-info/dependency_links.txt
trlx.egg-info/requires.txt
trlx.egg-info/top_level.txt
trlx/data/__init__.py
trlx/data/accelerate_base_datatypes.py
trlx/data/configs.py
trlx/data/default_configs.py
trlx/data/ilql_types.py
trlx/data/method_configs.py
trlx/data/ppo_types.py
trlx/models/__init__.py
trlx/models/modeling_base.py
trlx/models/modeling_ilql.py
trlx/models/modeling_nemo_ilql.py
trlx/models/modeling_nemo_sft.py
trlx/models/modeling_ppo.py
trlx/pipeline/__init__.py
trlx/pipeline/offline_pipeline.py
trlx/pipeline/ppo_pipeline.py
trlx/trainer/__init__.py
trlx/trainer/accelerate_base_trainer.py
trlx/trainer/accelerate_ilql_trainer.py
trlx/trainer/accelerate_ppo_trainer.py
trlx/trainer/accelerate_sft_trainer.py
trlx/trainer/nemo_ilql_trainer.py
trlx/trainer/nemo_sft_trainer.py
trlx/utils/__init__.py
trlx/utils/loading.py
trlx/utils/logging.py
trlx/utils/modeling.py