.gitignore
.isort.cfg
README.md
pyproject.toml
.github/workflows/publish.yml
configs/eval/default.yaml
configs/eval/quick.yaml
configs/eval/quick_pretrained.yaml
configs/serve/char_shakespeare.yaml
configs/serve/tinyllama.yaml
configs/train/defaults.yaml
configs/train/train_llama.yaml
configs/train/train_llama_shakespeare.yaml
configs/train/criterion/cross_entropy.yaml
configs/train/loggers/basic.yaml
configs/train/loggers/none.yaml
configs/train/lr_scheduler/cosine.yaml
configs/train/lr_scheduler/wsd.yaml
configs/train/model/llama2-x-lite.yaml
configs/train/model/llama2.yaml
configs/train/optimization/amp/bfloat16.yaml
configs/train/optimization/amp/disabled.yaml
configs/train/optimization/amp/float16.yaml
optimus_dl/__init__.py
optimus_dl/_version.py
optimus_dl/py.typed
optimus_dl.egg-info/PKG-INFO
optimus_dl.egg-info/SOURCES.txt
optimus_dl.egg-info/dependency_links.txt
optimus_dl.egg-info/entry_points.txt
optimus_dl.egg-info/requires.txt
optimus_dl.egg-info/top_level.txt
optimus_dl/core/__init__.py
optimus_dl/core/bootstrap.py
optimus_dl/core/device.py
optimus_dl/core/env.py
optimus_dl/core/log.py
optimus_dl/core/model_utils.py
optimus_dl/core/omegaconf.py
optimus_dl/core/profile.py
optimus_dl/core/registry.py
optimus_dl/modules/__init__.py
optimus_dl/modules/checkpoint/__init__.py
optimus_dl/modules/checkpoint/checkpoint_manager.py
optimus_dl/modules/checkpoint/load_strategy.py
optimus_dl/modules/criterion/__init__.py
optimus_dl/modules/criterion/base.py
optimus_dl/modules/criterion/config.py
optimus_dl/modules/criterion/cross_entropy.py
optimus_dl/modules/data/__init__.py
optimus_dl/modules/data/config.py
optimus_dl/modules/data/datasets/__init__.py
optimus_dl/modules/data/datasets/base.py
optimus_dl/modules/data/datasets/composite.py
optimus_dl/modules/data/datasets/huggingface.py
optimus_dl/modules/data/datasets/loop_dataset.py
optimus_dl/modules/data/datasets/tokenized_flat_dataset.py
optimus_dl/modules/data/datasets/txt_lines.py
optimus_dl/modules/data/presets/__init__.py
optimus_dl/modules/data/presets/fineweb-edu.py
optimus_dl/modules/data/presets/slimpajama.py
optimus_dl/modules/data/presets/tinyshakespeare.py
optimus_dl/modules/data/transforms/__init__.py
optimus_dl/modules/data/transforms/base.py
optimus_dl/modules/data/transforms/chunk_tokens.py
optimus_dl/modules/data/transforms/composite.py
optimus_dl/modules/data/transforms/flat_tokens_batcher.py
optimus_dl/modules/data/transforms/prefetch.py
optimus_dl/modules/data/transforms/shuffle.py
optimus_dl/modules/data/transforms/to_device.py
optimus_dl/modules/data/transforms/tokenize.py
optimus_dl/modules/distributed/__init__.py
optimus_dl/modules/distributed/base.py
optimus_dl/modules/distributed/fake.py
optimus_dl/modules/distributed/mesh.py
optimus_dl/modules/eval/__init__.py
optimus_dl/modules/eval/model.py
optimus_dl/modules/loggers/__init__.py
optimus_dl/modules/loggers/base.py
optimus_dl/modules/loggers/config.py
optimus_dl/modules/loggers/jsonl.py
optimus_dl/modules/loggers/wandb.py
optimus_dl/modules/lr_scheduler/__init__.py
optimus_dl/modules/lr_scheduler/base.py
optimus_dl/modules/lr_scheduler/cosine_annealing.py
optimus_dl/modules/lr_scheduler/linear_warmup.py
optimus_dl/modules/lr_scheduler/wsd_scheduler.py
optimus_dl/modules/metrics/__init__.py
optimus_dl/modules/metrics/base.py
optimus_dl/modules/metrics/common.py
optimus_dl/modules/model/__init__.py
optimus_dl/modules/model/base.py
optimus_dl/modules/model/config.py
optimus_dl/modules/model/gpt2.py
optimus_dl/modules/model/llama2.py
optimus_dl/modules/model/blocks/__init__.py
optimus_dl/modules/model/blocks/attention.py
optimus_dl/modules/model/blocks/layer_norms.py
optimus_dl/modules/model/presets/__init__.py
optimus_dl/modules/model/presets/hf_llama.py
optimus_dl/modules/model_transforms/__init__.py
optimus_dl/modules/model_transforms/base.py
optimus_dl/modules/model_transforms/compile.py
optimus_dl/modules/model_transforms/config.py
optimus_dl/modules/model_transforms/distributed.py
optimus_dl/modules/optim/__init__.py
optimus_dl/modules/optim/adamw.py
optimus_dl/modules/optim/config.py
optimus_dl/modules/tokenizer/__init__.py
optimus_dl/modules/tokenizer/base.py
optimus_dl/modules/tokenizer/config.py
optimus_dl/modules/tokenizer/implementations/__init__.py
optimus_dl/modules/tokenizer/implementations/char.py
optimus_dl/modules/tokenizer/implementations/huggingface.py
optimus_dl/modules/tokenizer/implementations/tiktoken.py
optimus_dl/recipe/__init__.py
optimus_dl/recipe/eval/__init__.py
optimus_dl/recipe/eval/base.py
optimus_dl/recipe/eval/config.py
optimus_dl/recipe/mixins/__init__.py
optimus_dl/recipe/mixins/model_builder.py
optimus_dl/recipe/serve/__init__.py
optimus_dl/recipe/serve/base.py
optimus_dl/recipe/serve/config.py
optimus_dl/recipe/serve/models.py
optimus_dl/recipe/train/__init__.py
optimus_dl/recipe/train/base.py
optimus_dl/recipe/train/config.py
optimus_dl/recipe/train/builders/__init__.py
optimus_dl/recipe/train/builders/criterion_builder.py
optimus_dl/recipe/train/builders/data_builder.py
optimus_dl/recipe/train/builders/optimizer_builder.py
optimus_dl/recipe/train/builders/scheduler_builder.py
optimus_dl/recipe/train/mixins/execution/__init__.py
optimus_dl/recipe/train/mixins/execution/context_mixin.py
optimus_dl/recipe/train/mixins/execution/interruption_mixin.py
optimus_dl/recipe/train/mixins/execution/iteration_mixin.py
optimus_dl/recipe/train/mixins/managers/__init__.py
optimus_dl/recipe/train/mixins/managers/evaluation_manager.py
optimus_dl/recipe/train/mixins/managers/logger_manager.py
scripts/eval.py
scripts/serve.py
scripts/train.py
tests/criterion/test_cross_entropy.py
tests/data/test_char_tokenize.py
tests/data/test_composite_dataset_v2.py
tests/data/test_hf_dataset.py
tests/data/test_tokenized_flat_dataset.py
tests/data/test_txt_lines.py
tests/integration/__init__.py
tests/integration/test_data_pipeline.py
tests/integration/test_training_pipeline.py
tests/loggers/test_loggers.py
tests/lr_scheduler/test_base.py
tests/lr_scheduler/test_cosine_annealing.py
tests/lr_scheduler/test_linear_warmup.py
tests/metrics/test_metrics_system.py
tests/model/test_attention.py
tests/model/test_gpt2.py
tests/model/test_hf_llama_loading.py
tests/model/test_layer_norms.py
tests/model/test_llama2.py
tests/model/test_logits_matching.py
tests/optim/test_adamw.py