.gitignore
CLAUDE.md
LICENSE.md
Readme.md
image.png
pyproject.toml
test-vector-projection.py
test.jsonl
tox.ini
uv.lock
.github/dependabot.yml
.github/workflows/claude.yml
.github/workflows/pr-tests.yml
.github/workflows/pypi.yaml
benchmarks/bench_v_proj.py
docs/distributed_initialization.md
docs/superpowers/specs/2026-04-02-full-state-checkpointing-design.md
regression_tests/README.md
regression_tests/benchmark_batching.py
regression_tests/run_multi_node_fidelity_test.sh
regression_tests/test_checkpoint_all_models.py
regression_tests/test_full_state_checkpoint_fidelity.py
regression_tests/test_full_state_checkpoint_signal.sh
regression_tests/test_gpt_oss_conversion_accuracy.py
regression_tests/test_osft_fidelity_script.py
regression_tests/test_osft_orthogonalization.py
research_scratch/README.md
research_scratch/fsdp1_dummy_script.py
research_scratch/fsdp1_wrapper.py
research_scratch/sequence_length_experiment.py
scripts/convert_to_pretrain.py
scripts/process_data.py
src/mini_trainer/__init__.py
src/mini_trainer/_version.py
src/mini_trainer/api_train.py
src/mini_trainer/async_structured_logger.py
src/mini_trainer/batch_metrics.py
src/mini_trainer/batch_packer.py
src/mini_trainer/fsdp2_lazy_init.py
src/mini_trainer/full_state_checkpoint.py
src/mini_trainer/gpt_oss_utils.py
src/mini_trainer/mlflow_wrapper.py
src/mini_trainer/none_reduction_losses.py
src/mini_trainer/osft_utils.py
src/mini_trainer/sampler.py
src/mini_trainer/setup_model_for_training.py
src/mini_trainer/train.py
src/mini_trainer/training_types.py
src/mini_trainer/utils.py
src/mini_trainer/vlm_utils.py
src/mini_trainer/wandb_wrapper.py
src/rhai_innovation_mini_trainer.egg-info/PKG-INFO
src/rhai_innovation_mini_trainer.egg-info/SOURCES.txt
src/rhai_innovation_mini_trainer.egg-info/dependency_links.txt
src/rhai_innovation_mini_trainer.egg-info/requires.txt
src/rhai_innovation_mini_trainer.egg-info/top_level.txt
tests/__init__.py
tests/conftest.py
tests/test_api_train.py
tests/test_async_logger.py
tests/test_batch_lengths_to_minibatches.py
tests/test_data_loader.py
tests/test_data_loader_pretraining.py
tests/test_dtype_conversion.py
tests/test_full_state_checkpoint.py
tests/test_integration_small_models.py
tests/test_model_initialization.py
tests/test_osft.py
tests/test_osft_dtype_functionality.py
tests/test_osft_fidelity.py
tests/test_pretraining_dataset.py
tests/test_scheduler_config.py
tests/test_training_components.py
tests/test_training_loop.py
tests/gpu_tests/__init__.py
tests/gpu_tests/conftest.py
tests/gpu_tests/setup_flash_attn.py
tests/gpu_tests/test_distributed_utils.py
tests/gpu_tests/test_mixed_precision.py
tests/test_utils/__init__.py
tests/test_utils/orthogonality.py
tutorials/tensor_paralleism_getting_started.py