LICENSE
README.md
pyproject.toml
src/modalities/__init__.py
src/modalities/__main__.py
src/modalities/api.py
src/modalities/batch.py
src/modalities/evaluator.py
src/modalities/exceptions.py
src/modalities/gym.py
src/modalities/loss_functions.py
src/modalities/main.py
src/modalities/trainer.py
src/modalities/util.py
src/modalities.egg-info/PKG-INFO
src/modalities.egg-info/SOURCES.txt
src/modalities.egg-info/dependency_links.txt
src/modalities.egg-info/entry_points.txt
src/modalities.egg-info/requires.txt
src/modalities.egg-info/top_level.txt
src/modalities/checkpointing/__init__.py
src/modalities/checkpointing/checkpoint_conversion.py
src/modalities/checkpointing/checkpoint_loading.py
src/modalities/checkpointing/checkpoint_saving.py
src/modalities/checkpointing/checkpoint_saving_execution.py
src/modalities/checkpointing/checkpoint_saving_instruction.py
src/modalities/checkpointing/checkpoint_saving_strategies.py
src/modalities/checkpointing/fsdp/__init__.py
src/modalities/checkpointing/fsdp/fsdp_checkpoint_loading.py
src/modalities/checkpointing/fsdp/fsdp_checkpoint_saving.py
src/modalities/checkpointing/stateful/__init__.py
src/modalities/checkpointing/stateful/app_state.py
src/modalities/checkpointing/stateful/app_state_factory.py
src/modalities/checkpointing/torch/__init__.py
src/modalities/checkpointing/torch/torch_checkpoint_loading.py
src/modalities/config/__init__.py
src/modalities/config/component_factory.py
src/modalities/config/config.py
src/modalities/config/instantiation_models.py
src/modalities/config/lookup_enum.py
src/modalities/config/pydantic_if_types.py
src/modalities/config/utils.py
src/modalities/conversion/__init__.py
src/modalities/conversion/gpt2/__init__.py
src/modalities/conversion/gpt2/configuration_gpt2.py
src/modalities/conversion/gpt2/conversion_code.py
src/modalities/conversion/gpt2/conversion_model.py
src/modalities/conversion/gpt2/conversion_tokenizer.py
src/modalities/conversion/gpt2/convert_gpt2.py
src/modalities/conversion/gpt2/modeling_gpt2.py
src/modalities/dataloader/__init__.py
src/modalities/dataloader/apply_chat_template.py
src/modalities/dataloader/create_index.py
src/modalities/dataloader/create_instruction_tuning_data.py
src/modalities/dataloader/create_packed_data.py
src/modalities/dataloader/dataloader.py
src/modalities/dataloader/dataloader_factory.py
src/modalities/dataloader/dataset.py
src/modalities/dataloader/dataset_factory.py
src/modalities/dataloader/filter_packed_data.py
src/modalities/dataloader/large_file_lines_reader.py
src/modalities/dataloader/sampler_factory.py
src/modalities/dataloader/samplers.py
src/modalities/dataloader/collate_fns/collate_if.py
src/modalities/dataloader/collate_fns/collator_fn_wrapper_for_loss_masking.py
src/modalities/dataloader/preprocessing/__init__.py
src/modalities/dataloader/preprocessing/tokenization/tokenized_file_writer.py
src/modalities/inference/__init__.py
src/modalities/inference/inference.py
src/modalities/inference/text/__init__.py
src/modalities/inference/text/config.py
src/modalities/inference/text/inference_component.py
src/modalities/logging_broker/__init__.py
src/modalities/logging_broker/message_broker.py
src/modalities/logging_broker/messages.py
src/modalities/logging_broker/publisher.py
src/modalities/logging_broker/subscriber.py
src/modalities/logging_broker/subscriber_impl/__init__.py
src/modalities/logging_broker/subscriber_impl/progress_subscriber.py
src/modalities/logging_broker/subscriber_impl/results_subscriber.py
src/modalities/logging_broker/subscriber_impl/subscriber_factory.py
src/modalities/models/__init__.py
src/modalities/models/model.py
src/modalities/models/model_factory.py
src/modalities/models/utils.py
src/modalities/models/coca/__init__.py
src/modalities/models/coca/attention_pooling.py
src/modalities/models/coca/coca_model.py
src/modalities/models/coca/collator.py
src/modalities/models/coca/multi_modal_decoder.py
src/modalities/models/coca/text_decoder.py
src/modalities/models/components/__init__.py
src/modalities/models/components/layer_norms.py
src/modalities/models/gpt2/__init__.py
src/modalities/models/gpt2/collator.py
src/modalities/models/gpt2/gpt2_model.py
src/modalities/models/huggingface/__init__.py
src/modalities/models/huggingface/huggingface_model.py
src/modalities/models/huggingface_adapters/__init__.py
src/modalities/models/huggingface_adapters/hf_adapter.py
src/modalities/models/parallelism/__init__.py
src/modalities/models/parallelism/pipeline_parallelism.py
src/modalities/models/parallelism/pipeline_parallelism_configs.py
src/modalities/models/parallelism/stages_generator.py
src/modalities/models/parallelism/stages_generator_configs.py
src/modalities/models/vision_transformer/__init__.py
src/modalities/models/vision_transformer/vision_transformer_model.py
src/modalities/nn/__init__.py
src/modalities/nn/attention.py
src/modalities/nn/mlp.py
src/modalities/nn/model_initialization/__init__.py
src/modalities/nn/model_initialization/composed_initialization.py
src/modalities/nn/model_initialization/initialization_if.py
src/modalities/nn/model_initialization/initialization_routines.py
src/modalities/nn/model_initialization/parameter_name_filters.py
src/modalities/optimizers/__init__.py
src/modalities/optimizers/lr_schedulers.py
src/modalities/optimizers/optimizer_factory.py
src/modalities/optimizers/optimizer_list.py
src/modalities/optimizers/scheduler_list.py
src/modalities/preprocessing/__init__.py
src/modalities/preprocessing/create_chunks.py
src/modalities/preprocessing/shuffle_data.py
src/modalities/registry/__init__.py
src/modalities/registry/components.py
src/modalities/registry/registry.py
src/modalities/running_env/__init__.py
src/modalities/running_env/cuda_env.py
src/modalities/running_env/env_utils.py
src/modalities/running_env/fsdp/__init__.py
src/modalities/running_env/fsdp/device_mesh.py
src/modalities/running_env/fsdp/fsdp_auto_wrapper.py
src/modalities/running_env/fsdp/reducer.py
src/modalities/tokenization/__init__.py
src/modalities/tokenization/tokenizer_wrapper.py
src/modalities/training/__init__.py
src/modalities/training/training_progress.py
src/modalities/training/activation_checkpointing/__init__.py
src/modalities/training/activation_checkpointing/activation_checkpointing.py
src/modalities/training/activation_checkpointing/activation_checkpointing_variants.py
src/modalities/training/gradient_clipping/__init__.py
src/modalities/training/gradient_clipping/fsdp_gradient_clipper.py
src/modalities/training/gradient_clipping/fsdp_gradient_clipper_config.py
src/modalities/training/gradient_clipping/gradient_clipper.py
src/modalities/utils/__init__.py
src/modalities/utils/communication_test.py
src/modalities/utils/debug.py
src/modalities/utils/debug_components.py
src/modalities/utils/debugging_configs.py
src/modalities/utils/deprecated_alias.py
src/modalities/utils/file_ops.py
src/modalities/utils/logger_utils.py
src/modalities/utils/maybe_list_parameter.py
src/modalities/utils/mfu.py
src/modalities/utils/number_conversion.py
src/modalities/utils/seeding.py
src/modalities/utils/typing_utils.py
src/modalities/utils/verify_tokenization_consistency.py
src/modalities/utils/benchmarking/__init__.py
src/modalities/utils/benchmarking/benchmarking_utils.py
src/modalities/utils/benchmarking/sweep_utils.py
src/modalities/utils/profilers/__init__.py
src/modalities/utils/profilers/batch_generator.py
src/modalities/utils/profilers/modalities_profiler.py
src/modalities/utils/profilers/profiler_configs.py
src/modalities/utils/profilers/profiler_factory.py
src/modalities/utils/profilers/profilers.py
src/modalities/utils/profilers/steppable_component_configs.py
src/modalities/utils/profilers/steppable_components.py
src/modalities/utils/profilers/steppable_components_if.py
tests/test_evaluator.py
tests/test_gym.py
tests/test_initialization_fsdp1.py
tests/test_initialization_fsdpx.py
tests/test_loss_functions.py
tests/test_lr_scheduler.py
tests/test_main.py
tests/test_optimizer_factory.py
tests/test_rotary_qkv_transform.py
tests/test_tokenization.py
tests/test_torch_compile.py
tests/test_util.py
tests/test_weight_tying.py
tests/tests.py