.gitignore
.pre-commit-config.yaml
.readthedocs.yaml
CLAUDE.md
README.md
pyproject.toml
requirements.txt
uv.lock
.github/pull_request_template.md
.github/ISSUE_TEMPLATE/1-bug-report.md
.github/ISSUE_TEMPLATE/2-feature-request.md
.github/workflows/lint.yml
cicd/README.md
cicd/run_traincicd.sh
docs/Makefile
docs/README.md
docs/conf.py
docs/index.rst
docs/requirements.txt
docs/developer_guide/index.rst
docs/developer_guide/new_dataset_guide.md
docs/developer_guide/new_model_guide.md
docs/developer_guide/new_processor_guide.md
docs/developer_guide/new_trainer_guide.md
docs/getting_started/index.rst
docs/getting_started/introduction.rst
docs/getting_started/quick_start.rst
docs/getting_started/train.md
docs/models/bagel.md
docs/models/index.rst
docs/models/qwenvl.md
docs/reference/api.md
docs/reference/design_principle.md
docs/reference/index.rst
docs/reference/video_configuration.md
docs/user_guide/data_prep.md
docs/user_guide/datasets.md
docs/user_guide/index.rst
docs/user_guide/peak_perf.md
examples/load_from_config_example.yaml
examples/load_from_pretrained_example.yaml
examples/run.sh
examples/bagel/example_config.yaml
examples/bagel/run.sh
examples/dgn/run.sh
examples/dgn/train_dgn_1b.yaml
examples/diffusion_language_model/README.md
examples/diffusion_language_model/dllm_train_adam_multi_gpu_deepspeed.yaml
examples/diffusion_language_model/dllm_train_muon_multi_gpu_fsdp2.yaml
examples/diffusion_language_model/dllm_train_muon_single_gpu.yaml
examples/diffusion_language_model/run.sh
examples/diffusion_language_model/run_multigpu.sh
examples/ds_config/default_config.json
examples/qwen2_5_llm/example_config.yaml
examples/qwen2_5_llm/run.sh
examples/qwen2_5_omni/example_config.yaml
examples/qwen2_5_omni/run.sh
examples/qwen2_5_vl/example_config.yaml
examples/qwen2_5_vl/run.sh
examples/qwen3_vl/example_config.yaml
examples/qwen3_vl/qwen3_vl_8b_train.sh
examples/qwen3_vl/run.sh
examples/representation_autoencoder/reconstruct.py
examples/representation_autoencoder/run.sh
examples/representation_autoencoder/run_rae.sh
examples/scalable_interpolant_transformer/README.md
examples/scalable_interpolant_transformer/run.sh
examples/scalable_interpolant_transformer/sit_xl_2.yaml
examples/scalable_interpolant_transformer/verify_setup.py
examples/wanvideo/README.md
examples/wanvideo/run.sh
examples/wanvideo/configs/wan2.2_ti2v_5b_from_pretrained.yaml
examples/wanvideo/configs/wan2.2_ti2v_5b_from_scratch.yaml
src/lmms_engine/__init__.py
src/lmms_engine/mapping_func.py
src/lmms_engine.egg-info/PKG-INFO
src/lmms_engine.egg-info/SOURCES.txt
src/lmms_engine.egg-info/dependency_links.txt
src/lmms_engine.egg-info/entry_points.txt
src/lmms_engine.egg-info/requires.txt
src/lmms_engine.egg-info/top_level.txt
src/lmms_engine/datasets/__init__.py
src/lmms_engine/datasets/config.py
src/lmms_engine/datasets/multimodal_mixin.py
src/lmms_engine/datasets/collator/__init__.py
src/lmms_engine/datasets/collator/bagel_collator.py
src/lmms_engine/datasets/collator/text_dllm_collator.py
src/lmms_engine/datasets/collator/vision_collator.py
src/lmms_engine/datasets/iterable/__init__.py
src/lmms_engine/datasets/iterable/bagel_iterable_dataset.py
src/lmms_engine/datasets/iterable/base_iterable_dataset.py
src/lmms_engine/datasets/iterable/fineweb_edu_dataset.py
src/lmms_engine/datasets/iterable/multimodal_iterable_dataset.py
src/lmms_engine/datasets/iterable/qwen3_vl_iterable_dataset.py
src/lmms_engine/datasets/iterable/vision_iterable_dataset.py
src/lmms_engine/datasets/naive/__init__.py
src/lmms_engine/datasets/naive/base_dataset.py
src/lmms_engine/datasets/naive/multimodal_dataset.py
src/lmms_engine/datasets/naive/qwen_omni_dataset.py
src/lmms_engine/datasets/naive/rae_dataset.py
src/lmms_engine/datasets/naive/sit_dataset.py
src/lmms_engine/datasets/naive/vision_audio_dataset.py
src/lmms_engine/datasets/naive/vision_dataset.py
src/lmms_engine/datasets/processor/__init__.py
src/lmms_engine/datasets/processor/aero_processor.py
src/lmms_engine/datasets/processor/bagel_processor.py
src/lmms_engine/datasets/processor/base_qwen2_5_processor.py
src/lmms_engine/datasets/processor/config.py
src/lmms_engine/datasets/processor/llava_processor.py
src/lmms_engine/datasets/processor/pure_text_processor.py
src/lmms_engine/datasets/processor/qwen2_5_omni_processor.py
src/lmms_engine/datasets/processor/qwen2_5_vl_processor.py
src/lmms_engine/datasets/processor/qwen2_processor.py
src/lmms_engine/datasets/processor/qwen2_vl_processor.py
src/lmms_engine/datasets/processor/qwen3_vl_processor.py
src/lmms_engine/datasets/processor/rae_processor.py
src/lmms_engine/datasets/processor/sit_processor.py
src/lmms_engine/datasets/processor/wanvideo_processor.py
src/lmms_engine/launch/__init__.py
src/lmms_engine/launch/cli.py
src/lmms_engine/launch/config/default_config.yaml
src/lmms_engine/models/__init__.py
src/lmms_engine/models/config.py
src/lmms_engine/models/monkey_patch.py
src/lmms_engine/models/sequence_packing_utils.py
src/lmms_engine/models/utils.py
src/lmms_engine/models/aero/__init__.py
src/lmms_engine/models/aero/aero_ops.py
src/lmms_engine/models/aero/configuration_aero.py
src/lmms_engine/models/aero/modeling_aero.py
src/lmms_engine/models/aero/monkey_patch.py
src/lmms_engine/models/aero/processing_aero.py
src/lmms_engine/models/bagel/__init__.py
src/lmms_engine/models/bagel/autoencoder.py
src/lmms_engine/models/bagel/bagel.py
src/lmms_engine/models/bagel/cache_utils.py
src/lmms_engine/models/bagel/data_utils.py
src/lmms_engine/models/bagel/modeling_utils.py
src/lmms_engine/models/bagel/monkey_patch.py
src/lmms_engine/models/bagel/nsa_op.py
src/lmms_engine/models/bagel/qwen2_navit.py
src/lmms_engine/models/bagel/siglip_navit.py
src/lmms_engine/models/bagel/transforms.py
src/lmms_engine/models/bagel/qwen2/__init__.py
src/lmms_engine/models/bagel/qwen2/configuration_qwen2.py
src/lmms_engine/models/bagel/qwen2/modeling_qwen2.py
src/lmms_engine/models/bagel/qwen2/tokenization_qwen2.py
src/lmms_engine/models/bagel/qwen2/tokenization_qwen2_fast.py
src/lmms_engine/models/bagel/siglip/__init__.py
src/lmms_engine/models/bagel/siglip/configuration_siglip.py
src/lmms_engine/models/bagel/siglip/convert_siglip_to_hf.py
src/lmms_engine/models/bagel/siglip/image_processing_siglip.py
src/lmms_engine/models/bagel/siglip/modeling_siglip.py
src/lmms_engine/models/bagel/siglip/processing_siglip.py
src/lmms_engine/models/bagel/siglip/tokenization_siglip.py
src/lmms_engine/models/llava_onevision/__init__.py
src/lmms_engine/models/llava_onevision/llava_ov_liger.py
src/lmms_engine/models/llava_onevision/monkey_patch.py
src/lmms_engine/models/qwen2/__init__.py
src/lmms_engine/models/qwen2/monkey_patch.py
src/lmms_engine/models/qwen2/qwen2_liger.py
src/lmms_engine/models/qwen2/qwen2_ops.py
src/lmms_engine/models/qwen2_5_omni/__init__.py
src/lmms_engine/models/qwen2_5_omni/monkey_patch.py
src/lmms_engine/models/qwen2_5_omni/qwen2_5_omni_liger.py
src/lmms_engine/models/qwen2_5_omni/qwen2_5_omni_ops.py
src/lmms_engine/models/qwen2_5_vl/__init__.py
src/lmms_engine/models/qwen2_5_vl/monkey_patch.py
src/lmms_engine/models/qwen2_5_vl/qwen2_5_vl_liger.py
src/lmms_engine/models/qwen2_5_vl/qwen2_5_vl_ops.py
src/lmms_engine/models/qwen2_audio/__init__.py
src/lmms_engine/models/qwen2_audio/monkey_patch.py
src/lmms_engine/models/qwen2_audio/qwen2_audio_ops.py
src/lmms_engine/models/qwen3_dllm/__init__.py
src/lmms_engine/models/qwen3_dllm/configuration_qwen3_dllm.py
src/lmms_engine/models/qwen3_dllm/modeling_qwen3_dllm.py
src/lmms_engine/models/qwen3_vl/__init__.py
src/lmms_engine/models/qwen3_vl/monkey_patch.py
src/lmms_engine/models/qwen3_vl/qwen3_vl_liger.py
src/lmms_engine/models/qwen3_vl/qwen3_vl_ops.py
src/lmms_engine/models/rae_siglip/__init__.py
src/lmms_engine/models/rae_siglip/configuration_rae_siglip.py
src/lmms_engine/models/rae_siglip/diffaug.py
src/lmms_engine/models/rae_siglip/discriminator.py
src/lmms_engine/models/rae_siglip/general_decoder.py
src/lmms_engine/models/rae_siglip/lpips.py
src/lmms_engine/models/rae_siglip/lpips_utils.py
src/lmms_engine/models/rae_siglip/modeling_rae_siglip.py
src/lmms_engine/models/sit/__init__.py
src/lmms_engine/models/sit/_imports.py
src/lmms_engine/models/sit/configuration_sit.py
src/lmms_engine/models/sit/modeling_sit.py
src/lmms_engine/models/sit/models.py
src/lmms_engine/models/sit/transport/__init__.py
src/lmms_engine/models/sit/transport/integrators.py
src/lmms_engine/models/sit/transport/path.py
src/lmms_engine/models/sit/transport/transport.py
src/lmms_engine/models/sit/transport/utils.py
src/lmms_engine/models/wanvideo/__init__.py
src/lmms_engine/models/wanvideo/configuration_wanvideo.py
src/lmms_engine/models/wanvideo/modeling_wanvideo.py
src/lmms_engine/models/wanvideo/modeling_wanvideo_legacy.py
src/lmms_engine/models/wanvideo/processing_wanvideo.py
src/lmms_engine/models/wanvideo/wan_video_camera_controller.py
src/lmms_engine/models/wanvideo/wan_video_dit.py
src/lmms_engine/models/wanvideo/wan_video_image_encoder.py
src/lmms_engine/models/wanvideo/wan_video_motion_controller.py
src/lmms_engine/models/wanvideo/wan_video_scheduler.py
src/lmms_engine/models/wanvideo/wan_video_text_encoder.py
src/lmms_engine/models/wanvideo/wan_video_vace.py
src/lmms_engine/models/wanvideo/wan_video_vae.py
src/lmms_engine/parallel/process_group_manager.py
src/lmms_engine/parallel/sequence_parallel/ulysses.py
src/lmms_engine/protocol/__init__.py
src/lmms_engine/protocol/args.py
src/lmms_engine/protocol/data_proto.py
src/lmms_engine/protocol/lmms_proto.py
src/lmms_engine/train/__init__.py
src/lmms_engine/train/config.py
src/lmms_engine/train/registry.py
src/lmms_engine/train/runner.py
src/lmms_engine/train/fsdp2/__init__.py
src/lmms_engine/train/fsdp2/fsdp2_trainer.py
src/lmms_engine/train/fsdp2/rae_trainer.py
src/lmms_engine/train/fsdp2/sit_trainer.py
src/lmms_engine/train/hf/__init__.py
src/lmms_engine/train/hf/dllm_trainer.py
src/lmms_engine/train/hf/trainer.py
src/lmms_engine/train/hf/wan_trainer.py
src/lmms_engine/utils/__init__.py
src/lmms_engine/utils/config_loader.py
src/lmms_engine/utils/data_utils.py
src/lmms_engine/utils/fsdp2_utils.py
src/lmms_engine/utils/imports.py
src/lmms_engine/utils/logging_utils.py
src/lmms_engine/utils/muon_utils.py
src/lmms_engine/utils/profiler.py
src/lmms_engine/utils/tracking.py
src/lmms_engine/utils/train_utils.py
test/run_suite.py
test/utils.py
test/dataset/test_data_proto.py
test/dataset/test_preference_data.py
test/dataset/test_vision_audio_data.py
test/dataset/test_vision_data.py
test/models/test_import_models.py
test/train/run_cicd.py
test/train/utils.py
test/train/bagel/__init__.py
test/train/bagel/test_bagel.py
test/train/bagel/train_bagel.py
test/train/llava_onevision/__init__.py
test/train/llava_onevision/test_llava_onevision.py
test/train/llava_onevision/train_llava_onevision.py
test/train/qwen2_5/__init__.py
test/train/qwen2_5/test_qwen2_5.py
test/train/qwen2_5/train_qwen2_5.py
test/train/qwen2_5/train_qwen2_5_iterable.py
test/train/qwen2_5/train_qwen2_5_sp.py
test/train/qwen2_5_vl/__init__.py
test/train/qwen2_5_vl/test_qwen2_5_vl.py
test/train/qwen2_5_vl/train_qwen2_5_vl.py
test/train/qwen2_5_vl/train_qwen2_5_vl_sp.py
test/train/qwen3_vl/__init__.py
test/train/qwen3_vl/test_qwen3_vl.py
test/train/qwen3_vl/train_qwen3_vl.py
test/utils/test_utils.py
tools/configure_envs.sh
tools/create_hf_dataset.py
tools/create_json_dataset.py
tools/merge_fsdp.py
tools/prepare_qwen_2_5_kino.py
tools/check_data/check_dataset_tokens.py
tools/check_data/check_dataset_tokens_cloud.py
tools/check_data/check_dataset_yaml.py
tools/check_data/precompute_tokens.py
tools/check_data/precompute_tokens_cloud.py
tools/check_data/precompute_tokens_inline.py
tools/create_data/musiccaps_gpt4o.py
tools/create_data/split_jsonlines.py
tools/create_data/prompt/conversation.txt
tools/generate_config/generate_default_yaml.py
tools/generate_config/generate_default_yaml.sh
tools/prepare_init_weight/convert_maas_to_hf.py
tools/prepare_init_weight/merge_kino_adapter.py
tools/prepare_init_weight/prepare_aero.py
tools/prepare_init_weight/prepare_aero_omni.py
tools/prepare_init_weight/prepare_kino_lora.py
tools/prepare_init_weight/prepare_mistral3_audio.py
tools/prepare_init_weight/prepare_qwen_2_5_kino.py
tools/prepare_init_weight/prepare_rae_siglip2.py