.gitignore
.pre-commit-config.yaml
.readthedocs.yaml
.shellcheckrc
.yapfignore
CODE_OF_CONDUCT.md
CONTRIBUTING.md
DCO
LICENSE
README.md
RELEASING.md
_local_envs_for_test.sh
format.sh
mkdocs.yaml
pyproject.toml
uv.lock
.github/CODEOWNERS
.github/pull_request_template.md
.github/ISSUE_TEMPLATE/bug-report.yml
.github/ISSUE_TEMPLATE/config.yml
.github/ISSUE_TEMPLATE/feature-request.yml
.github/ISSUE_TEMPLATE/rfc.yml
.github/actions/free-up-disk-space/action.yml
.github/workflows/add_label_automerge.yml
.github/workflows/build_and_publish.yaml
.github/workflows/build_docker.yml
.github/workflows/check_uv_lock.yml
.github/workflows/lint_scripts.yml
.github/workflows/pre-commit.yml
.github/workflows/publish_to_test_pypi.yaml
.github/workflows/reminder_comment.yml
.github/workflows/stale.yml
.github/workflows/test.yml
.github/workflows/matchers/ruff.json
docker/.senlib.json
docker/Dockerfile.amd64
docker/simple_vllm_serve.sh
docs/.nav.yml
docs/README.md
docs/requirements-docs.txt
docs/contributing/README.md
docs/contributing/architecture.md
docs/contributing/maintaining.md
docs/contributing/images/vllm_v1.svg
docs/contributing/images/vllm_v1_spyre.svg
docs/contributing/multimodal/adding_new_models.md
docs/deploying/docker.md
docs/deploying/k8s.md
docs/deploying/rhoai.md
docs/getting_started/installation.md
docs/mkdocs/hooks/generate_examples.py
docs/mkdocs/hooks/generate_model_tables.py
docs/mkdocs/hooks/url_schemes.py
docs/mkdocs/overrides/main.html
docs/roadmaps/q3-2025.md
docs/user_guide/configuration.md
docs/user_guide/env_vars.md
docs/user_guide/supported_features.md
docs/user_guide/supported_models.md
examples/offline_inference/long_context.py
examples/offline_inference/text_inference.py
examples/offline_inference/vision_inference.py
examples/online_inference/openai_spyre_text.py
examples/online_inference/openai_spyre_vision.py
examples/online_inference/spyre_vllm_benchmark.py
examples/online_inference/spyre_vllm_setup_container.sh
sendnn_inference/__init__.py
sendnn_inference/_version.py
sendnn_inference/argparse_utils.py
sendnn_inference/compat_utils.py
sendnn_inference/compilation_utils.py
sendnn_inference/envs.py
sendnn_inference/perf_metrics.py
sendnn_inference/platform.py
sendnn_inference/utils.py
sendnn_inference.egg-info/PKG-INFO
sendnn_inference.egg-info/SOURCES.txt
sendnn_inference.egg-info/dependency_links.txt
sendnn_inference.egg-info/entry_points.txt
sendnn_inference.egg-info/requires.txt
sendnn_inference.egg-info/top_level.txt
sendnn_inference/config/README.md
sendnn_inference/config/__init__.py
sendnn_inference/config/model_config.py
sendnn_inference/config/model_configs.yaml
sendnn_inference/config/model_matcher.py
sendnn_inference/config/model_registry.py
sendnn_inference/config/configurators/__init__.py
sendnn_inference/config/configurators/model_configurator.py
sendnn_inference/model_executor/__init__.py
sendnn_inference/model_executor/model_loader/__init__.py
sendnn_inference/model_executor/model_loader/spyre.py
sendnn_inference/model_executor/model_loader/spyre_setup.py
sendnn_inference/multimodal/__init__.py
sendnn_inference/multimodal/mm_mappings/__init__.py
sendnn_inference/multimodal/mm_mappings/base.py
sendnn_inference/multimodal/mm_mappings/llava_next.py
sendnn_inference/multimodal/mm_mappings/mistral3.py
sendnn_inference/v1/__init__.py
sendnn_inference/v1/core/__init__.py
sendnn_inference/v1/core/scheduler.py
sendnn_inference/v1/metrics/__init__.py
sendnn_inference/v1/metrics/stats_logger.py
sendnn_inference/v1/sample/golden_token_injector.py
sendnn_inference/v1/sample/spyre_logits_processor.py
sendnn_inference/v1/worker/__init__.py
sendnn_inference/v1/worker/spyre_input_batch.py
sendnn_inference/v1/worker/spyre_model_runner.py
sendnn_inference/v1/worker/spyre_worker.py
tests/conftest.py
tests/download_model_configs.py
tests/hf_cache.json
tests/hf_result_cache.py
tests/llm_cache.py
tests/llm_cache_util.py
tests/output_util.py
tests/scheduling_utils.py
tests/spyre_util.py
tests/aftu/graph_compare_utils.py
tests/aftu/test_compare_graphs.py
tests/config/__init__.py
tests/config/conftest.py
tests/config/test_env_config_path.py
tests/config/test_error_handling.py
tests/config/test_integration.py
tests/config/test_model_config.py
tests/config/test_model_configurator.py
tests/config/test_model_matcher.py
tests/config/test_model_registry.py
tests/config/fixtures/test_error_handling_models.yaml
tests/e2e/test_chunked_prefill.py
tests/e2e/test_chunked_prefill_tkv_steps.py
tests/e2e/test_logits_processors.py
tests/e2e/test_profiler.py
tests/e2e/test_sampling_params.py
tests/e2e/test_spyre_async_llm.py
tests/e2e/test_spyre_basic.py
tests/e2e/test_spyre_cp_scheduler_steps.py
tests/e2e/test_spyre_embeddings.py
tests/e2e/test_spyre_mm.py
tests/e2e/test_spyre_online.py
tests/e2e/test_spyre_pc_scheduler_steps.py
tests/e2e/test_spyre_scoring.py
tests/e2e/test_spyre_seed.py
tests/e2e/test_spyre_stagger_basic.py
tests/e2e/test_stats_logger.py
tests/e2e/test_structured_outputs.py
tests/fixtures/model_configs/BAAI/bge-reranker-large/config.json
tests/fixtures/model_configs/BAAI/bge-reranker-v2-m3/config.json
tests/fixtures/model_configs/ibm-ai-platform/micro-g3.3-8b-instruct-1b/config.json
tests/fixtures/model_configs/ibm-granite/granite-3.3-8b-instruct/config.json
tests/fixtures/model_configs/ibm-granite/granite-3.3-8b-instruct-FP8/config.json
tests/fixtures/model_configs/ibm-granite/granite-4-8b-dense/config.json
tests/fixtures/model_configs/ibm-granite/granite-4-8b-dense-hybrid/config.json
tests/fixtures/model_configs/ibm-granite/granite-embedding-125m-english/config.json
tests/fixtures/model_configs/ibm-granite/granite-embedding-278m-multilingual/config.json
tests/fixtures/model_configs/intfloat/multilingual-e5-large/config.json
tests/fixtures/model_configs/sentence-transformers/all-roberta-large-v1/config.json
tests/model_loader/test_spyre.py
tests/multimodal/test_llava_next.py
tests/multimodal/test_mistral3.py
tests/precompilation/test_disable_compilation.py
tests/utils/test_cli_args.py
tests/utils/test_envs.py
tests/utils/test_golden_token_injector.py
tests/utils/test_platform_validation.py
tests/utils/test_spyre_model_list.py
tests/utils/test_upstream_compatibility.py
tests/utils/bge_copy/config.json
tests/v1/core/test_scheduler_structured_outputs.py
tests/v1/worker/mock_model.py
tests/v1/worker/test_prefix_caching_worker.py
tests/v1/worker/test_scheduler_tkv_limits.py
tests/v1/worker/test_spyre_input_batch.py
tests/v1/worker/test_spyre_worker_profile.py
tools/check_aiu.sh
tools/check_repo.sh
tools/download_model.py
tools/lint_scripts.sh