LICENSE
MANIFEST.in
README.md
pyproject.toml
src/inferia/__init__.py
src/inferia/cli.py
src/inferia/cli_init.py
src/inferia/inferiadocs.py
src/inferia/startup_events.py
src/inferia/startup_ui.py
src/inferia/dashboard/Logo.png
src/inferia/dashboard/index.html
src/inferia/dashboard/logo.svg
src/inferia/dashboard/vite.svg
src/inferia/dashboard/assets/index-CnVpzT2b.css
src/inferia/dashboard/assets/index-qHEZv9BG.js
src/inferia/gateways/filtration_gateway/app.py
src/inferia/gateways/filtration_gateway/main.py
src/inferia/gateways/inference_gateway/__init__.py
src/inferia/gateways/inference_gateway/app.py
src/inferia/gateways/inference_gateway/client.py
src/inferia/gateways/inference_gateway/config.py
src/inferia/gateways/inference_gateway/main.py
src/inferia/gateways/inference_gateway/core/auth.py
src/inferia/gateways/inference_gateway/core/http_client.py
src/inferia/gateways/inference_gateway/core/orchestrator.py
src/inferia/gateways/inference_gateway/core/providers.py
src/inferia/gateways/inference_gateway/core/rate_limiter.py
src/inferia/gateways/inference_gateway/core/service.py
src/inferia/gateways/inference_gateway/core/stream_processor.py
src/inferia/gateways/orchestration_gateway/app.py
src/inferia/gateways/orchestration_gateway/config.py
src/inferia/gateways/orchestration_gateway/main.py
src/inferia/infra/schema/global_schema.sql
src/inferia/infra/schema/orchestration.sql
src/inferia/services/filtration/bootstrap_db.py
src/inferia/services/filtration/config.py
src/inferia/services/filtration/drop_db.py
src/inferia/services/filtration/models.py
src/inferia/services/filtration/reset_db.py
src/inferia/services/filtration/audit/__init__.py
src/inferia/services/filtration/audit/api_models.py
src/inferia/services/filtration/audit/router.py
src/inferia/services/filtration/audit/service.py
src/inferia/services/filtration/data/__init__.py
src/inferia/services/filtration/data/api_models.py
src/inferia/services/filtration/data/chunker.py
src/inferia/services/filtration/data/engine.py
src/inferia/services/filtration/data/parser.py
src/inferia/services/filtration/data/router.py
src/inferia/services/filtration/db/__init__.py
src/inferia/services/filtration/db/database.py
src/inferia/services/filtration/db/security.py
src/inferia/services/filtration/db/models/__init__.py
src/inferia/services/filtration/db/models/api_key.py
src/inferia/services/filtration/db/models/audit_log.py
src/inferia/services/filtration/db/models/deployment.py
src/inferia/services/filtration/db/models/inference_log.py
src/inferia/services/filtration/db/models/invitation.py
src/inferia/services/filtration/db/models/organization.py
src/inferia/services/filtration/db/models/policy.py
src/inferia/services/filtration/db/models/role.py
src/inferia/services/filtration/db/models/usage.py
src/inferia/services/filtration/db/models/user.py
src/inferia/services/filtration/db/models/user_organization.py
src/inferia/services/filtration/gateway/__init__.py
src/inferia/services/filtration/gateway/internal_middleware.py
src/inferia/services/filtration/gateway/middleware.py
src/inferia/services/filtration/gateway/rate_limiter.py
src/inferia/services/filtration/gateway/router.py
src/inferia/services/filtration/guardrail/__init__.py
src/inferia/services/filtration/guardrail/api_models.py
src/inferia/services/filtration/guardrail/config.py
src/inferia/services/filtration/guardrail/engine.py
src/inferia/services/filtration/guardrail/models.py
src/inferia/services/filtration/guardrail/pii_service.py
src/inferia/services/filtration/guardrail/providers/base.py
src/inferia/services/filtration/guardrail/providers/lakera_provider.py
src/inferia/services/filtration/guardrail/providers/llama_guard_provider.py
src/inferia/services/filtration/guardrail/providers/llm_guard_provider.py
src/inferia/services/filtration/management/__init__.py
src/inferia/services/filtration/management/api_keys.py
src/inferia/services/filtration/management/config.py
src/inferia/services/filtration/management/dependencies.py
src/inferia/services/filtration/management/deployments.py
src/inferia/services/filtration/management/knowledge_base.py
src/inferia/services/filtration/management/organizations.py
src/inferia/services/filtration/management/prompts.py
src/inferia/services/filtration/management/router.py
src/inferia/services/filtration/management/users.py
src/inferia/services/filtration/policy/__init__.py
src/inferia/services/filtration/policy/engine.py
src/inferia/services/filtration/prompt/__init__.py
src/inferia/services/filtration/prompt/engine.py
src/inferia/services/filtration/prompt/rewriter.py
src/inferia/services/filtration/prompt/templates.py
src/inferia/services/filtration/rbac/__init__.py
src/inferia/services/filtration/rbac/api_models.py
src/inferia/services/filtration/rbac/auth.py
src/inferia/services/filtration/rbac/authorization.py
src/inferia/services/filtration/rbac/initialization.py
src/inferia/services/filtration/rbac/middleware.py
src/inferia/services/filtration/rbac/mock_data.py
src/inferia/services/filtration/rbac/models.py
src/inferia/services/filtration/rbac/roles_router.py
src/inferia/services/filtration/rbac/router.py
src/inferia/services/filtration/rbac/users_router.py
src/inferia/services/filtration/schemas/auth.py
src/inferia/services/filtration/schemas/common.py
src/inferia/services/filtration/schemas/config.py
src/inferia/services/filtration/schemas/inference.py
src/inferia/services/filtration/schemas/knowledge_base.py
src/inferia/services/filtration/schemas/logging.py
src/inferia/services/filtration/schemas/management.py
src/inferia/services/filtration/schemas/prompt.py
src/inferia/services/filtration/tests/__init__.py
src/inferia/services/filtration/tests/conftest.py
src/inferia/services/filtration/tests/test_audit.py
src/inferia/services/filtration/tests/test_gateway.py
src/inferia/services/filtration/tests/test_guardrail_proceed.py
src/inferia/services/filtration/tests/test_integration.py
src/inferia/services/filtration/tests/test_rbac.py
src/inferia/services/filtration/tests/verify_advanced_linking.py
src/inferia/services/filtration/tests/verify_http_prompt_process.py
src/inferia/services/filtration/tests/verify_template_linking.py
src/inferia/services/orchestration/add_inference_model.py
src/inferia/services/orchestration/check_nosana_api.py
src/inferia/services/orchestration/fix_schema_constraints.py
src/inferia/services/orchestration/app/__init__.py
src/inferia/services/orchestration/app/nosana_cli.py
src/inferia/services/orchestration/app/infra/__init__.py
src/inferia/services/orchestration/app/infra/db.py
src/inferia/services/orchestration/app/infra/k8s_llmd_client.py
src/inferia/services/orchestration/app/infra/kafka_producer.py
src/inferia/services/orchestration/app/infra/redis_client.py
src/inferia/services/orchestration/app/infra/redis_event_bus.py
src/inferia/services/orchestration/app/infra/spot_reclaimer.py
src/inferia/services/orchestration/app/infra/test_setup.py
src/inferia/services/orchestration/app/provisioning/__init__.py
src/inferia/services/orchestration/app/provisioning/base.py
src/inferia/services/orchestration/app/provisioning/skypilot.py
src/inferia/services/orchestration/app/repositories/autoscaler_repo.py
src/inferia/services/orchestration/app/repositories/base_repo.py
src/inferia/services/orchestration/app/repositories/filtration_sync_repo.py
src/inferia/services/orchestration/app/repositories/inventory_repo.py
src/inferia/services/orchestration/app/repositories/job_repo.py
src/inferia/services/orchestration/app/repositories/model_deployment_repo.py
src/inferia/services/orchestration/app/repositories/model_registry_repo.py
src/inferia/services/orchestration/app/repositories/node_repo.py
src/inferia/services/orchestration/app/repositories/outbox_repo.py
src/inferia/services/orchestration/app/repositories/placement_repo.py
src/inferia/services/orchestration/app/repositories/pool_repo.py
src/inferia/services/orchestration/app/repositories/provider_repo.py
src/inferia/services/orchestration/app/repositories/quota_repo.py
src/inferia/services/orchestration/app/repositories/scheduler_repo.py
src/inferia/services/orchestration/app/services/__init__.py
src/inferia/services/orchestration/app/services/adapter_engine/__init__.py
src/inferia/services/orchestration/app/services/adapter_engine/base.py
src/inferia/services/orchestration/app/services/adapter_engine/engine.py
src/inferia/services/orchestration/app/services/adapter_engine/registry.py
src/inferia/services/orchestration/app/services/adapter_engine/service.py
src/inferia/services/orchestration/app/services/adapter_engine/types.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/akash/__init__.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/akash/akash_adapter.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/akash/sdl_builder.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/aws/__init__.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/aws/adapter.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/aws/aws_adapter.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/base/__init__.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/base/adapter.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/k8s/k8s_adapter.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/k8s/k8s_liveness.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/nosana/job_builder.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/nosana/nosana_adapter.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/skypilot/skypilot_adapter.py
src/inferia/services/orchestration/app/services/adapter_engine/adapters/skypilot/spec_builder.py
src/inferia/services/orchestration/app/services/autoscaler/worker.py
src/inferia/services/orchestration/app/services/compute_node/service.py
src/inferia/services/orchestration/app/services/compute_pool_engine/__init__.py
src/inferia/services/orchestration/app/services/compute_pool_engine/compute_pool_manager.py
src/inferia/services/orchestration/app/services/depin-sidecar/package.json
src/inferia/services/orchestration/app/services/depin-sidecar/tsconfig.json
src/inferia/services/orchestration/app/services/depin-sidecar/src/server.ts
src/inferia/services/orchestration/app/services/depin-sidecar/src/modules/akash/akash_service.ts
src/inferia/services/orchestration/app/services/depin-sidecar/src/modules/nosana/nosana_service.ts
src/inferia/services/orchestration/app/services/eventing/outbox_publisher.py
src/inferia/services/orchestration/app/services/inventory_manager/http.py
src/inferia/services/orchestration/app/services/inventory_manager/liveness.py
src/inferia/services/orchestration/app/services/inventory_manager/service.py
src/inferia/services/orchestration/app/services/llmd/spec_builder.py
src/inferia/services/orchestration/app/services/llmd_runtime/client.py
src/inferia/services/orchestration/app/services/llmd_runtime/health.py
src/inferia/services/orchestration/app/services/llmd_runtime/runtime.py
src/inferia/services/orchestration/app/services/llmd_runtime/spec.py
src/inferia/services/orchestration/app/services/model_deployment/controller.py
src/inferia/services/orchestration/app/services/model_deployment/deployment_server.py
src/inferia/services/orchestration/app/services/model_deployment/runtime_resolver.py
src/inferia/services/orchestration/app/services/model_deployment/service.py
src/inferia/services/orchestration/app/services/model_deployment/worker.py
src/inferia/services/orchestration/app/services/model_deployment/worker_main.py
src/inferia/services/orchestration/app/services/model_deployment/strategies/base.py
src/inferia/services/orchestration/app/services/model_deployment/strategies/llmd.py
src/inferia/services/orchestration/app/services/model_deployment/strategies/vllm.py
src/inferia/services/orchestration/app/services/model_registry/service.py
src/inferia/services/orchestration/app/services/node-agent/__init__.py
src/inferia/services/orchestration/app/services/node-agent/main.py
src/inferia/services/orchestration/app/services/node-agent/agent/__init__.py
src/inferia/services/orchestration/app/services/node-agent/agent/cpu.py
src/inferia/services/orchestration/app/services/node-agent/agent/gpu.py
src/inferia/services/orchestration/app/services/node-agent/agent/heartbeat.py
src/inferia/services/orchestration/app/services/node-agent/agent/memory.py
src/inferia/services/orchestration/app/services/nosana_runtime/client.py
src/inferia/services/orchestration/app/services/placement_engine/__init__.py
src/inferia/services/orchestration/app/services/placement_engine/scoring.py
src/inferia/services/orchestration/app/services/placement_engine/service.py
src/inferia/services/orchestration/app/services/scheduler/service.py
src/inferia/services/orchestration/app/services/traffic_router/__init__.py
src/inferia/services/orchestration/app/services/traffic_router/engine.py
src/inferia/services/orchestration/app/services/vllm_runtime/health.py
src/inferia/services/orchestration/app/services/vllm_runtime/process.py
src/inferia/services/orchestration/app/services/vllm_runtime/runtime.py
src/inferia/services/orchestration/app/shared/__init__.py
src/inferia/services/orchestration/app/v1/__init__.py
src/inferia/services/orchestration/app/v1/adapter_engine_pb2.py
src/inferia/services/orchestration/app/v1/adapter_engine_pb2_grpc.py
src/inferia/services/orchestration/app/v1/compute_node_pb2.py
src/inferia/services/orchestration/app/v1/compute_node_pb2_grpc.py
src/inferia/services/orchestration/app/v1/compute_pool_pb2.py
src/inferia/services/orchestration/app/v1/compute_pool_pb2_grpc.py
src/inferia/services/orchestration/app/v1/inventory_manager_pb2.py
src/inferia/services/orchestration/app/v1/inventory_manager_pb2_grpc.py
src/inferia/services/orchestration/app/v1/model_deployment_pb2.py
src/inferia/services/orchestration/app/v1/model_deployment_pb2_grpc.py
src/inferia/services/orchestration/app/v1/model_registry_pb2.py
src/inferia/services/orchestration/app/v1/model_registry_pb2_grpc.py
src/inferia/services/orchestration/app/v1/placement_engine_pb2.py
src/inferia/services/orchestration/app/v1/placement_engine_pb2_grpc.py
src/inferia/services/orchestration/app/v1/scheduler_pb2.py
src/inferia/services/orchestration/app/v1/scheduler_pb2_grpc.py
src/inferia/services/orchestration/app/v1/v1/compute_pool_pb2.py
src/inferia/services/orchestration/app/v1/v1/compute_pool_pb2_grpc.py
src/inferia/services/orchestration/app/workers/autoscaler_worker.py
src/inferia/services/orchestration/app/workers/deployment_worker.py
src/inferia/services/orchestration/app/workers/inventory_liveness_worker.py
src/inferia/services/orchestration/app/workers/outbox_worker.py
src/inferia/services/orchestration/app/workers/spot_reclaimer_worker.py
src/inferia/services/orchestration/test/aws_instance_specs.py
src/inferia/services/orchestration/test/test_aws_realtime_capacity.py
src/inferia/services/orchestration/test/test_grpc.py
src/inferia/services/orchestration/test/test_node_agent_heartbeat.py
src/inferia/services/orchestration/test/test_node_liveness.py
src/inferia/services/orchestration/test/test_traffic_router.py
src/inferia/services/orchestration/test/adapter_test/test_adapter_engine.py
src/inferia/services/orchestration/test/adapter_test/test_k8s_compute_e2e.py
src/inferia/services/orchestration/test/adapter_test/test_model_deploy.py
src/inferia/services/orchestration/test/adapter_test/test_model_deploy_nosana.py
src/inferia/services/orchestration/test/adapter_test/test_skypilot_adapter.py
src/inferia/services/orchestration/test/autoscaler/test_scale_down.py
src/inferia/services/orchestration/test/autoscaler/test_scale_up.py
src/inferia/services/orchestration/test/compute_pools_nodes/test_compute_node_grpc.py
src/inferia/services/orchestration/test/compute_pools_nodes/test_fake_adapter.py
src/inferia/services/orchestration/test/e2e/test_e2e_control_plane.py
src/inferia/services/orchestration/test/gang/test_gang_concurrency.py
src/inferia/services/orchestration/test/gang/test_gang_insufficient_capacity.py
src/inferia/services/orchestration/test/gang/test_gang_success.py
src/inferia/services/orchestration/test/integration/test_control_plane_e2e.py
src/inferia/services/orchestration/test/model_deployment/test_model_deployment_e2e.py
src/inferia/services/orchestration/test/model_registry/test_model_registry.py
src/inferia/services/orchestration/test/placement_test/test_placement_engine.py
src/inferia/services/orchestration/test/provisioning/__init__.py
src/inferia/services/orchestration/test/provisioning/test_skypilot_provisioner.py
src/inferia/services/orchestration/test/quota/_setup.py
src/inferia/services/orchestration/test/quota/test_billing_events.py
src/inferia/services/orchestration/test/quota/test_hard_quota.py
src/inferia/services/orchestration/test/quota/test_quota_preemption.py
src/inferia/services/orchestration/test/quota/test_quota_release.py
src/inferia/services/orchestration/test/scheduler/test_concurrency.py
src/inferia/services/orchestration/test/spot/test_spot_allocation.py
src/inferia/services/orchestration/test/spot/test_spot_reclaim.py
src/inferia/services/orchestration/test/spot/test_spot_vs_ondemand.py
src/inferia/services/orchestration/test/test_inventory/send_heartbeat.py
src/inferiallm.egg-info/PKG-INFO
src/inferiallm.egg-info/SOURCES.txt
src/inferiallm.egg-info/dependency_links.txt
src/inferiallm.egg-info/entry_points.txt
src/inferiallm.egg-info/requires.txt
src/inferiallm.egg-info/top_level.txt