LICENSE
MANIFEST.in
README.md
pyproject.toml
src/inferia/__init__.py
src/inferia/cli.py
src/inferia/cli_init.py
src/inferia/inferiadocs.py
src/inferia/startup_events.py
src/inferia/startup_ui.py
src/inferia/common/__init__.py
src/inferia/common/app_setup.py
src/inferia/common/circuit_breaker.py
src/inferia/common/config_manager.py
src/inferia/common/errors.py
src/inferia/common/exception_handlers.py
src/inferia/common/http_client.py
src/inferia/common/logger.py
src/inferia/common/middleware.py
src/inferia/common/model_types.py
src/inferia/common/pagination.py
src/inferia/common/rate_limit.py
src/inferia/common/schemas/__init__.py
src/inferia/common/schemas/chat.py
src/inferia/common/schemas/common.py
src/inferia/common/schemas/data.py
src/inferia/common/schemas/embeddings.py
src/inferia/common/schemas/guardrail.py
src/inferia/common/schemas/prompt.py
src/inferia/dashboard/Logo.png
src/inferia/dashboard/config.js
src/inferia/dashboard/index.html
src/inferia/dashboard/logo.svg
src/inferia/dashboard/vite.svg
src/inferia/dashboard/assets/InsightsCharts-DWTNY39M.js
src/inferia/dashboard/assets/index-BoPyI3qg.css
src/inferia/dashboard/assets/index-CpU4VF4k.js
src/inferia/infra/schema/global_schema.sql
src/inferia/infra/schema/migrations/20250218_add_model_type.sql
src/inferia/infra/schema/migrations/20260212_add_inference_logs_ip.sql
src/inferia/services/api_gateway/app.py
src/inferia/services/api_gateway/bootstrap_db.py
src/inferia/services/api_gateway/config.py
src/inferia/services/api_gateway/main.py
src/inferia/services/api_gateway/models.py
src/inferia/services/api_gateway/audit/__init__.py
src/inferia/services/api_gateway/audit/router.py
src/inferia/services/api_gateway/audit/service.py
src/inferia/services/api_gateway/db/__init__.py
src/inferia/services/api_gateway/db/database.py
src/inferia/services/api_gateway/db/security.py
src/inferia/services/api_gateway/db/models/__init__.py
src/inferia/services/api_gateway/db/models/api_key.py
src/inferia/services/api_gateway/db/models/audit_log.py
src/inferia/services/api_gateway/db/models/deployment.py
src/inferia/services/api_gateway/db/models/inference_log.py
src/inferia/services/api_gateway/db/models/invitation.py
src/inferia/services/api_gateway/db/models/organization.py
src/inferia/services/api_gateway/db/models/policy.py
src/inferia/services/api_gateway/db/models/role.py
src/inferia/services/api_gateway/db/models/system_setting.py
src/inferia/services/api_gateway/db/models/usage.py
src/inferia/services/api_gateway/db/models/user.py
src/inferia/services/api_gateway/db/models/user_organization.py
src/inferia/services/api_gateway/gateway/__init__.py
src/inferia/services/api_gateway/gateway/health_routes.py
src/inferia/services/api_gateway/gateway/http_client.py
src/inferia/services/api_gateway/gateway/internal_middleware.py
src/inferia/services/api_gateway/gateway/middleware.py
src/inferia/services/api_gateway/gateway/proxy_routes.py
src/inferia/services/api_gateway/gateway/rate_limiter.py
src/inferia/services/api_gateway/gateway/router.py
src/inferia/services/api_gateway/management/__init__.py
src/inferia/services/api_gateway/management/api_keys.py
src/inferia/services/api_gateway/management/config_manager.py
src/inferia/services/api_gateway/management/configuration.py
src/inferia/services/api_gateway/management/dependencies.py
src/inferia/services/api_gateway/management/deployments.py
src/inferia/services/api_gateway/management/insights.py
src/inferia/services/api_gateway/management/knowledge_base.py
src/inferia/services/api_gateway/management/organizations.py
src/inferia/services/api_gateway/management/prompts.py
src/inferia/services/api_gateway/management/router.py
src/inferia/services/api_gateway/management/users.py
src/inferia/services/api_gateway/policy/__init__.py
src/inferia/services/api_gateway/policy/engine.py
src/inferia/services/api_gateway/prompt/__init__.py
src/inferia/services/api_gateway/prompt/templates.py
src/inferia/services/api_gateway/rbac/__init__.py
src/inferia/services/api_gateway/rbac/auth.py
src/inferia/services/api_gateway/rbac/authorization.py
src/inferia/services/api_gateway/rbac/initialization.py
src/inferia/services/api_gateway/rbac/middleware.py
src/inferia/services/api_gateway/rbac/mock_data.py
src/inferia/services/api_gateway/rbac/models.py
src/inferia/services/api_gateway/rbac/roles_router.py
src/inferia/services/api_gateway/rbac/router.py
src/inferia/services/api_gateway/rbac/users_router.py
src/inferia/services/api_gateway/schemas/auth.py
src/inferia/services/api_gateway/schemas/common.py
src/inferia/services/api_gateway/schemas/config.py
src/inferia/services/api_gateway/schemas/inference.py
src/inferia/services/api_gateway/schemas/insights.py
src/inferia/services/api_gateway/schemas/knowledge_base.py
src/inferia/services/api_gateway/schemas/logging.py
src/inferia/services/api_gateway/schemas/management.py
src/inferia/services/api_gateway/schemas/prompt.py
src/inferia/services/api_gateway/security/encryption.py
src/inferia/services/api_gateway/tests/__init__.py
src/inferia/services/api_gateway/tests/conftest.py
src/inferia/services/api_gateway/tests/test_audit.py
src/inferia/services/api_gateway/tests/test_gateway.py
src/inferia/services/api_gateway/tests/test_guardrail_proceed.py
src/inferia/services/api_gateway/tests/test_integration.py
src/inferia/services/api_gateway/tests/test_management_insights.py
src/inferia/services/api_gateway/tests/test_rbac.py
src/inferia/services/api_gateway/tests/verify_advanced_linking.py
src/inferia/services/api_gateway/tests/verify_http_prompt_process.py
src/inferia/services/api_gateway/tests/verify_template_linking.py
src/inferia/services/data/__init__.py
src/inferia/services/data/api_models.py
src/inferia/services/data/app.py
src/inferia/services/data/chunker.py
src/inferia/services/data/config.py
src/inferia/services/data/config_manager.py
src/inferia/services/data/engine.py
src/inferia/services/data/main.py
src/inferia/services/data/middleware.py
src/inferia/services/data/parser.py
src/inferia/services/data/prompt_engine.py
src/inferia/services/data/prompt_rewriter.py
src/inferia/services/data/prompt_templates.py
src/inferia/services/data/router.py
src/inferia/services/guardrail/__init__.py
src/inferia/services/guardrail/api_models.py
src/inferia/services/guardrail/app.py
src/inferia/services/guardrail/config.py
src/inferia/services/guardrail/config_manager.py
src/inferia/services/guardrail/engine.py
src/inferia/services/guardrail/main.py
src/inferia/services/guardrail/middleware.py
src/inferia/services/guardrail/models.py
src/inferia/services/guardrail/pii_service.py
src/inferia/services/guardrail/providers/base.py
src/inferia/services/guardrail/providers/lakera_provider.py
src/inferia/services/guardrail/providers/llama_guard_provider.py
src/inferia/services/guardrail/providers/llm_guard_provider.py
src/inferia/services/inference/__init__.py
src/inferia/services/inference/app.py
src/inferia/services/inference/client.py
src/inferia/services/inference/config.py
src/inferia/services/inference/main.py
src/inferia/services/inference/core/__init__.py
src/inferia/services/inference/core/auth.py
src/inferia/services/inference/core/concurrency_limiter.py
src/inferia/services/inference/core/http_client.py
src/inferia/services/inference/core/orchestrator.py
src/inferia/services/inference/core/providers.py
src/inferia/services/inference/core/rate_limiter.py
src/inferia/services/inference/core/service.py
src/inferia/services/inference/core/stream_processor.py
src/inferia/services/orchestration/__init__.py
src/inferia/services/orchestration/config.py
src/inferia/services/orchestration/constants.py
src/inferia/services/orchestration/main.py
src/inferia/services/orchestration/middleware.py
src/inferia/services/orchestration/server.py
src/inferia/services/orchestration/infra/__init__.py
src/inferia/services/orchestration/infra/db.py
src/inferia/services/orchestration/infra/k8s_llmd_client.py
src/inferia/services/orchestration/infra/kafka_producer.py
src/inferia/services/orchestration/infra/redis_client.py
src/inferia/services/orchestration/infra/redis_event_bus.py
src/inferia/services/orchestration/infra/spot_reclaimer.py
src/inferia/services/orchestration/provisioning/__init__.py
src/inferia/services/orchestration/provisioning/base.py
src/inferia/services/orchestration/provisioning/skypilot.py
src/inferia/services/orchestration/repositories/api_gateway_sync_repo.py
src/inferia/services/orchestration/repositories/autoscaler_repo.py
src/inferia/services/orchestration/repositories/base_repo.py
src/inferia/services/orchestration/repositories/inventory_repo.py
src/inferia/services/orchestration/repositories/job_repo.py
src/inferia/services/orchestration/repositories/model_deployment_repo.py
src/inferia/services/orchestration/repositories/model_registry_repo.py
src/inferia/services/orchestration/repositories/node_repo.py
src/inferia/services/orchestration/repositories/outbox_repo.py
src/inferia/services/orchestration/repositories/placement_repo.py
src/inferia/services/orchestration/repositories/pool_repo.py
src/inferia/services/orchestration/repositories/provider_repo.py
src/inferia/services/orchestration/repositories/quota_repo.py
src/inferia/services/orchestration/repositories/scheduler_repo.py
src/inferia/services/orchestration/services/__init__.py
src/inferia/services/orchestration/services/adapter_engine/__init__.py
src/inferia/services/orchestration/services/adapter_engine/base.py
src/inferia/services/orchestration/services/adapter_engine/engine.py
src/inferia/services/orchestration/services/adapter_engine/registry.py
src/inferia/services/orchestration/services/adapter_engine/service.py
src/inferia/services/orchestration/services/adapter_engine/types.py
src/inferia/services/orchestration/services/adapter_engine/adapters/akash/__init__.py
src/inferia/services/orchestration/services/adapter_engine/adapters/akash/akash_adapter.py
src/inferia/services/orchestration/services/adapter_engine/adapters/akash/sdl_builder.py
src/inferia/services/orchestration/services/adapter_engine/adapters/aws/__init__.py
src/inferia/services/orchestration/services/adapter_engine/adapters/aws/adapter.py
src/inferia/services/orchestration/services/adapter_engine/adapters/aws/aws_adapter.py
src/inferia/services/orchestration/services/adapter_engine/adapters/base/__init__.py
src/inferia/services/orchestration/services/adapter_engine/adapters/base/adapter.py
src/inferia/services/orchestration/services/adapter_engine/adapters/k8s/k8s_adapter.py
src/inferia/services/orchestration/services/adapter_engine/adapters/k8s/k8s_liveness.py
src/inferia/services/orchestration/services/adapter_engine/adapters/nosana/job_builder.py
src/inferia/services/orchestration/services/adapter_engine/adapters/nosana/nosana_adapter.py
src/inferia/services/orchestration/services/adapter_engine/adapters/skypilot/skypilot_adapter.py
src/inferia/services/orchestration/services/adapter_engine/adapters/skypilot/spec_builder.py
src/inferia/services/orchestration/services/autoscaler/worker.py
src/inferia/services/orchestration/services/compute_node/service.py
src/inferia/services/orchestration/services/compute_pool_engine/__init__.py
src/inferia/services/orchestration/services/compute_pool_engine/compute_pool_manager.py
src/inferia/services/orchestration/services/depin-sidecar/package.json
src/inferia/services/orchestration/services/depin-sidecar/tsconfig.json
src/inferia/services/orchestration/services/depin-sidecar/dist/server.js
src/inferia/services/orchestration/services/depin-sidecar/dist/modules/akash/akash_service.js
src/inferia/services/orchestration/services/depin-sidecar/dist/modules/nosana/nosana_logs.js
src/inferia/services/orchestration/services/depin-sidecar/dist/modules/nosana/nosana_service.js
src/inferia/services/orchestration/services/depin-sidecar/src/server.ts
src/inferia/services/orchestration/services/depin-sidecar/src/modules/akash/akash_service.ts
src/inferia/services/orchestration/services/depin-sidecar/src/modules/nosana/nosana_logs.ts
src/inferia/services/orchestration/services/depin-sidecar/src/modules/nosana/nosana_service.ts
src/inferia/services/orchestration/services/eventing/outbox_publisher.py
src/inferia/services/orchestration/services/inventory_manager/http.py
src/inferia/services/orchestration/services/inventory_manager/liveness.py
src/inferia/services/orchestration/services/inventory_manager/service.py
src/inferia/services/orchestration/services/llmd/spec_builder.py
src/inferia/services/orchestration/services/llmd_runtime/client.py
src/inferia/services/orchestration/services/llmd_runtime/health.py
src/inferia/services/orchestration/services/llmd_runtime/runtime.py
src/inferia/services/orchestration/services/llmd_runtime/spec.py
src/inferia/services/orchestration/services/model_deployment/controller.py
src/inferia/services/orchestration/services/model_deployment/deployment_server.py
src/inferia/services/orchestration/services/model_deployment/runtime_resolver.py
src/inferia/services/orchestration/services/model_deployment/service.py
src/inferia/services/orchestration/services/model_deployment/worker.py
src/inferia/services/orchestration/services/model_deployment/worker_main.py
src/inferia/services/orchestration/services/model_deployment/strategies/base.py
src/inferia/services/orchestration/services/model_deployment/strategies/llmd.py
src/inferia/services/orchestration/services/model_deployment/strategies/vllm.py
src/inferia/services/orchestration/services/model_registry/service.py
src/inferia/services/orchestration/services/node-agent/__init__.py
src/inferia/services/orchestration/services/node-agent/main.py
src/inferia/services/orchestration/services/node-agent/agent/__init__.py
src/inferia/services/orchestration/services/node-agent/agent/cpu.py
src/inferia/services/orchestration/services/node-agent/agent/gpu.py
src/inferia/services/orchestration/services/node-agent/agent/heartbeat.py
src/inferia/services/orchestration/services/node-agent/agent/memory.py
src/inferia/services/orchestration/services/placement_engine/__init__.py
src/inferia/services/orchestration/services/placement_engine/scoring.py
src/inferia/services/orchestration/services/placement_engine/service.py
src/inferia/services/orchestration/services/scheduler/service.py
src/inferia/services/orchestration/services/traffic_router/__init__.py
src/inferia/services/orchestration/services/traffic_router/engine.py
src/inferia/services/orchestration/shared/__init__.py
src/inferia/services/orchestration/test/aws_instance_specs.py
src/inferia/services/orchestration/test/test_aws_realtime_capacity.py
src/inferia/services/orchestration/test/test_grpc.py
src/inferia/services/orchestration/test/test_node_agent_heartbeat.py
src/inferia/services/orchestration/test/test_node_liveness.py
src/inferia/services/orchestration/test/test_traffic_router.py
src/inferia/services/orchestration/test/adapter_test/test_adapter_engine.py
src/inferia/services/orchestration/test/adapter_test/test_k8s_compute_e2e.py
src/inferia/services/orchestration/test/adapter_test/test_model_deploy.py
src/inferia/services/orchestration/test/adapter_test/test_model_deploy_nosana.py
src/inferia/services/orchestration/test/adapter_test/test_skypilot_adapter.py
src/inferia/services/orchestration/test/autoscaler/test_scale_down.py
src/inferia/services/orchestration/test/autoscaler/test_scale_up.py
src/inferia/services/orchestration/test/compute_pools_nodes/test_compute_node_grpc.py
src/inferia/services/orchestration/test/compute_pools_nodes/test_fake_adapter.py
src/inferia/services/orchestration/test/e2e/test_e2e_control_plane.py
src/inferia/services/orchestration/test/gang/test_gang_concurrency.py
src/inferia/services/orchestration/test/gang/test_gang_insufficient_capacity.py
src/inferia/services/orchestration/test/gang/test_gang_success.py
src/inferia/services/orchestration/test/integration/test_control_plane_e2e.py
src/inferia/services/orchestration/test/model_deployment/test_model_deployment_e2e.py
src/inferia/services/orchestration/test/model_deployment/test_start_deployment_controller.py
src/inferia/services/orchestration/test/model_registry/test_model_registry.py
src/inferia/services/orchestration/test/placement_test/test_placement_engine.py
src/inferia/services/orchestration/test/provisioning/__init__.py
src/inferia/services/orchestration/test/provisioning/test_skypilot_provisioner.py
src/inferia/services/orchestration/test/quota/_setup.py
src/inferia/services/orchestration/test/quota/test_billing_events.py
src/inferia/services/orchestration/test/quota/test_hard_quota.py
src/inferia/services/orchestration/test/quota/test_quota_preemption.py
src/inferia/services/orchestration/test/quota/test_quota_release.py
src/inferia/services/orchestration/test/scheduler/test_concurrency.py
src/inferia/services/orchestration/test/spot/test_spot_allocation.py
src/inferia/services/orchestration/test/spot/test_spot_reclaim.py
src/inferia/services/orchestration/test/spot/test_spot_vs_ondemand.py
src/inferia/services/orchestration/test/test_inventory/send_heartbeat.py
src/inferia/services/orchestration/v1/__init__.py
src/inferia/services/orchestration/v1/adapter_engine_pb2.py
src/inferia/services/orchestration/v1/adapter_engine_pb2_grpc.py
src/inferia/services/orchestration/v1/compute_node_pb2.py
src/inferia/services/orchestration/v1/compute_node_pb2_grpc.py
src/inferia/services/orchestration/v1/compute_pool_pb2.py
src/inferia/services/orchestration/v1/compute_pool_pb2_grpc.py
src/inferia/services/orchestration/v1/inventory_manager_pb2.py
src/inferia/services/orchestration/v1/inventory_manager_pb2_grpc.py
src/inferia/services/orchestration/v1/model_deployment_pb2.py
src/inferia/services/orchestration/v1/model_deployment_pb2_grpc.py
src/inferia/services/orchestration/v1/model_registry_pb2.py
src/inferia/services/orchestration/v1/model_registry_pb2_grpc.py
src/inferia/services/orchestration/v1/placement_engine_pb2.py
src/inferia/services/orchestration/v1/placement_engine_pb2_grpc.py
src/inferia/services/orchestration/v1/scheduler_pb2.py
src/inferia/services/orchestration/v1/scheduler_pb2_grpc.py
src/inferia/services/orchestration/workers/autoscaler_worker.py
src/inferia/services/orchestration/workers/deployment_worker.py
src/inferia/services/orchestration/workers/inventory_liveness_worker.py
src/inferia/services/orchestration/workers/outbox_worker.py
src/inferia/services/orchestration/workers/spot_reclaimer_worker.py
src/inferiallm.egg-info/PKG-INFO
src/inferiallm.egg-info/SOURCES.txt
src/inferiallm.egg-info/dependency_links.txt
src/inferiallm.egg-info/entry_points.txt
src/inferiallm.egg-info/requires.txt
src/inferiallm.egg-info/top_level.txt