README.md
pyproject.toml
src/llamacpp_cli/__init__.py
src/llamacpp_cli/backend_registry.py
src/llamacpp_cli/cli.py
src/llamacpp_cli/config.py
src/llamacpp_cli/conversation_affinity.py
src/llamacpp_cli/cpu_topology.py
src/llamacpp_cli/db.py
src/llamacpp_cli/gpu_detect.py
src/llamacpp_cli/installer.py
src/llamacpp_cli/ip_filter.py
src/llamacpp_cli/lb_proxy.py
src/llamacpp_cli/lb_proxy_logging.py
src/llamacpp_cli/llm_plugin.py
src/llamacpp_cli/model_manager.py
src/llamacpp_cli/model_warmer.py
src/llamacpp_cli/multi_model_proxy.py
src/llamacpp_cli/multi_model_server.py
src/llamacpp_cli/prometheus_metrics.py
src/llamacpp_cli/proxy.py
src/llamacpp_cli/ps.py
src/llamacpp_cli/request_logger.py
src/llamacpp_cli/response_cache.py
src/llamacpp_cli/run.py
src/llamacpp_cli/search.py
src/llamacpp_cli/server.py
src/llamacpp_cli/slot_manager.py
src/llamacpp_cli/slot_serve.py
src/llamacpp_cli/utils.py
src/llamacpp_cli.egg-info/PKG-INFO
src/llamacpp_cli.egg-info/SOURCES.txt
src/llamacpp_cli.egg-info/dependency_links.txt
src/llamacpp_cli.egg-info/entry_points.txt
src/llamacpp_cli.egg-info/requires.txt
src/llamacpp_cli.egg-info/top_level.txt
tests/test_backend_registry.py
tests/test_circuit_breaker.py
tests/test_cli.py
tests/test_config.py
tests/test_conversation_affinity.py
tests/test_cpu_topology.py
tests/test_db.py
tests/test_gpu_detect.py
tests/test_ip_filter.py
tests/test_lb_proxy_endpoints.py
tests/test_lb_proxy_logging.py
tests/test_lb_proxy_queue.py
tests/test_management_cli.py
tests/test_model_manager.py
tests/test_model_warmer.py
tests/test_multi_model_server.py
tests/test_openapi.py
tests/test_prometheus_metrics.py
tests/test_realtime_dashboard.py
tests/test_request_logger.py
tests/test_response_cache.py
tests/test_response_cache_integration.py
tests/test_server.py
tests/test_slot_manager.py
tests/test_sse_parsing.py
tests/test_tps_stats.py
tests/test_utils.py
tests/test_weighted_lb.py