CLAUDE.md
MANIFEST.in
README.md
pyproject.toml
requirements.txt
setup.py
cli_arena/__init__.py
cli_arena/__main__.py
cli_arena/canary_protection.py
cli_arena/post_install.py
cli_arena/repository_manager.py
cli_arena.egg-info/PKG-INFO
cli_arena.egg-info/SOURCES.txt
cli_arena.egg-info/dependency_links.txt
cli_arena.egg-info/entry_points.txt
cli_arena.egg-info/requires.txt
cli_arena.egg-info/top_level.txt
cli_arena/agents/__init__.py
cli_arena/agents/agent_utils.py
cli_arena/agents/base_agent.py
cli_arena/agents/base_docker_agent.py
cli_arena/agents/failure_mode.py
cli_arena/agents/naive_agent.py
cli_arena/agents/oracle_agent.py
cli_arena/agents/prompt_manager.py
cli_arena/agents/simple_oracle_agent.py
cli_arena/agents/installed_agents/naive_agent.py
cli_arena/agents/installed_agents/aider/__init__.py
cli_arena/agents/installed_agents/aider/aider-setup.sh
cli_arena/agents/installed_agents/aider/aider_agent.py
cli_arena/agents/installed_agents/claude_code/__init__.py
cli_arena/agents/installed_agents/claude_code/claude-code-setup.sh
cli_arena/agents/installed_agents/claude_code/claude_code_agent.py
cli_arena/agents/installed_agents/cursor_cli/__init__.py
cli_arena/agents/installed_agents/cursor_cli/cursor_cli_agent.py
cli_arena/agents/installed_agents/gemini_cli/__init__.py
cli_arena/agents/installed_agents/gemini_cli/gemini-cli-setup.sh
cli_arena/agents/installed_agents/gemini_cli/gemini_cli_agent.py
cli_arena/agents/installed_agents/openai_codex/__init__.py
cli_arena/agents/installed_agents/openai_codex/codex-setup.sh
cli_arena/agents/installed_agents/openai_codex/codex_agent.py
cli_arena/agents/prompts/README.md
cli_arena/agents/prompts/USAGE.md
cli_arena/agents/prompts/complex_prompt.txt
cli_arena/agents/prompts/enhanced_multi_step_prompt.txt
cli_arena/agents/prompts/expert_prompt.txt
cli_arena/agents/prompts/my_custom_prompt.txt
cli_arena/agents/prompts/naive_prompt.txt
cli_arena/cache/__init__.py
cli_arena/cache/agent_cache.py
cli_arena/cache/anthropic.py
cli_arena/cli/__init__.py
cli_arena/cli/fork_wizard.py
cli_arena/cli/wizard.py
cli_arena/cli/arena/__init__.py
cli_arena/cli/arena/admin.py
cli_arena/cli/arena/cache.py
cli_arena/cli/arena/datasets.py
cli_arena/cli/arena/docker_cli.py
cli_arena/cli/arena/leaderboard.py
cli_arena/cli/arena/main.py
cli_arena/cli/arena/publish.py
cli_arena/cli/arena/quality_cli.py
cli_arena/cli/arena/registry_cli.py
cli_arena/cli/arena/runs.py
cli_arena/cli/arena/tasks.py
cli_arena/cli/arena/quality_checker/__init__.py
cli_arena/cli/arena/quality_checker/quality_checker.py
cli_arena/cli/arena/quality_checker/task_fixer.py
cli_arena/cli/tb/__init__.py
cli_arena/cli/tb/quality_checker/check.txt
cli_arena/cli/tb/quality_checker/fix.txt
cli_arena/cli/tb/quality_checker/models.py
cli_arena/cli/template-task/docker-compose.yaml
cli_arena/cli/template-task/run-tests.sh
cli_arena/cli/template-task/solution.sh
cli_arena/cli/template-task/solution.yaml
cli_arena/cli/template-task/tests/test_outputs.py
cli_arena/cli/workbench/__init__.py
cli_arena/cli/workbench/main.py
cli_arena/compat/terminal_bench/__init__.py
cli_arena/compat/terminal_bench/agents/__init__.py
cli_arena/compat/terminal_bench/handlers/__init__.py
cli_arena/compat/terminal_bench/handlers/trial_handler.py
cli_arena/compat/terminal_bench/harness/__init__.py
cli_arena/compat/terminal_bench/terminal/__init__.py
cli_arena/compat/terminal_bench/terminal/models.py
cli_arena/compat/terminal_bench/terminal/terminal.py
cli_arena/compat/terminal_bench/terminal/tmux_session.py
cli_arena/dataset/__init__.py
cli_arena/dataset/dataset.py
cli_arena/dataset/dataset_metadata.py
cli_arena/evaluation/__init__.py
cli_arena/evaluation/advanced_metrics.py
cli_arena/evaluation/improved_metrics.py
cli_arena/evaluation/tool_call_analyzer.py
cli_arena/harness/__init__.py
cli_arena/harness/consolidated_harness.py
cli_arena/harness/docker_health_manager.py
cli_arena/harness/models.py
cli_arena/leaderboard/__init__.py
cli_arena/leaderboard/badges.py
cli_arena/leaderboard/ci_integration.py
cli_arena/leaderboard/enhanced_metrics.py
cli_arena/leaderboard/enhanced_web.py
cli_arena/leaderboard/leaderboard.py
cli_arena/leaderboard/server.py
cli_arena/leaderboard/web.py
cli_arena/llms/base_llm.py
cli_arena/llms/lite_llm.py
cli_arena/llms/litellm.py
cli_arena/llms/test_claude.py
cli_arena/parsers/__init__.py
cli_arena/parsers/base_parser.py
cli_arena/parsers/parser_factory.py
cli_arena/parsers/pytest_parser.py
cli_arena/parsers/swebench_parser.py
cli_arena/quality/__init__.py
cli_arena/quality/task_validator.py
cli_arena/recording/harness_integration.py
cli_arena/recording/session_recorder.py
cli_arena/recording/web_player.py
cli_arena/registry/client.py
cli_arena/registry/manager.py
cli_arena/registry/publisher.py
cli_arena/reliability/__init__.py
cli_arena/reliability/flakiness_detector.py
cli_arena/scoring/__init__.py
cli_arena/scoring/example_rubric.yaml
cli_arena/scoring/harness_integration.py
cli_arena/scoring/rubrics.py
cli_arena/scoring/simple_rubrics.py
cli_arena/terminal/__init__.py
cli_arena/terminal/docker_compose_manager.py
cli_arena/terminal/get-asciinema-timestamp.sh
cli_arena/terminal/models.py
cli_arena/terminal/terminal.py
cli_arena/terminal/tmux_session.py
cli_arena/utils/__init__.py
cli_arena/utils/agent_bash_script.sh
cli_arena/utils/anthropic_caching.py
cli_arena/utils/create_embedded_parser.py
cli_arena/utils/create_embedded_parser_v2.py
cli_arena/utils/docker_subprocess.py
cli_arena/utils/env.py
cli_arena/utils/env_model.py
cli_arena/utils/livestreamer.py
cli_arena/utils/llm_response_parser.py
cli_arena/utils/logger.py
cli_arena/utils/parse_and_execute.py
cli_arena/utils/run_lock.py
cli_arena/utils/task_timeouts.py
cli_arena/utils/verify_maintenance.py
docker/agents/goose/Dockerfile
docker/agents/goose/add_recipe_prompt.py
docker/agents/goose/config-template.yaml
docker/agents/goose/docker-compose.yaml
docker/agents/goose/entrypoint.sh
docker/agents/goose/recipe-template.yaml
docker/base-images/docker-compose.yaml
docker/base-images/deveval/Dockerfile
docker/base-images/python-3-13/Dockerfile
docker/base-images/ubuntu-24-04/Dockerfile
docker/base-images/ubuntu-24-04/Dockerfile.cli-tools
docker/base-images/ubuntu-24-04/Dockerfile.minimal
docker/base-images/ubuntu-24-04/Dockerfile.optimized
docker/base-images/ubuntu-24-04/Dockerfile.quick
docker/base-images/ubuntu-24-04/Dockerfile.with-go
docker/base-images/ubuntu-24-04/Dockerfile.working
docker/mcp-server/Dockerfile
docker/mcp-server/docker-compose.yaml
docker/mcp-server/server/server.py
docker/mcp-server/server/tmux_session.py
repositories/cli-arena-devops-go-a/.aider.chat.history.md
repositories/cli-arena-devops-go-a/README.md
repositories/cli-arena-devops-go-a/.pytest_cache/README.md
repositories/cli-arena-devops-go-a/db/README.md
repositories/cli-arena-devops-go-a/docs/README.md
repositories/cli-arena-devops-go-a/docs/index.md
repositories/cli-arena-devops-go-a/setup_tests/README.md
repositories/cli-arena-devops-go-a/setup_tests/unit/test_arithmetic.py
repositories/cli-arena-devops-go-a/tasks/configure_cross_account_iam_role_terraform/task.yaml
repositories/cli-arena-devops-go-a/tasks/configure_cross_account_iam_role_terraform/verify.sh
repositories/cli-arena-devops-go-a/tasks/debug_terraform_dependent_resource_creation_failure/task.yaml
repositories/cli-arena-devops-go-a/tasks/debug_terraform_dependent_resource_creation_failure/verify.sh
repositories/cli-arena-devops-go-a/tasks/diagnose_and_fix_terraform_drift/task.yaml
repositories/cli-arena-devops-go-a/tasks/diagnose_and_fix_terraform_drift/verify.sh
repositories/cli-arena-devops-go-a/tasks/harden-docker-security/task.yaml
repositories/cli-arena-devops-go-a/tasks/harden-docker-security/verify.sh
repositories/cli-arena-devops-go-a/tasks/implement_canary_deployment_strategy_docker/task.yaml
repositories/cli-arena-devops-go-a/tasks/implement_canary_deployment_strategy_docker/verify.sh
repositories/cli-arena-devops-go-a/tasks/integrate_go_app_with_vault_for_secrets/task.yaml
repositories/cli-arena-devops-go-a/tasks/integrate_go_app_with_vault_for_secrets/verify.sh
repositories/cli-arena-devops-go-a/tasks/migrate_terraform_backend_s3_to_gcs/task.yaml
repositories/cli-arena-devops-go-a/tasks/migrate_terraform_backend_s3_to_gcs/verify.sh
repositories/cli-arena-devops-go-a/tasks/optimize_and_secure_ci_pipeline_for_go_terraform/task.yaml
repositories/cli-arena-devops-go-a/tasks/optimize_and_secure_ci_pipeline_for_go_terraform/verify.sh
repositories/cli-arena-devops-go-a/tasks/restore_application_from_failed_kubernetes_node_simulation/task.yaml
repositories/cli-arena-devops-go-a/tasks/restore_application_from_failed_kubernetes_node_simulation/verify.sh
repositories/cli-arena-devops-go-a/tasks/setup_centralized_logging_docker_go_fluentd/task.yaml
repositories/cli-arena-devops-go-a/tasks/setup_centralized_logging_docker_go_fluentd/verify.sh
repositories/cli-arena-devops-go-a/tasks/troubleshoot_multi_stage_docker_build_failure/task.yaml
repositories/cli-arena-devops-go-a/tasks/troubleshoot_multi_stage_docker_build_failure/verify.sh
repositories/cli-arena-devops-go-a/tests/unit/test_arithmetic.py
repositories/cli-arena-devops-go-b/PROJECT_STATUS.md
repositories/cli-arena-devops-go-b/README.md
repositories/cli-arena-devops-go-b/.pytest_cache/README.md
repositories/cli-arena-devops-go-b/setup_tests/test_environment.py
repositories/cli-arena-devops-go-b/tasks/custom-terraform-backend/task.yaml
repositories/cli-arena-devops-go-b/tasks/custom-terraform-backend/verify.sh
repositories/cli-arena-devops-go-b/tasks/custom-terraform-provider/task.yaml
repositories/cli-arena-devops-go-b/tasks/custom-terraform-provider/verify.sh
repositories/cli-arena-devops-go-b/tasks/future-numbering-system/task.yaml
repositories/cli-arena-devops-go-b/tasks/future-numbering-system/verify.sh
repositories/cli-arena-devops-go-b/tasks/gear-service-vehicle/task.yaml
repositories/cli-arena-devops-go-b/tasks/gear-service-vehicle/verify.sh
repositories/cli-arena-devops-go-b/tasks/go-importing-system/task.yaml
repositories/cli-arena-devops-go-b/tasks/go-importing-system/verify.sh
repositories/cli-arena-devops-go-b/tasks/memory-consumption-tool/task.yaml
repositories/cli-arena-devops-go-b/tasks/memory-consumption-tool/verify.sh
repositories/cli-arena-devops-go-b/tasks/self-healing-docker-infra/task.yaml
repositories/cli-arena-devops-go-b/tasks/self-healing-docker-infra/verify.sh
repositories/cli-arena-devops-go-b/tasks/terraform-docker-combination/task.yaml
repositories/cli-arena-devops-go-b/tasks/terraform-docker-combination/verify.sh
repositories/cli-arena-devops-go-b/tasks/terraform-module-testing/task.yaml
repositories/cli-arena-devops-go-b/tasks/terraform-module-testing/verify.sh
repositories/cli-arena-devops-go-b/tasks/terraform-orchestrator/task.yaml
repositories/cli-arena-devops-go-b/tasks/terraform-orchestrator/verify.sh
repositories/cli-arena-devops-go-b/tasks/vault-secrets-terraform/task.yaml
repositories/cli-arena-devops-go-b/tasks/vault-secrets-terraform/verify.sh
repositories/cli-arena-devops-go-b/tests/unit/test_arithmetic.py
repositories/cli-arena-gamedev-unity-a/README.md
repositories/cli-arena-gamedev-unity-a/game_cli.py
repositories/cli-arena-gamedev-unity-a/game_state.py
repositories/cli-arena-gamedev-unity-a/generate_prefab.py
repositories/cli-arena-gamedev-unity-a/sound_cli.py
repositories/cli-arena-gamedev-unity-a/.pytest_cache/README.md
repositories/cli-arena-gamedev-unity-a/tasks/dynamic-sound-manager/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/dynamic-sound-manager/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/editor-tools-cli/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/editor-tools-cli/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/enemy-finite-state-machine/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/enemy-finite-state-machine/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/event-driven-dialogue-system/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/event-driven-dialogue-system/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/modular-ui-system/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/modular-ui-system/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/multiplayer-lobby-system/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/multiplayer-lobby-system/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/navmesh-pathfinding-ai/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/navmesh-pathfinding-ai/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/physics-based-grappling-hook/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/physics-based-grappling-hook/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/procedural-terrain-generation/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/procedural-terrain-generation/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/ragdoll-death-physics/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/ragdoll-death-physics/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/realistic-day-night-cycle/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/realistic-day-night-cycle/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/runtime-asset-streaming/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/runtime-asset-streaming/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/runtime-performance-profiler/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/runtime-performance-profiler/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/save-load-system-json/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/save-load-system-json/verify.sh
repositories/cli-arena-gamedev-unity-a/tasks/unity-build-pipeline-cli/task.yaml
repositories/cli-arena-gamedev-unity-a/tasks/unity-build-pipeline-cli/verify.sh
repositories/cli-arena-gamedev-unity-a/tests/unit/test_arithmetic.py
repositories/cli-arena-ml-fastapi-a/.aider.chat.history.md
repositories/cli-arena-ml-fastapi-a/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-a/tasks/task-001-jwt-auth/task.yaml
repositories/cli-arena-ml-fastapi-a/tasks/task-001-jwt-auth/verify.sh
repositories/cli-arena-ml-fastapi-a/tasks/task-002-ml-predict/task.yaml
repositories/cli-arena-ml-fastapi-a/tasks/task-002-ml-predict/verify.sh
repositories/cli-arena-ml-fastapi-a/tasks/task-003-sql-injection-defense/task.yaml
repositories/cli-arena-ml-fastapi-a/tasks/task-003-sql-injection-defense/verify.sh
repositories/cli-arena-ml-fastapi-a/tasks/task-003-sql-injection-defense/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-a/tasks/task-009-docker-caching/task.yaml
repositories/cli-arena-ml-fastapi-a/tasks/task-009-docker-caching/verify.sh
repositories/cli-arena-ml-fastapi-a/tasks/task-010-wildcard-ultra-hard/task.yaml
repositories/cli-arena-ml-fastapi-a/tasks/task-010-wildcard-ultra-hard/verify.sh
repositories/cli-arena-ml-fastapi-a/tasks/task-010-wildcard-ultra-hard/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-a/tests/test_auth.py
repositories/cli-arena-ml-fastapi-a/tests/test_predict.py
repositories/cli-arena-ml-fastapi-a/tests/unit/test_arithmetic.py
repositories/cli-arena-ml-fastapi-b/.aider.chat.history.md
repositories/cli-arena-ml-fastapi-b/README.md
repositories/cli-arena-ml-fastapi-b/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-b/scripts/init_db.py
repositories/cli-arena-ml-fastapi-b/tasks/behavior-analysis/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/behavior-analysis/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/behavior-analysis/tests/test_behavior_analysis.py
repositories/cli-arena-ml-fastapi-b/tasks/canary-releases/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/canary-releases/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/canary-releases/tests/test_canary_releases.py
repositories/cli-arena-ml-fastapi-b/tasks/chaos-engineering-k8s/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/chaos-engineering-k8s/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/chaos-engineering-k8s/tests/test_chaos_engineering_k8s.py
repositories/cli-arena-ml-fastapi-b/tasks/feature-flags/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/feature-flags/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/feature-flags/tests/test_feature_flags.py
repositories/cli-arena-ml-fastapi-b/tasks/gitops-deployment/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/gitops-deployment/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/instagram-api/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/instagram-api/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/instagram-api/tests/test_instagram_api.py
repositories/cli-arena-ml-fastapi-b/tasks/observability-opentelemetry/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/observability-opentelemetry/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/observability-opentelemetry/tests/test_observability_opentelemetry.py
repositories/cli-arena-ml-fastapi-b/tasks/polyglot-tracing/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/polyglot-tracing/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/polyglot-tracing/tests/test_polyglot_tracing.py
repositories/cli-arena-ml-fastapi-b/tasks/service-mesh-design/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/service-mesh-design/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/service-mesh-design/tests/test_service_mesh_design.py
repositories/cli-arena-ml-fastapi-b/tasks/zero-trust-microservices/task.yaml
repositories/cli-arena-ml-fastapi-b/tasks/zero-trust-microservices/verify.sh
repositories/cli-arena-ml-fastapi-b/tasks/zero-trust-microservices/tests/test_zero_trust_microservices.py
repositories/cli-arena-ml-fastapi-b/tests/root_test_behavior_analysis.py
repositories/cli-arena-ml-fastapi-b/tests/root_test_instagram_api.py
repositories/cli-arena-ml-fastapi-b/tests/test_behavior_analysis.py
repositories/cli-arena-ml-fastapi-b/tests/test_instagram_api.py
repositories/cli-arena-ml-fastapi-b/tests/unit/test_arithmetic.py
repositories/cli-arena-ml-fastapi-c/.aider.chat.history.md
repositories/cli-arena-ml-fastapi-c/README.md
repositories/cli-arena-ml-fastapi-c/test_epic_graph_api_with_rate_limiting.py
repositories/cli-arena-ml-fastapi-c/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-c/scripts/init_db.py
repositories/cli-arena-ml-fastapi-c/tasks/auto-scaling-symbolic-algebra-microservice/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/auto-scaling-symbolic-algebra-microservice/test_auto_scaling_symbolic_algebra_microservice.py
repositories/cli-arena-ml-fastapi-c/tasks/auto-scaling-symbolic-algebra-microservice/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/chem-aware-rest-api-in-kubernetes/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/chem-aware-rest-api-in-kubernetes/test_chem_aware_rest_api_in_kubernetes.py
repositories/cli-arena-ml-fastapi-c/tasks/chem-aware-rest-api-in-kubernetes/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/containerized-ramayana-geo-api/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/containerized-ramayana-geo-api/test_containerized_ramayana_geo_api.py
repositories/cli-arena-ml-fastapi-c/tasks/containerized-ramayana-geo-api/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/docker-ml-pipeline-for-reaction-kinetics/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/docker-ml-pipeline-for-reaction-kinetics/test_docker_ml_pipeline_for_reaction_kinetics.py
repositories/cli-arena-ml-fastapi-c/tasks/docker-ml-pipeline-for-reaction-kinetics/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/docker-swarm-fluid-dynamics-engine/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/docker-swarm-fluid-dynamics-engine/test_docker_swarm_fluid_dynamics_engine.py
repositories/cli-arena-ml-fastapi-c/tasks/docker-swarm-fluid-dynamics-engine/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/dockerized-jupyter-chemistry-platform/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/dockerized-jupyter-chemistry-platform/test_dockerized_jupyter_chemistry_platform.py
repositories/cli-arena-ml-fastapi-c/tasks/dockerized-jupyter-chemistry-platform/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/dockerized-sanskrit-verse-classifier-api/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/dockerized-sanskrit-verse-classifier-api/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/dockerized-sanskrit-verse-classifier-api/tests/test_dockerized_sanskrit_verse_classifier.py
repositories/cli-arena-ml-fastapi-c/tasks/epic-graph-api-with-rate-limiting/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/epic-graph-api-with-rate-limiting/test_epic_graph_api_with_rate_limiting.py
repositories/cli-arena-ml-fastapi-c/tasks/epic-graph-api-with-rate-limiting/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/gpu-enabled-em-field-simulation-api/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/gpu-enabled-em-field-simulation-api/test_gpu_enabled_em_field_simulation_api.py
repositories/cli-arena-ml-fastapi-c/tasks/gpu-enabled-em-field-simulation-api/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/hybrid-cloud-tensor-calculus-solver/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/hybrid-cloud-tensor-calculus-solver/test_hybrid_cloud_tensor_calculus_solver.py
repositories/cli-arena-ml-fastapi-c/tasks/hybrid-cloud-tensor-calculus-solver/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/multi-cloud-cicd-for-fea-docker-tools/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/multi-cloud-cicd-for-fea-docker-tools/test_multi_cloud_cicd_for_fea_docker_tools.py
repositories/cli-arena-ml-fastapi-c/tasks/multi-cloud-cicd-for-fea-docker-tools/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/sanskrit-to-math-translator-cloud-function/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/sanskrit-to-math-translator-cloud-function/test_sanskrit_to_math_translator_cloud_function.py
repositories/cli-arena-ml-fastapi-c/tasks/sanskrit-to-math-translator-cloud-function/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/serverless-epic-logic-theorem-prover/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/serverless-epic-logic-theorem-prover/test_serverless_epic_logic_theorem_prover.py
repositories/cli-arena-ml-fastapi-c/tasks/serverless-epic-logic-theorem-prover/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/serverless-mahabharata-genealogy-api/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/serverless-mahabharata-genealogy-api/test_serverless_mahabharata_genealogy_api.py
repositories/cli-arena-ml-fastapi-c/tasks/serverless-mahabharata-genealogy-api/verify.sh
repositories/cli-arena-ml-fastapi-c/tasks/serverless-physics-simulator/task.yaml
repositories/cli-arena-ml-fastapi-c/tasks/serverless-physics-simulator/test_serverless_physics_simulator.py
repositories/cli-arena-ml-fastapi-c/tasks/serverless-physics-simulator/verify.sh
repositories/cli-arena-ml-fastapi-c/tests/test_auto_scaling_symbolic_algebra_microservice.py
repositories/cli-arena-ml-fastapi-c/tests/test_chem_aware_rest_api_in_kubernetes.py
repositories/cli-arena-ml-fastapi-c/tests/test_containerized_ramayana_geo_api.py
repositories/cli-arena-ml-fastapi-c/tests/test_docker_ml_pipeline_for_reaction_kinetics.py
repositories/cli-arena-ml-fastapi-c/tests/test_docker_swarm_fluid_dynamics_engine.py
repositories/cli-arena-ml-fastapi-c/tests/test_dockerized_jupyter_chemistry_platform.py
repositories/cli-arena-ml-fastapi-c/tests/test_dockerized_sanskrit_verse_classifier.py
repositories/cli-arena-ml-fastapi-c/tests/test_epic_graph_api_with_rate_limiting.py
repositories/cli-arena-ml-fastapi-c/tests/test_example_complex_task.py
repositories/cli-arena-ml-fastapi-c/tests/test_gpu_enabled_em_field_simulation_api.py
repositories/cli-arena-ml-fastapi-c/tests/test_hybrid_cloud_tensor_calculus_solver.py
repositories/cli-arena-ml-fastapi-c/tests/test_multi_cloud_cicd_for_fea_docker_tools.py
repositories/cli-arena-ml-fastapi-c/tests/test_sanskrit_to_math_translator_cloud_function.py
repositories/cli-arena-ml-fastapi-c/tests/test_serverless_epic_logic_theorem_prover.py
repositories/cli-arena-ml-fastapi-c/tests/test_serverless_mahabharata_genealogy_api.py
repositories/cli-arena-ml-fastapi-c/tests/test_serverless_physics_simulator.py
repositories/cli-arena-ml-fastapi-c/tests/unit/test_arithmetic.py
repositories/cli-arena-ml-fastapi-d/README.md
repositories/cli-arena-ml-fastapi-d/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/scripts/generate_loan_model.py
repositories/cli-arena-ml-fastapi-d/scripts/init_db.py
repositories/cli-arena-ml-fastapi-d/setup_tests/__init__.py
repositories/cli-arena-ml-fastapi-d/setup_tests/test_main.py
repositories/cli-arena-ml-fastapi-d/setup_tests/test_predict.py
repositories/cli-arena-ml-fastapi-d/tasks/add-rate-limiter-middleware/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/add-rate-limiter-middleware/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/add-rate-limiter-middleware/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/add-rate-limiter-middleware/src/main.py
repositories/cli-arena-ml-fastapi-d/tasks/add-rate-limiter-middleware/src/middleware/rate_limiter.py
repositories/cli-arena-ml-fastapi-d/tasks/add-rate-limiter-middleware/tests/test_rate_limit.py
repositories/cli-arena-ml-fastapi-d/tasks/add-shap-explanation-api/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/add-shap-explanation-api/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/add-shap-explanation-api/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/add-shap-explanation-api/tests/test_explain.py
repositories/cli-arena-ml-fastapi-d/tasks/add-threshold-adjustment-api/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/add-threshold-adjustment-api/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/add-threshold-adjustment-api/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/add-threshold-adjustment-api/tests/test_threshold.py
repositories/cli-arena-ml-fastapi-d/tasks/add-user-authentication/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/add-user-authentication/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/add-user-authentication/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/add-user-authentication/tests/test_auth.py
repositories/cli-arena-ml-fastapi-d/tasks/inject-random-delay/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/inject-random-delay/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/inject-random-delay/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/inject-random-delay/tests/test_delay.py
repositories/cli-arena-ml-fastapi-d/tasks/log-prediction-history/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/log-prediction-history/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/log-prediction-history/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/log-prediction-history/tests/test_history.py
repositories/cli-arena-ml-fastapi-d/tasks/log-predictions-to-db/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/log-predictions-to-db/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/log-predictions-to-db/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/log-predictions-to-db/tests/test_logging.py
repositories/cli-arena-ml-fastapi-d/tasks/replace-model-with-xgboost/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/replace-model-with-xgboost/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/replace-model-with-xgboost/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/replace-model-with-xgboost/tests/test_predict.py
repositories/cli-arena-ml-fastapi-d/tasks/track-prediction-metrics/task.yaml
repositories/cli-arena-ml-fastapi-d/tasks/track-prediction-metrics/verify.sh
repositories/cli-arena-ml-fastapi-d/tasks/track-prediction-metrics/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-d/tasks/track-prediction-metrics/tests/test_metrics.py
repositories/cli-arena-ml-fastapi-d/tests/root_test_auth.py
repositories/cli-arena-ml-fastapi-d/tests/root_test_explain.py
repositories/cli-arena-ml-fastapi-d/tests/root_test_history.py
repositories/cli-arena-ml-fastapi-d/tests/root_test_predict.py
repositories/cli-arena-ml-fastapi-d/tests/root_test_threshold.py
repositories/cli-arena-ml-fastapi-d/tests/test_auth.py
repositories/cli-arena-ml-fastapi-d/tests/test_explain.py
repositories/cli-arena-ml-fastapi-d/tests/test_history.py
repositories/cli-arena-ml-fastapi-d/tests/test_metrics.py
repositories/cli-arena-ml-fastapi-d/tests/test_predict.py
repositories/cli-arena-ml-fastapi-d/tests/test_threshold.py
repositories/cli-arena-ml-fastapi-d/tests/unit/test_arithmetic.py
repositories/cli-arena-ml-fastapi-e/.aider.chat.history.md
repositories/cli-arena-ml-fastapi-e/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-e/tasks/add-user-authentication/task.yaml
repositories/cli-arena-ml-fastapi-e/tasks/add-user-authentication/verify.sh
repositories/cli-arena-ml-fastapi-e/tasks/add-user-authentication/.pytest_cache/README.md
repositories/cli-arena-ml-fastapi-e/tasks/add-user-authentication/tests/test_comprehensive_auth.py
repositories/cli-arena-mobile-b/README.md
repositories/cli-arena-mobile-b/.pytest_cache/README.md
repositories/cli-arena-mobile-b/setup_tests/test_environment.py
repositories/cli-arena-mobile-b/tasks/accesibility-audit/task.yaml
repositories/cli-arena-mobile-b/tasks/accesibility-audit/verify.sh
repositories/cli-arena-mobile-b/tasks/add-login-feature/task.yaml
repositories/cli-arena-mobile-b/tasks/add-login-feature/verify.sh
repositories/cli-arena-mobile-b/tasks/animated-loaded-transition/task.yaml
repositories/cli-arena-mobile-b/tasks/animated-loaded-transition/verify.sh
repositories/cli-arena-mobile-b/tasks/background-sync-worker/task.yaml
repositories/cli-arena-mobile-b/tasks/background-sync-worker/verify.sh
repositories/cli-arena-mobile-b/tasks/compose-paginated-feed/task.yaml
repositories/cli-arena-mobile-b/tasks/compose-paginated-feed/verify.sh
repositories/cli-arena-mobile-b/tasks/compose-theme-switcher/task.yaml
repositories/cli-arena-mobile-b/tasks/compose-theme-switcher/verify.sh
repositories/cli-arena-mobile-b/tasks/deep-link-routing/task.yaml
repositories/cli-arena-mobile-b/tasks/deep-link-routing/verify.sh
repositories/cli-arena-mobile-b/tasks/offline-mode-banner/task.yaml
repositories/cli-arena-mobile-b/tasks/offline-mode-banner/verify.sh
repositories/cli-arena-mobile-b/tasks/room-cache-integration/task.yaml
repositories/cli-arena-mobile-b/tasks/room-cache-integration/verify.sh
repositories/cli-arena-mobile-b/tasks/scroll-position-restore/task.yaml
repositories/cli-arena-mobile-b/tasks/scroll-position-restore/verify.sh
repositories/cli-arena-mobile-b/tasks/state-preservation/task.yaml
repositories/cli-arena-mobile-b/tasks/state-preservation/verify.sh
repositories/cli-arena-mobile-b/tests/unit/test_arithmetic.py
repositories/cli-arena-mobile-expo-a/AGENTS.md
repositories/cli-arena-mobile-expo-a/README.md
repositories/cli-arena-mobile-expo-a/.pytest_cache/README.md
repositories/cli-arena-mobile-expo-a/tasks/cli-async-background-jobs/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-async-background-jobs/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-batched-push-handler/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-batched-push-handler/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-cross-platform-uploads/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-cross-platform-uploads/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-cross-platform-uploads/.pytest_cache/README.md
repositories/cli-arena-mobile-expo-a/tasks/cli-graphql-subscriber/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-graphql-subscriber/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-localized-error-capture/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-localized-error-capture/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-metadata-transformer/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-metadata-transformer/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-multi-tenant-login/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-multi-tenant-login/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-offline-form-replayer/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-offline-form-replayer/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-offline-user-sync/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-offline-user-sync/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-secure-token-storage/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-secure-token-storage/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-session-timeout-manager/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-session-timeout-manager/verify.sh
repositories/cli-arena-mobile-expo-a/tasks/cli-user-location-audit/task.yaml
repositories/cli-arena-mobile-expo-a/tasks/cli-user-location-audit/verify.sh
repositories/cli-arena-mobile-expo-a/tests/unit/test_arithmetic.py
repositories/cli-arena-web-nextjs-a/.aider.chat.history.md
repositories/cli-arena-web-nextjs-a/README.md
repositories/cli-arena-web-nextjs-a/.pytest_cache/README.md
repositories/cli-arena-web-nextjs-a/server/websocket-server.py
repositories/cli-arena-web-nextjs-a/tasks/analytics-dashboard/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/analytics-dashboard/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/audit-logging/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/audit-logging/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/ci-cd-caching/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/ci-cd-caching/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/db-schema-introspection-cli/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/db-schema-introspection-cli/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/dynamic-sitemap/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/dynamic-sitemap/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/file-upload-s3/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/file-upload-s3/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/github-oauth/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/github-oauth/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/graphql-support/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/graphql-support/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/openai-summarizer/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/openai-summarizer/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/rate-limiting-middleware/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/rate-limiting-middleware/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/refactor-monolithic-api/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/refactor-monolithic-api/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/stripe-subscriptions/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/stripe-subscriptions/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/two-factor-auth/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/two-factor-auth/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/unused-imports-linter/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/unused-imports-linter/verify.sh
repositories/cli-arena-web-nextjs-a/tasks/websocket-chat/task.yaml
repositories/cli-arena-web-nextjs-a/tasks/websocket-chat/verify.sh
repositories/cli-arena-web-nextjs-a/tests/unit/test_arithmetic.py
repositories/cli-arena-web-nextjs-b/.pytest_cache/README.md
repositories/cli-arena-web-nextjs-b/docs/architecture.md
repositories/cli-arena-web-nextjs-b/tasks/carbon-isotope-fingerprinting/README.md
repositories/cli-arena-web-nextjs-b/tasks/carbon-isotope-fingerprinting/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/carbon-isotope-fingerprinting/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/chess-game-validation/README.md
repositories/cli-arena-web-nextjs-b/tasks/chess-game-validation/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/chess-game-validation/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/ecommerce-unique/README.md
repositories/cli-arena-web-nextjs-b/tasks/ecommerce-unique/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/ecommerce-unique/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/economy-growth/README.md
repositories/cli-arena-web-nextjs-b/tasks/economy-growth/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/economy-growth/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/filter-bag-tech/README.md
repositories/cli-arena-web-nextjs-b/tasks/filter-bag-tech/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/filter-bag-tech/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/geometry/README.md
repositories/cli-arena-web-nextjs-b/tasks/geometry/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/geometry/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/geometry-solver/README.md
repositories/cli-arena-web-nextjs-b/tasks/geometry-solver/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/geometry-solver/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/hotel-management-system/README.md
repositories/cli-arena-web-nextjs-b/tasks/hotel-management-system/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/hotel-management-system/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/improve_barcode_validation/README.md
repositories/cli-arena-web-nextjs-b/tasks/improve_barcode_validation/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/improve_barcode_validation/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/item-bidding/README.md
repositories/cli-arena-web-nextjs-b/tasks/item-bidding/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/item-bidding/verify.sh
repositories/cli-arena-web-nextjs-b/tasks/payment-processing/README.md
repositories/cli-arena-web-nextjs-b/tasks/payment-processing/task.yaml
repositories/cli-arena-web-nextjs-b/tasks/payment-processing/verify.sh
repositories/cli-arena-web-nextjs-b/tests/unit/test_arithmetic.py
repositories/sanity_test/.aider.chat.history.md
repositories/sanity_test/test_fixed_parser.py
repositories/sanity_test/test_parser.py
repositories/sanity_test/.pytest_cache/README.md
repositories/sanity_test/tasks/sane/task.yaml
repositories/sanity_test/tasks/sane/verify.sh
repositories/sanity_test/tasks/sane/.pytest_cache/README.md
repositories/sanity_test/tasks/test_masking/task.yaml
repositories/sanity_test/tasks/test_masking/verify.sh
repositories/simple_test/tasks/hello/task.yaml
repositories/simple_test/tasks/hello/verify.sh
repositories/test_simple_fix/main.py
repositories/test_simple_fix/tasks/add_function/task.yaml
repositories/test_simple_fix/tasks/add_function/verify.sh
scripts/add_canary_string.py
scripts/configure_logging.py
scripts/generate_simulated_results.py
scripts/monitor_failures.py
scripts/update_leaderboard.py
scripts_bash/check-canary.sh
scripts_bash/launch-interactive-container.sh
scripts_bash/run-harness.sh
scripts_bash/setup-docker-images.sh
scripts_bash/setup_api_key.sh
scripts_bash/test-modified-tasks.sh
scripts_bash/upload-base-images.sh
scripts_python/add_missing_tests.py
scripts_python/add_os_info_to_tasks.py
scripts_python/combine_outputs.py
scripts_python/create_cli_arena_verification.py
scripts_python/create_functional_verification.py
scripts_python/create_intelligent_verification_scripts.py
scripts_python/create_missing_task_yaml.py
scripts_python/create_solution_specific_verification.py
scripts_python/create_terminal_bench_style_verification.py
scripts_python/create_truly_comprehensive_tests.py
scripts_python/create_ultra_comprehensive_verification.py
scripts_python/fix_all_verification_scripts.py
scripts_python/fix_test_suite.py
scripts_python/fix_yaml_syntax.py
scripts_python/generate_comprehensive_tests.py
scripts_python/package_test.py
scripts_python/run_comprehensive_evaluation.py
scripts_python/run_harness.py
scripts_python/update_dockerfile_agents.py
scripts_python/validate_python_310.py
test_enhanced_verify/compare_verification.py
tests/__init__.py
tests/test_harness_fix.py
tests/test_recording_integration.py
tests/integration/test_agent_script.py
tests/integration/test_all_repositories.py
tests/integration/test_all_repositories_comprehensive.py
tests/integration/test_enhanced_harness.py
tests/integration/test_enhanced_harness_comprehensive.py
tests/integration/test_enhanced_harness_simple.py
tests/integration/test_simple_harness.py
tests/integration/test_working_harness.py
tests/runtime/terminal/test_tmux_session.py
tests/unit/models/test_harness_models.py
tests/unit/oracle/test_oracle_agent.py
tests/unit/parsers/__init__.py
tests/unit/parsers/test_pytest_parser.py
tests/unit/terminal/test_terminal.py
utils/__init__.py
utils/config_utils.py
utils/docker_utils.py
utils/interaction_logger.py
utils/logging_utils.py
utils/metrics_utils.py
utils/terminal_manager.py
utils/tmux_session.py