.gitattributes
.gitignore
.mintignore
.mintlifyignore
CODE_OF_CONDUCT.md
CONTRIBUTING.md
LICENSE
MANIFEST.in
README.md
docs.json
pyproject.toml
requirements.txt
benchmarks/ale/README.md
benchmarks/ale/config.yaml
benchmarks/ale/handler.py
benchmarks/ale/requirements.txt
benchmarks/ale/runner.py
benchmarks/ale/ALE-Bench/CONTRIBUTING.md
benchmarks/ale/ALE-Bench/README.md
benchmarks/ale/ALE-Bench/docs/README.md
benchmarks/ale/ALE-Bench/docs/aws_evaluation.md
benchmarks/ale/ALE-Bench/docs/evaluation.md
benchmarks/ale/ALE-Bench/docs/mcp_server.md
benchmarks/ale/ALE-Bench/docs/rating_and_ranking.md
benchmarks/ale/ALE-Bench/docs/session_object.md
benchmarks/ale/ALE-Bench/llm_configs/claude-4-opus.json
benchmarks/ale/ALE-Bench/llm_configs/claude-4-sonnet.json
benchmarks/ale/ALE-Bench/llm_configs/claude-4.1-opus.json
benchmarks/ale/ALE-Bench/llm_configs/claude-4.5-haiku.json
benchmarks/ale/ALE-Bench/llm_configs/claude-4.5-opus.json
benchmarks/ale/ALE-Bench/llm_configs/claude-4.5-sonnet.json
benchmarks/ale/ALE-Bench/llm_configs/codestral-2508.json
benchmarks/ale/ALE-Bench/llm_configs/deepseek-r1-0528.json
benchmarks/ale/ALE-Bench/llm_configs/deepseek-v3.1-terminus.json
benchmarks/ale/ALE-Bench/llm_configs/deepseek-v3.1.json
benchmarks/ale/ALE-Bench/llm_configs/deepseek-v3.2.json
benchmarks/ale/ALE-Bench/llm_configs/gemini-2.5-flash-lite-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/gemini-2.5-flash-lite.json
benchmarks/ale/ALE-Bench/llm_configs/gemini-2.5-flash-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/gemini-2.5-flash.json
benchmarks/ale/ALE-Bench/llm_configs/gemini-2.5-pro-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/gemini-3-pro-preview-high.json
benchmarks/ale/ALE-Bench/llm_configs/gemini-3-pro-preview-low.json
benchmarks/ale/ALE-Bench/llm_configs/glm-4.5.json
benchmarks/ale/ALE-Bench/llm_configs/glm-4.6.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-4.1.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5-mini-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5-mini.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5-nano-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5-nano.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5.1-codex-high.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5.1-codex-max-high.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5.1-codex-max-xhigh.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5.1-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-5.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-oss-120b.json
benchmarks/ale/ALE-Bench/llm_configs/gpt-oss-20b.json
benchmarks/ale/ALE-Bench/llm_configs/grok-4.1-fast.json
benchmarks/ale/ALE-Bench/llm_configs/grok-4.json
benchmarks/ale/ALE-Bench/llm_configs/grok-code-fast-1.json
benchmarks/ale/ALE-Bench/llm_configs/kimi-k2-0905.json
benchmarks/ale/ALE-Bench/llm_configs/kimi-k2-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/kimi-k2.json
benchmarks/ale/ALE-Bench/llm_configs/llama-4-maverick.json
benchmarks/ale/ALE-Bench/llm_configs/mistral-large-3-2512.json
benchmarks/ale/ALE-Bench/llm_configs/mistral-medium-3.1.json
benchmarks/ale/ALE-Bench/llm_configs/nova-2-lite-v1.json
benchmarks/ale/ALE-Bench/llm_configs/nova-premier-v1.json
benchmarks/ale/ALE-Bench/llm_configs/o3-high.json
benchmarks/ale/ALE-Bench/llm_configs/o4-mini-high.json
benchmarks/ale/ALE-Bench/llm_configs/qwen3-2507-thinking.json
benchmarks/ale/ALE-Bench/llm_configs/qwen3-coder-plus.json
benchmarks/ale/ALE-Bench/llm_configs/qwen3-coder.json
benchmarks/ale/ALE-Bench/llm_configs/qwen3-max.json
benchmarks/ale/ALE-Bench/llm_configs/qwen3-next-thinking.json
benchmarks/ale/ALE-Bench/tests/judge/inputs/ahc001.txt
benchmarks/ale/ALE-Bench/tests/judge/inputs/ahc003.txt
benchmarks/ale/data/experiment_data/ahc002_context.txt
benchmarks/ale/data/experiment_data/ahc005_context.txt
benchmarks/ale/data/experiment_data/ahc006_context.txt
benchmarks/mle/README.md
benchmarks/mle/config.yaml
benchmarks/mle/handler.py
benchmarks/mle/requirements.txt
benchmarks/mle/runner.py
benchmarks/mle/data/kg_data.json
benchmarks/mle/mle-bench/.pre-commit-config.yaml
benchmarks/mle/mle-bench/README.md
benchmarks/mle/mle-bench/SECURITY.md
benchmarks/mle/mle-bench/agents/README.md
benchmarks/mle/mle-bench/agents/aide/additional_notes.txt
benchmarks/mle/mle-bench/agents/aide/config.yaml
benchmarks/mle/mle-bench/agents/aide/requirements.txt
benchmarks/mle/mle-bench/agents/dummy/config.yaml
benchmarks/mle/mle-bench/agents/dummy/requirements.txt
benchmarks/mle/mle-bench/agents/mlagentbench/additional_notes.txt
benchmarks/mle/mle-bench/agents/mlagentbench/config.yaml
benchmarks/mle/mle-bench/agents/mlagentbench/requirements.txt
benchmarks/mle/mle-bench/agents/mlagentbench/benchmark_dir/scripts/research_problem.txt
benchmarks/mle/mle-bench/agents/opendevin/config.yaml
benchmarks/mle/mle-bench/environment/instructions.txt
benchmarks/mle/mle-bench/environment/instructions_obfuscated.txt
benchmarks/mle/mle-bench/environment/requirements.txt
benchmarks/mle/mle-bench/environment/config/container_configs/default.json
benchmarks/mle/mle-bench/examples/README.md
benchmarks/mle/mle-bench/experiments/familiarity/README.md
benchmarks/mle/mle-bench/experiments/familiarity/comps_to_urls.json
benchmarks/mle/mle-bench/experiments/familiarity/requirements.txt
benchmarks/mle/mle-bench/experiments/splits/dev.txt
benchmarks/mle/mle-bench/experiments/splits/high.txt
benchmarks/mle/mle-bench/experiments/splits/low.txt
benchmarks/mle/mle-bench/experiments/splits/medium.txt
benchmarks/mle/mle-bench/experiments/splits/spaceship-titanic.txt
benchmarks/mle/mle-bench/experiments/splits/split75.txt
benchmarks/mle/mle-bench/experiments/splits/systemcard.txt
benchmarks/mle/mle-bench/extras/README.md
benchmarks/mle/mle-bench/extras/plagiarism_detector/package-lock.json
benchmarks/mle/mle-bench/extras/plagiarism_detector/package.json
benchmarks/mle/mle-bench/mlebench.egg-info/SOURCES.txt
benchmarks/mle/mle-bench/mlebench.egg-info/dependency_links.txt
benchmarks/mle/mle-bench/mlebench.egg-info/entry_points.txt
benchmarks/mle/mle-bench/mlebench.egg-info/requires.txt
benchmarks/mle/mle-bench/mlebench.egg-info/top_level.txt
benchmarks/mle/mle-bench/mlebench/competitions/3d-object-detection-for-autonomous-vehicles/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/3d-object-detection-for-autonomous-vehicles/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/3d-object-detection-for-autonomous-vehicles/description.md
benchmarks/mle/mle-bench/mlebench/competitions/3d-object-detection-for-autonomous-vehicles/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/3d-object-detection-for-autonomous-vehicles/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/AI4Code/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/AI4Code/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/AI4Code/description.md
benchmarks/mle/mle-bench/mlebench/competitions/AI4Code/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/AI4Code/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/aerial-cactus-identification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/aerial-cactus-identification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/aerial-cactus-identification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/aerial-cactus-identification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/aerial-cactus-identification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/alaska2-image-steganalysis/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/alaska2-image-steganalysis/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/alaska2-image-steganalysis/description.md
benchmarks/mle/mle-bench/mlebench/competitions/alaska2-image-steganalysis/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/alaska2-image-steganalysis/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/aptos2019-blindness-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/aptos2019-blindness-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/aptos2019-blindness-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/aptos2019-blindness-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/aptos2019-blindness-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/billion-word-imputation/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/billion-word-imputation/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/billion-word-imputation/description.md
benchmarks/mle/mle-bench/mlebench/competitions/billion-word-imputation/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/billion-word-imputation/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/bms-molecular-translation/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/bms-molecular-translation/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/bms-molecular-translation/description.md
benchmarks/mle/mle-bench/mlebench/competitions/bms-molecular-translation/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/bms-molecular-translation/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/cassava-leaf-disease-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/cassava-leaf-disease-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/cassava-leaf-disease-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/cassava-leaf-disease-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/cassava-leaf-disease-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/cdiscount-image-classification-challenge/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/cdiscount-image-classification-challenge/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/cdiscount-image-classification-challenge/description.md
benchmarks/mle/mle-bench/mlebench/competitions/cdiscount-image-classification-challenge/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/cdiscount-image-classification-challenge/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/chaii-hindi-and-tamil-question-answering/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/chaii-hindi-and-tamil-question-answering/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/chaii-hindi-and-tamil-question-answering/description.md
benchmarks/mle/mle-bench/mlebench/competitions/chaii-hindi-and-tamil-question-answering/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/chaii-hindi-and-tamil-question-answering/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/champs-scalar-coupling/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/champs-scalar-coupling/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/champs-scalar-coupling/description.md
benchmarks/mle/mle-bench/mlebench/competitions/champs-scalar-coupling/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/champs-scalar-coupling/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/denoising-dirty-documents/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/denoising-dirty-documents/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/denoising-dirty-documents/description.md
benchmarks/mle/mle-bench/mlebench/competitions/denoising-dirty-documents/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/denoising-dirty-documents/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/detecting-insults-in-social-commentary/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/detecting-insults-in-social-commentary/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/detecting-insults-in-social-commentary/description.md
benchmarks/mle/mle-bench/mlebench/competitions/detecting-insults-in-social-commentary/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/detecting-insults-in-social-commentary/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/dog-breed-identification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/dog-breed-identification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/dog-breed-identification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/dog-breed-identification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/dog-breed-identification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/dogs-vs-cats-redux-kernels-edition/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/dogs-vs-cats-redux-kernels-edition/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/dogs-vs-cats-redux-kernels-edition/description.md
benchmarks/mle/mle-bench/mlebench/competitions/dogs-vs-cats-redux-kernels-edition/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/dogs-vs-cats-redux-kernels-edition/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/facebook-recruiting-iii-keyword-extraction/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/facebook-recruiting-iii-keyword-extraction/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/facebook-recruiting-iii-keyword-extraction/description.md
benchmarks/mle/mle-bench/mlebench/competitions/facebook-recruiting-iii-keyword-extraction/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/facebook-recruiting-iii-keyword-extraction/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/freesound-audio-tagging-2019/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/freesound-audio-tagging-2019/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/freesound-audio-tagging-2019/description.md
benchmarks/mle/mle-bench/mlebench/competitions/freesound-audio-tagging-2019/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/freesound-audio-tagging-2019/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/google-quest-challenge/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/google-quest-challenge/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/google-quest-challenge/description.md
benchmarks/mle/mle-bench/mlebench/competitions/google-quest-challenge/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/google-quest-challenge/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/google-research-identify-contrails-reduce-global-warming/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/google-research-identify-contrails-reduce-global-warming/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/google-research-identify-contrails-reduce-global-warming/description.md
benchmarks/mle/mle-bench/mlebench/competitions/google-research-identify-contrails-reduce-global-warming/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/google-research-identify-contrails-reduce-global-warming/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/h-and-m-personalized-fashion-recommendations/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/h-and-m-personalized-fashion-recommendations/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/h-and-m-personalized-fashion-recommendations/description.md
benchmarks/mle/mle-bench/mlebench/competitions/h-and-m-personalized-fashion-recommendations/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/h-and-m-personalized-fashion-recommendations/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2020-fgvc7/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2020-fgvc7/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2020-fgvc7/description.md
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2020-fgvc7/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2020-fgvc7/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2021-fgvc8/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2021-fgvc8/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2021-fgvc8/description.md
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2021-fgvc8/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2021-fgvc8/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2022-fgvc9/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2022-fgvc9/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2022-fgvc9/description.md
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2022-fgvc9/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/herbarium-2022-fgvc9/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/histopathologic-cancer-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/histopathologic-cancer-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/histopathologic-cancer-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/histopathologic-cancer-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/histopathologic-cancer-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/hms-harmful-brain-activity-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/hms-harmful-brain-activity-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/hms-harmful-brain-activity-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/hms-harmful-brain-activity-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/hms-harmful-brain-activity-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/hotel-id-2021-fgvc8/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/hotel-id-2021-fgvc8/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/hotel-id-2021-fgvc8/description.md
benchmarks/mle/mle-bench/mlebench/competitions/hotel-id-2021-fgvc8/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/hotel-id-2021-fgvc8/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/hubmap-kidney-segmentation/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/hubmap-kidney-segmentation/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/hubmap-kidney-segmentation/description.md
benchmarks/mle/mle-bench/mlebench/competitions/hubmap-kidney-segmentation/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/hubmap-kidney-segmentation/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/icecube-neutrinos-in-deep-ice/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/icecube-neutrinos-in-deep-ice/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/icecube-neutrinos-in-deep-ice/description.md
benchmarks/mle/mle-bench/mlebench/competitions/icecube-neutrinos-in-deep-ice/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/icecube-neutrinos-in-deep-ice/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/imet-2020-fgvc7/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/imet-2020-fgvc7/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/imet-2020-fgvc7/description.md
benchmarks/mle/mle-bench/mlebench/competitions/imet-2020-fgvc7/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/imet-2020-fgvc7/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/inaturalist-2019-fgvc6/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/inaturalist-2019-fgvc6/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/inaturalist-2019-fgvc6/description.md
benchmarks/mle/mle-bench/mlebench/competitions/inaturalist-2019-fgvc6/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/inaturalist-2019-fgvc6/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/invasive-species-monitoring/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/invasive-species-monitoring/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/invasive-species-monitoring/description.md
benchmarks/mle/mle-bench/mlebench/competitions/invasive-species-monitoring/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/invasive-species-monitoring/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2019-fgvc6/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2019-fgvc6/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2019-fgvc6/description.md
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2019-fgvc6/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2019-fgvc6/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2020-fgvc7/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2020-fgvc7/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2020-fgvc7/description.md
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2020-fgvc7/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/iwildcam-2020-fgvc7/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-toxic-comment-classification-challenge/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-toxic-comment-classification-challenge/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-toxic-comment-classification-challenge/description.md
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-toxic-comment-classification-challenge/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-toxic-comment-classification-challenge/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-unintended-bias-in-toxicity-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-unintended-bias-in-toxicity-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-unintended-bias-in-toxicity-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-unintended-bias-in-toxicity-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/jigsaw-unintended-bias-in-toxicity-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/kuzushiji-recognition/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/kuzushiji-recognition/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/kuzushiji-recognition/description.md
benchmarks/mle/mle-bench/mlebench/competitions/kuzushiji-recognition/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/kuzushiji-recognition/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/leaf-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/leaf-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/leaf-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/leaf-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/leaf-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/learning-agency-lab-automated-essay-scoring-2/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/learning-agency-lab-automated-essay-scoring-2/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/learning-agency-lab-automated-essay-scoring-2/description.md
benchmarks/mle/mle-bench/mlebench/competitions/learning-agency-lab-automated-essay-scoring-2/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/learning-agency-lab-automated-essay-scoring-2/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/lmsys-chatbot-arena/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/lmsys-chatbot-arena/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/lmsys-chatbot-arena/description.md
benchmarks/mle/mle-bench/mlebench/competitions/lmsys-chatbot-arena/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/lmsys-chatbot-arena/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/ml2021spring-hw2/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/ml2021spring-hw2/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/ml2021spring-hw2/description.md
benchmarks/mle/mle-bench/mlebench/competitions/ml2021spring-hw2/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/ml2021spring-hw2/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/mlsp-2013-birds/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/mlsp-2013-birds/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/mlsp-2013-birds/description.md
benchmarks/mle/mle-bench/mlebench/competitions/mlsp-2013-birds/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/mlsp-2013-birds/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/movie-review-sentiment-analysis-kernels-only/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/movie-review-sentiment-analysis-kernels-only/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/movie-review-sentiment-analysis-kernels-only/description.md
benchmarks/mle/mle-bench/mlebench/competitions/movie-review-sentiment-analysis-kernels-only/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/movie-review-sentiment-analysis-kernels-only/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/multi-modal-gesture-recognition/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/multi-modal-gesture-recognition/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/multi-modal-gesture-recognition/description.md
benchmarks/mle/mle-bench/mlebench/competitions/multi-modal-gesture-recognition/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/multi-modal-gesture-recognition/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/multi-modal-gesture-recognition/leaderboard_readme.md
benchmarks/mle/mle-bench/mlebench/competitions/new-york-city-taxi-fare-prediction/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/new-york-city-taxi-fare-prediction/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/new-york-city-taxi-fare-prediction/description.md
benchmarks/mle/mle-bench/mlebench/competitions/new-york-city-taxi-fare-prediction/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/new-york-city-taxi-fare-prediction/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/nfl-player-contact-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/nfl-player-contact-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/nfl-player-contact-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/nfl-player-contact-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/nfl-player-contact-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/nomad2018-predict-transparent-conductors/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/nomad2018-predict-transparent-conductors/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/nomad2018-predict-transparent-conductors/description.md
benchmarks/mle/mle-bench/mlebench/competitions/nomad2018-predict-transparent-conductors/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/nomad2018-predict-transparent-conductors/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/osic-pulmonary-fibrosis-progression/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/osic-pulmonary-fibrosis-progression/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/osic-pulmonary-fibrosis-progression/description.md
benchmarks/mle/mle-bench/mlebench/competitions/osic-pulmonary-fibrosis-progression/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/osic-pulmonary-fibrosis-progression/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/paddy-disease-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/paddy-disease-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/paddy-disease-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/paddy-disease-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/paddy-disease-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/petfinder-pawpularity-score/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/petfinder-pawpularity-score/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/petfinder-pawpularity-score/description.md
benchmarks/mle/mle-bench/mlebench/competitions/petfinder-pawpularity-score/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/petfinder-pawpularity-score/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2020-fgvc7/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2020-fgvc7/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2020-fgvc7/description.md
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2020-fgvc7/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2020-fgvc7/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2021-fgvc8/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2021-fgvc8/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2021-fgvc8/description.md
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2021-fgvc8/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/plant-pathology-2021-fgvc8/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/plant-seedlings-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/plant-seedlings-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/plant-seedlings-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/plant-seedlings-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/plant-seedlings-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/playground-series-s3e18/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/playground-series-s3e18/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/playground-series-s3e18/description.md
benchmarks/mle/mle-bench/mlebench/competitions/playground-series-s3e18/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/playground-series-s3e18/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/predict-volcanic-eruptions-ingv-oe/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/predict-volcanic-eruptions-ingv-oe/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/predict-volcanic-eruptions-ingv-oe/description.md
benchmarks/mle/mle-bench/mlebench/competitions/predict-volcanic-eruptions-ingv-oe/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/predict-volcanic-eruptions-ingv-oe/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/random-acts-of-pizza/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/random-acts-of-pizza/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/random-acts-of-pizza/description.md
benchmarks/mle/mle-bench/mlebench/competitions/random-acts-of-pizza/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/random-acts-of-pizza/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/ranzcr-clip-catheter-line-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/ranzcr-clip-catheter-line-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/ranzcr-clip-catheter-line-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/ranzcr-clip-catheter-line-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/ranzcr-clip-catheter-line-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/rsna-2022-cervical-spine-fracture-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/rsna-2022-cervical-spine-fracture-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/rsna-2022-cervical-spine-fracture-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/rsna-2022-cervical-spine-fracture-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/rsna-2022-cervical-spine-fracture-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/rsna-breast-cancer-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/rsna-breast-cancer-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/rsna-breast-cancer-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/rsna-breast-cancer-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/rsna-breast-cancer-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/rsna-miccai-brain-tumor-radiogenomic-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/rsna-miccai-brain-tumor-radiogenomic-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/rsna-miccai-brain-tumor-radiogenomic-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/rsna-miccai-brain-tumor-radiogenomic-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/rsna-miccai-brain-tumor-radiogenomic-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/seti-breakthrough-listen/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/seti-breakthrough-listen/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/seti-breakthrough-listen/description.md
benchmarks/mle/mle-bench/mlebench/competitions/seti-breakthrough-listen/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/seti-breakthrough-listen/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/siim-covid19-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/siim-covid19-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/siim-covid19-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/siim-covid19-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/siim-covid19-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/siim-isic-melanoma-classification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/siim-isic-melanoma-classification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/siim-isic-melanoma-classification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/siim-isic-melanoma-classification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/siim-isic-melanoma-classification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/smartphone-decimeter-2022/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/smartphone-decimeter-2022/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/smartphone-decimeter-2022/description.md
benchmarks/mle/mle-bench/mlebench/competitions/smartphone-decimeter-2022/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/smartphone-decimeter-2022/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/spaceship-titanic/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/spaceship-titanic/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/spaceship-titanic/description.md
benchmarks/mle/mle-bench/mlebench/competitions/spaceship-titanic/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/spaceship-titanic/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/spooky-author-identification/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/spooky-author-identification/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/spooky-author-identification/description.md
benchmarks/mle/mle-bench/mlebench/competitions/spooky-author-identification/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/spooky-author-identification/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/stanford-covid-vaccine/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/stanford-covid-vaccine/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/stanford-covid-vaccine/description.md
benchmarks/mle/mle-bench/mlebench/competitions/stanford-covid-vaccine/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/stanford-covid-vaccine/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/statoil-iceberg-classifier-challenge/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/statoil-iceberg-classifier-challenge/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/statoil-iceberg-classifier-challenge/description.md
benchmarks/mle/mle-bench/mlebench/competitions/statoil-iceberg-classifier-challenge/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/statoil-iceberg-classifier-challenge/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-dec-2021/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-dec-2021/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-dec-2021/description.md
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-dec-2021/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-dec-2021/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-may-2022/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-may-2022/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-may-2022/description.md
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-may-2022/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/tabular-playground-series-may-2022/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow-speech-recognition-challenge/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow-speech-recognition-challenge/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow-speech-recognition-challenge/description.md
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow-speech-recognition-challenge/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow-speech-recognition-challenge/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow2-question-answering/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow2-question-answering/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow2-question-answering/description.md
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow2-question-answering/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/tensorflow2-question-answering/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-english-language/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-english-language/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-english-language/description.md
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-english-language/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-english-language/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-russian-language/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-russian-language/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-russian-language/description.md
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-russian-language/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/text-normalization-challenge-russian-language/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/tgs-salt-identification-challenge/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tgs-salt-identification-challenge/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tgs-salt-identification-challenge/description.md
benchmarks/mle/mle-bench/mlebench/competitions/tgs-salt-identification-challenge/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/tgs-salt-identification-challenge/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/the-icml-2013-whale-challenge-right-whale-redux/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/the-icml-2013-whale-challenge-right-whale-redux/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/the-icml-2013-whale-challenge-right-whale-redux/description.md
benchmarks/mle/mle-bench/mlebench/competitions/the-icml-2013-whale-challenge-right-whale-redux/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/the-icml-2013-whale-challenge-right-whale-redux/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/tweet-sentiment-extraction/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tweet-sentiment-extraction/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/tweet-sentiment-extraction/description.md
benchmarks/mle/mle-bench/mlebench/competitions/tweet-sentiment-extraction/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/tweet-sentiment-extraction/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/us-patent-phrase-to-phrase-matching/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/us-patent-phrase-to-phrase-matching/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/us-patent-phrase-to-phrase-matching/description.md
benchmarks/mle/mle-bench/mlebench/competitions/us-patent-phrase-to-phrase-matching/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/us-patent-phrase-to-phrase-matching/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/uw-madison-gi-tract-image-segmentation/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/uw-madison-gi-tract-image-segmentation/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/uw-madison-gi-tract-image-segmentation/description.md
benchmarks/mle/mle-bench/mlebench/competitions/uw-madison-gi-tract-image-segmentation/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/uw-madison-gi-tract-image-segmentation/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/ventilator-pressure-prediction/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/ventilator-pressure-prediction/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/ventilator-pressure-prediction/description.md
benchmarks/mle/mle-bench/mlebench/competitions/ventilator-pressure-prediction/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/ventilator-pressure-prediction/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/vesuvius-challenge-ink-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/vesuvius-challenge-ink-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/vesuvius-challenge-ink-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/vesuvius-challenge-ink-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/vesuvius-challenge-ink-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/vinbigdata-chest-xray-abnormalities-detection/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/vinbigdata-chest-xray-abnormalities-detection/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/vinbigdata-chest-xray-abnormalities-detection/description.md
benchmarks/mle/mle-bench/mlebench/competitions/vinbigdata-chest-xray-abnormalities-detection/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/vinbigdata-chest-xray-abnormalities-detection/kernels.txt
benchmarks/mle/mle-bench/mlebench/competitions/whale-categorization-playground/checksums.yaml
benchmarks/mle/mle-bench/mlebench/competitions/whale-categorization-playground/config.yaml
benchmarks/mle/mle-bench/mlebench/competitions/whale-categorization-playground/description.md
benchmarks/mle/mle-bench/mlebench/competitions/whale-categorization-playground/description_obfuscated.md
benchmarks/mle/mle-bench/mlebench/competitions/whale-categorization-playground/kernels.txt
benchmarks/mle/mle-bench/runs/README.md
benchmarks/mle/mle-bench/runs/2024-09-06T18-25-55-UTC_run-group_aide/2024-09-19T20-07-15-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-07T22-33-09-UTC_run-group_mlagentbench/2024-09-19T20-13-10-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-07T22-34-42-UTC_run-group_aide/2024-09-19T20-23-08-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-08T07-58-11-UTC_run-group_aide/2024-09-19T20-50-11-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-08T08-00-07-UTC_run-group_aide/2024-09-19T20-52-52-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-09T16-13-51-UTC_run-group_aide/2024-09-19T20-54-35-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-09T17-26-54-UTC_run-group_aide/2024-09-19T20-56-43-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-09T21-21-33-UTC_run-group_aide/2024-09-19T21-03-13-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-11T09-34-00-UTC_run-group_aide/2024-09-19T21-03-18-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-11T21-57-50-UTC_run-group_aide/2024-09-19T21-16-52-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-12T12-30-57-UTC_run-group_aide/2024-09-19T21-26-17-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-12T13-52-30-UTC_run-group_mlagentbench/2024-09-19T21-31-49-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-12T21-14-22-UTC_run-group_aide/2024-09-19T21-34-18-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-13T13-45-35-UTC_run-group_aide/2024-09-19T21-40-03-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-14T11-15-57-UTC_run-group_aide/2024-09-19T21-50-06-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-16T14-45-05-UTC_run-group_aide/2024-09-19T21-55-27-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-16T16-59-30-UTC_run-group_opendevin/2024-09-19T21-55-55-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-16T19-44-41-UTC_run-group_mlagentbench/2024-09-19T23-44-06-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-18T18-21-42-GMT_run-group_aide/2024-09-20T21-46-50-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-18T20-49-38-UTC_run-group_opendevin/2024-09-20T21-51-54-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-19T04-36-44-GMT_run-group_aide/2024-09-21T00-22-42-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-19T21-48-46-GMT_run-group_aide/2024-09-22T18-05-17-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-19T23-54-38-GMT_run-group_aide/2024-09-21T22-57-13-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-20T23-52-25-GMT_run-group_aide/2024-09-22T14-26-08-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-21T00-10-06-GMT_run-group_aide/2024-09-22T14-26-59-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-21T00-10-41-GMT_run-group_aide/2024-09-22T14-23-11-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-21T19-39-16-GMT_run-group_aide/2024-09-23T17-44-13-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-22T16-12-47-GMT_run-group_aide/2024-09-24T13-54-59-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-22T17-15-19-GMT_run-group_aide/2024-09-24T13-55-43-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_0.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_1.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_10.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_100.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_11.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_12.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_13.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_14.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_15.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_16.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_17.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_18.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_19.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_2.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_20.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_21.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_22.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_23.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_24.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_25.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_26.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_27.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_28.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_29.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_3.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_30.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_31.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_32.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_33.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_34.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_35.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_36.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_37.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_38.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_39.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_4.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_40.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_41.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_42.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_43.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_44.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_45.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_46.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_47.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_48.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_49.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_5.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_50.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_51.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_52.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_53.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_54.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_55.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_56.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_57.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_58.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_59.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_6.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_60.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_61.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_62.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_63.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_64.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_65.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_66.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_67.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_68.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_69.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_7.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_70.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_71.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_72.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_73.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_74.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_75.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_76.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_77.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_78.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_79.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_8.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_80.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_81.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_82.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_83.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_84.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_85.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_86.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_87.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_88.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_89.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_9.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_90.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_91.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_92.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_93.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_94.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_95.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_96.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_97.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_98.json
benchmarks/mle/mle-bench/runs/2024-09-23T14-55-33-GMT_run-group_aide/hourly/grading_report_99.json
benchmarks/mle/mle-bench/runs/2024-09-23T15-10-54-GMT_run-group_opendevin/2024-09-27T10-32-10-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-24T01-12-14-GMT_run-group_aide/2024-09-26T09-03-59-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-24T22-00-20-GMT_run-group_aide/2024-09-27T10-42-15-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-25T04-20-19-GMT_run-group_aide/2024-09-27T10-44-46-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-25T04-42-50-GMT_run-group_aide/2024-09-26T09-04-52-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-09-27T17-34-13-GMT_run-group_aide/2024-10-01T07-57-25-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-03T22-46-46-GMT_run-group_aide/2024-10-08T15-25-27-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T17-35-20-GMT_run-group_aide/2024-10-08T15-26-46-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T19-08-06-GMT_run-group_aide/2024-10-08T15-28-17-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T22-37-05-GMT_run-group_aide/2024-10-08T15-28-58-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T22-43-43-GMT_run-group_mlagentbench/2024-10-08T15-29-16-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T22-43-53-GMT_run-group_opendevin/2024-10-08T15-29-24-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T22-44-59-GMT_run-group_aide/2024-10-08T15-29-37-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T22-58-46-GMT_run-group_aide/2024-10-08T15-30-00-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-04T22-59-24-GMT_run-group_aide/2024-10-08T15-30-19-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/2024-10-05T00-01-03-GMT_run-group_aide/2024-10-08T15-30-31-GMT_grading_report.json
benchmarks/mle/mle-bench/runs/Leeroo_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/Leeroo_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/Leeroo_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/aira-dojo_group1/grading_report_1.json
benchmarks/mle/mle-bench/runs/aira-dojo_group10/grading_report_10.json
benchmarks/mle/mle-bench/runs/aira-dojo_group11/grading_report_11.json
benchmarks/mle/mle-bench/runs/aira-dojo_group12/grading_report_12.json
benchmarks/mle/mle-bench/runs/aira-dojo_group13/grading_report_13.json
benchmarks/mle/mle-bench/runs/aira-dojo_group14/grading_report_14.json
benchmarks/mle/mle-bench/runs/aira-dojo_group15/grading_report_15.json
benchmarks/mle/mle-bench/runs/aira-dojo_group16/grading_report_16.json
benchmarks/mle/mle-bench/runs/aira-dojo_group17/grading_report_17.json
benchmarks/mle/mle-bench/runs/aira-dojo_group18/grading_report_18.json
benchmarks/mle/mle-bench/runs/aira-dojo_group19/grading_report_19.json
benchmarks/mle/mle-bench/runs/aira-dojo_group2/grading_report_2.json
benchmarks/mle/mle-bench/runs/aira-dojo_group20/grading_report_20.json
benchmarks/mle/mle-bench/runs/aira-dojo_group3/grading_report_3.json
benchmarks/mle/mle-bench/runs/aira-dojo_group4/grading_report_4.json
benchmarks/mle/mle-bench/runs/aira-dojo_group5/grading_report_5.json
benchmarks/mle/mle-bench/runs/aira-dojo_group6/grading_report_6.json
benchmarks/mle/mle-bench/runs/aira-dojo_group7/grading_report_7.json
benchmarks/mle/mle-bench/runs/aira-dojo_group8/grading_report_8.json
benchmarks/mle/mle-bench/runs/aira-dojo_group9/grading_report_9.json
benchmarks/mle/mle-bench/runs/famou-agent_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/famou-agent_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/famou-agent_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/famou-agent_group4/grading_report_group_4.json
benchmarks/mle/mle-bench/runs/famou-agent_group5/grading_report_group_5.json
benchmarks/mle/mle-bench/runs/famou-agent_group6/grading_report_group_6.json
benchmarks/mle/mle-bench/runs/internagent_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/internagent_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/internagent_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/mle_star_pro_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/mle_star_pro_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/mle_star_pro_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/mle_star_pro_group4/grading_report_group_4.json
benchmarks/mle/mle-bench/runs/mle_star_pro_group5/grading_report_group_5.json
benchmarks/mle/mle-bench/runs/mle_star_pro_group6/grading_report_group_6.json
benchmarks/mle/mle-bench/runs/mlmaster_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/mlmaster_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/mlmaster_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/mlmaster_group4/grading_report_group_4.json
benchmarks/mle/mle-bench/runs/mlmaster_group5/grading_report_group_5.json
benchmarks/mle/mle-bench/runs/mlmaster_group6/grading_report_group_6.json
benchmarks/mle/mle-bench/runs/neo_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/neo_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/neo_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/operand_group1/README.md
benchmarks/mle/mle-bench/runs/operand_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/operand_group2/README.md
benchmarks/mle/mle-bench/runs/operand_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/operand_group3/README.md
benchmarks/mle/mle-bench/runs/operand_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/pievolve_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/pievolve_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/pievolve_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/pievolve_group4/grading_report_group_4.json
benchmarks/mle/mle-bench/runs/pievolve_group5/grading_report_group_5.json
benchmarks/mle/mle-bench/runs/pievolve_group6/grading_report_group_6.json
benchmarks/mle/mle-bench/runs/rdagent_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/rdagent_group10/grading_report_group_10.json
benchmarks/mle/mle-bench/runs/rdagent_group11/grading_report_group_11.json
benchmarks/mle/mle-bench/runs/rdagent_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/rdagent_group3/grading_report_group_3.json
benchmarks/mle/mle-bench/runs/rdagent_group4/grading_report_group_4.json
benchmarks/mle/mle-bench/runs/rdagent_group5/grading_report_group_5.json
benchmarks/mle/mle-bench/runs/rdagent_group6/grading_report_group_6.json
benchmarks/mle/mle-bench/runs/rdagent_group7/grading_report_group_7.json
benchmarks/mle/mle-bench/runs/rdagent_group8/grading_report_group_8.json
benchmarks/mle/mle-bench/runs/rdagent_group9/grading_report_group_9.json
benchmarks/mle/mle-bench/runs/thesis_group1/grading_report_group_1.json
benchmarks/mle/mle-bench/runs/thesis_group2/grading_report_group_2.json
benchmarks/mle/mle-bench/runs/thesis_group3/grading_report_group_3.json
src/kapso/__init__.py
src/kapso/cli.py
src/kapso/config.yaml
src/kapso/kapso.py
src/kapso/core/__init__.py
src/kapso/core/config.py
src/kapso/core/llm.py
src/kapso/core/prompt_loader.py
src/kapso/deployment/__init__.py
src/kapso/deployment/base.py
src/kapso/deployment/factory.py
src/kapso/deployment/software.py
src/kapso/deployment/adapter/__init__.py
src/kapso/deployment/adapter/adaptation_prompt.txt
src/kapso/deployment/adapter/agent.py
src/kapso/deployment/adapter/validator.py
src/kapso/deployment/selector/agent.py
src/kapso/deployment/selector/correction_prompt.md
src/kapso/deployment/selector/selection_prompt.md
src/kapso/deployment/strategies/README.md
src/kapso/deployment/strategies/__init__.py
src/kapso/deployment/strategies/base.py
src/kapso/deployment/strategies/bentoml/__init__.py
src/kapso/deployment/strategies/bentoml/adapter_instruction.txt
src/kapso/deployment/strategies/bentoml/config.yaml
src/kapso/deployment/strategies/bentoml/runner.py
src/kapso/deployment/strategies/bentoml/selector_instruction.txt
src/kapso/deployment/strategies/docker/__init__.py
src/kapso/deployment/strategies/docker/adapter_instruction.txt
src/kapso/deployment/strategies/docker/config.yaml
src/kapso/deployment/strategies/docker/runner.py
src/kapso/deployment/strategies/docker/selector_instruction.txt
src/kapso/deployment/strategies/langgraph/__init__.py
src/kapso/deployment/strategies/langgraph/adapter_instruction.txt
src/kapso/deployment/strategies/langgraph/config.yaml
src/kapso/deployment/strategies/langgraph/runner.py
src/kapso/deployment/strategies/langgraph/selector_instruction.txt
src/kapso/deployment/strategies/local/__init__.py
src/kapso/deployment/strategies/local/adapter_instruction.txt
src/kapso/deployment/strategies/local/config.yaml
src/kapso/deployment/strategies/local/runner.py
src/kapso/deployment/strategies/local/selector_instruction.txt
src/kapso/deployment/strategies/modal/__init__.py
src/kapso/deployment/strategies/modal/adapter_instruction.txt
src/kapso/deployment/strategies/modal/config.yaml
src/kapso/deployment/strategies/modal/runner.py
src/kapso/deployment/strategies/modal/selector_instruction.txt
src/kapso/environment/__init__.py
src/kapso/environment/handlers/__init__.py
src/kapso/environment/handlers/base.py
src/kapso/environment/handlers/generic.py
src/kapso/execution/__init__.py
src/kapso/execution/orchestrator.py
src/kapso/execution/solution.py
src/kapso/execution/types.py
src/kapso/execution/coding_agents/README.md
src/kapso/execution/coding_agents/__init__.py
src/kapso/execution/coding_agents/agents.yaml
src/kapso/execution/coding_agents/base.py
src/kapso/execution/coding_agents/commit_message_generator.py
src/kapso/execution/coding_agents/factory.py
src/kapso/execution/coding_agents/adapters/TEMPLATE.py
src/kapso/execution/coding_agents/adapters/__init__.py
src/kapso/execution/coding_agents/adapters/aider_agent.py
src/kapso/execution/coding_agents/adapters/claude_code_agent.py
src/kapso/execution/coding_agents/adapters/gemini_agent.py
src/kapso/execution/coding_agents/adapters/openhands_agent.py
src/kapso/execution/experiment_workspace/__init__.py
src/kapso/execution/experiment_workspace/experiment_session.py
src/kapso/execution/experiment_workspace/experiment_workspace.py
src/kapso/execution/memories/__init__.py
src/kapso/execution/memories/experiment_memory/__init__.py
src/kapso/execution/memories/experiment_memory/insight_extractor.py
src/kapso/execution/memories/experiment_memory/store.py
src/kapso/execution/memories/experiment_memory/prompts/extract_error_insight.md
src/kapso/execution/memories/experiment_memory/prompts/extract_success_insight.md
src/kapso/execution/memories/repo_memory/__init__.py
src/kapso/execution/memories/repo_memory/builders.py
src/kapso/execution/memories/repo_memory/manager.py
src/kapso/execution/memories/repo_memory/observation.py
src/kapso/execution/memories/repo_memory/prompts/infer_repo_model_initial.md
src/kapso/execution/memories/repo_memory/prompts/infer_repo_model_retry.md
src/kapso/execution/memories/repo_memory/prompts/infer_repo_model_update.md
src/kapso/execution/memories/repo_memory/prompts/plan_files_to_read.md
src/kapso/execution/search_strategies/README.md
src/kapso/execution/search_strategies/__init__.py
src/kapso/execution/search_strategies/_template.py
src/kapso/execution/search_strategies/base.py
src/kapso/execution/search_strategies/benchmark_tree_search.py
src/kapso/execution/search_strategies/factory.py
src/kapso/execution/search_strategies/strategies.yaml
src/kapso/execution/search_strategies/generic/__init__.py
src/kapso/execution/search_strategies/generic/strategy.py
src/kapso/execution/search_strategies/generic/feedback_generator/__init__.py
src/kapso/execution/search_strategies/generic/feedback_generator/feedback_generator.py
src/kapso/execution/search_strategies/generic/feedback_generator/prompts/feedback_generator.md
src/kapso/execution/search_strategies/generic/prompts/coding_agent_debug.md
src/kapso/execution/search_strategies/generic/prompts/coding_agent_implement.md
src/kapso/execution/search_strategies/generic/prompts/ideation_claude_code.md
src/kapso/execution/search_strategies/generic/prompts/implementation_claude_code.md
src/kapso/gated_mcp/__init__.py
src/kapso/gated_mcp/backends.py
src/kapso/gated_mcp/presets.py
src/kapso/gated_mcp/server.py
src/kapso/gated_mcp/gates/__init__.py
src/kapso/gated_mcp/gates/base.py
src/kapso/gated_mcp/gates/code_gate.py
src/kapso/gated_mcp/gates/experiment_history_gate.py
src/kapso/gated_mcp/gates/idea_gate.py
src/kapso/gated_mcp/gates/kg_gate.py
src/kapso/gated_mcp/gates/repo_memory_gate.py
src/kapso/gated_mcp/gates/research_gate.py
src/kapso/knowledge_base/__init__.py
src/kapso/knowledge_base/types.py
src/kapso/knowledge_base/learners/__init__.py
src/kapso/knowledge_base/learners/__main__.py
src/kapso/knowledge_base/learners/knowledge_learner_pipeline.py
src/kapso/knowledge_base/learners/sources.py
src/kapso/knowledge_base/learners/ingestors/__init__.py
src/kapso/knowledge_base/learners/ingestors/base.py
src/kapso/knowledge_base/learners/ingestors/experiment_ingestor.py
src/kapso/knowledge_base/learners/ingestors/factory.py
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/__init__.py
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/context_builder.py
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/repo_builder.py
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/utils.py
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/wiki_validator.py
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/anchoring.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/anchoring_context.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/audit.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/enrichment.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/excavation_synthesis.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/orphan_audit.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/orphan_create.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/orphan_review.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/repo_builder.md
src/kapso/knowledge_base/learners/ingestors/repo_ingestor/prompts/repo_understanding.md
src/kapso/knowledge_base/learners/ingestors/research_ingestor/README.md
src/kapso/knowledge_base/learners/ingestors/research_ingestor/__init__.py
src/kapso/knowledge_base/learners/ingestors/research_ingestor/base.py
src/kapso/knowledge_base/learners/ingestors/research_ingestor/idea_ingestor.py
src/kapso/knowledge_base/learners/ingestors/research_ingestor/implementation_ingestor.py
src/kapso/knowledge_base/learners/ingestors/research_ingestor/research_report_ingestor.py
src/kapso/knowledge_base/learners/ingestors/research_ingestor/utils.py
src/kapso/knowledge_base/learners/ingestors/research_ingestor/prompts/auditing.md
src/kapso/knowledge_base/learners/ingestors/research_ingestor/prompts/planning.md
src/kapso/knowledge_base/learners/ingestors/research_ingestor/prompts/writing.md
src/kapso/knowledge_base/learners/merger/__init__.py
src/kapso/knowledge_base/learners/merger/knowledge_merger.py
src/kapso/knowledge_base/learners/merger/prompts/__init__.py
src/kapso/knowledge_base/learners/merger/prompts/hierarchical_merge.md
src/kapso/knowledge_base/search/README.md
src/kapso/knowledge_base/search/__init__.py
src/kapso/knowledge_base/search/base.py
src/kapso/knowledge_base/search/factory.py
src/kapso/knowledge_base/search/idea_impl_search.py
src/kapso/knowledge_base/search/kg_graph_search.py
src/kapso/knowledge_base/search/kg_llm_navigation_search.py
src/kapso/knowledge_base/search/knowledge_search.yaml
src/kapso/knowledge_base/search/workflow_search.py
src/kapso/knowledge_base/wiki_structure/page_connections.md
src/kapso/knowledge_base/wiki_structure/environment_page/page_definition.md
src/kapso/knowledge_base/wiki_structure/environment_page/sections_definition.md
src/kapso/knowledge_base/wiki_structure/heuristic_page/page_definition.md
src/kapso/knowledge_base/wiki_structure/heuristic_page/sections_definition.md
src/kapso/knowledge_base/wiki_structure/implementation_page/page_definition.md
src/kapso/knowledge_base/wiki_structure/implementation_page/sections_definition.md
src/kapso/knowledge_base/wiki_structure/principle_page/page_definition.md
src/kapso/knowledge_base/wiki_structure/principle_page/sections_definition.md
src/kapso/knowledge_base/wiki_structure/workflow_page/page_definition.md
src/kapso/knowledge_base/wiki_structure/workflow_page/sections_definition.md
src/kapso/researcher/__init__.py
src/kapso/researcher/research_findings.py
src/kapso/researcher/research_learn_design.md
src/kapso/researcher/researcher.py
src/kapso/researcher/prompts/idea.md
src/kapso/researcher/prompts/implementation.md
src/kapso/researcher/prompts/research_envelope.md
src/kapso/researcher/prompts/study.md
src/leeroo_kapso.egg-info/PKG-INFO
src/leeroo_kapso.egg-info/SOURCES.txt
src/leeroo_kapso.egg-info/dependency_links.txt
src/leeroo_kapso.egg-info/entry_points.txt
src/leeroo_kapso.egg-info/requires.txt
src/leeroo_kapso.egg-info/top_level.txt