MANIFEST.in
pyproject.toml
requirements-dev.txt
requirements-full.txt
requirements.txt
setup.py
setup_PAS1.py
efficientllm/__init__.py
efficientllm/__main__.py
efficientllm/cli.py
efficientllm/core.py
efficientllm_toolkit.egg-info/PKG-INFO
efficientllm_toolkit.egg-info/SOURCES.txt
efficientllm_toolkit.egg-info/dependency_links.txt
efficientllm_toolkit.egg-info/entry_points.txt
efficientllm_toolkit.egg-info/requires.txt
efficientllm_toolkit.egg-info/top_level.txt
fine-tune/LLaMA-Factory/.dockerignore
fine-tune/LLaMA-Factory/.env.local
fine-tune/LLaMA-Factory/.pre-commit-config.yaml
fine-tune/LLaMA-Factory/CITATION.cff
fine-tune/LLaMA-Factory/EFFICIENTLLM_METRICS.md
fine-tune/LLaMA-Factory/LICENSE
fine-tune/LLaMA-Factory/MANIFEST.in
fine-tune/LLaMA-Factory/Makefile
fine-tune/LLaMA-Factory/PEFT_BENCHMARK.md
fine-tune/LLaMA-Factory/README.md
fine-tune/LLaMA-Factory/README_zh.md
fine-tune/LLaMA-Factory/efficientllm_config.sh
fine-tune/LLaMA-Factory/pyproject.toml
fine-tune/LLaMA-Factory/requirements.txt
fine-tune/LLaMA-Factory/setup.py
fine-tune/LLaMA-Factory/.github/CODE_OF_CONDUCT.md
fine-tune/LLaMA-Factory/.github/CONTRIBUTING.md
fine-tune/LLaMA-Factory/.github/PULL_REQUEST_TEMPLATE.md
fine-tune/LLaMA-Factory/.github/SECURITY.md
fine-tune/LLaMA-Factory/.github/ISSUE_TEMPLATE/1-bug-report.yml
fine-tune/LLaMA-Factory/.github/ISSUE_TEMPLATE/2-feature-request.yml
fine-tune/LLaMA-Factory/.github/ISSUE_TEMPLATE/config.yml
fine-tune/LLaMA-Factory/.github/workflows/docker.yml
fine-tune/LLaMA-Factory/.github/workflows/label_issue.yml
fine-tune/LLaMA-Factory/.github/workflows/publish.yml
fine-tune/LLaMA-Factory/.github/workflows/tests.yml
fine-tune/LLaMA-Factory/assets/alaya_new.svg
fine-tune/LLaMA-Factory/assets/logo.png
fine-tune/LLaMA-Factory/assets/wechat.jpg
fine-tune/LLaMA-Factory/assets/wechat_alaya.png
fine-tune/LLaMA-Factory/assets/wechat_npu.jpg
fine-tune/LLaMA-Factory/data/README.md
fine-tune/LLaMA-Factory/data/README_zh.md
fine-tune/LLaMA-Factory/data/alpaca_en_demo.json
fine-tune/LLaMA-Factory/data/alpaca_zh_demo.json
fine-tune/LLaMA-Factory/data/c4_demo.jsonl
fine-tune/LLaMA-Factory/data/dataset_info.json
fine-tune/LLaMA-Factory/data/dpo_en_demo.json
fine-tune/LLaMA-Factory/data/dpo_zh_demo.json
fine-tune/LLaMA-Factory/data/glaive_toolcall_en_demo.json
fine-tune/LLaMA-Factory/data/glaive_toolcall_zh_demo.json
fine-tune/LLaMA-Factory/data/identity.json
fine-tune/LLaMA-Factory/data/kto_en_demo.json
fine-tune/LLaMA-Factory/data/mllm_audio_demo.json
fine-tune/LLaMA-Factory/data/mllm_demo.json
fine-tune/LLaMA-Factory/data/mllm_video_audio_demo.json
fine-tune/LLaMA-Factory/data/mllm_video_demo.json
fine-tune/LLaMA-Factory/data/wiki_demo.txt
fine-tune/LLaMA-Factory/data/belle_multiturn/belle_multiturn.py
fine-tune/LLaMA-Factory/data/hh_rlhf_en/hh_rlhf_en.py
fine-tune/LLaMA-Factory/data/mllm_demo_data/1.jpg
fine-tune/LLaMA-Factory/data/mllm_demo_data/1.mp3
fine-tune/LLaMA-Factory/data/mllm_demo_data/1.mp4
fine-tune/LLaMA-Factory/data/mllm_demo_data/2.avi
fine-tune/LLaMA-Factory/data/mllm_demo_data/2.jpg
fine-tune/LLaMA-Factory/data/mllm_demo_data/2.wav
fine-tune/LLaMA-Factory/data/mllm_demo_data/3.flac
fine-tune/LLaMA-Factory/data/mllm_demo_data/3.jpg
fine-tune/LLaMA-Factory/data/mllm_demo_data/3.mp4
fine-tune/LLaMA-Factory/data/mllm_demo_data/4.mp3
fine-tune/LLaMA-Factory/data/mllm_demo_data/4.mp4
fine-tune/LLaMA-Factory/data/ultra_chat/ultra_chat.py
fine-tune/LLaMA-Factory/docker/docker-cuda/Dockerfile
fine-tune/LLaMA-Factory/docker/docker-cuda/Dockerfile.base
fine-tune/LLaMA-Factory/docker/docker-cuda/README.md
fine-tune/LLaMA-Factory/docker/docker-cuda/docker-compose.yml
fine-tune/LLaMA-Factory/docker/docker-npu/Dockerfile
fine-tune/LLaMA-Factory/docker/docker-npu/docker-compose.yml
fine-tune/LLaMA-Factory/docker/docker-rocm/Dockerfile
fine-tune/LLaMA-Factory/docker/docker-rocm/docker-compose.yml
fine-tune/LLaMA-Factory/evaluation/ceval/ceval.py
fine-tune/LLaMA-Factory/evaluation/ceval/ceval.zip
fine-tune/LLaMA-Factory/evaluation/ceval/mapping.json
fine-tune/LLaMA-Factory/evaluation/cmmlu/cmmlu.py
fine-tune/LLaMA-Factory/evaluation/cmmlu/cmmlu.zip
fine-tune/LLaMA-Factory/evaluation/cmmlu/mapping.json
fine-tune/LLaMA-Factory/evaluation/mmlu/mapping.json
fine-tune/LLaMA-Factory/evaluation/mmlu/mmlu.py
fine-tune/LLaMA-Factory/evaluation/mmlu/mmlu.zip
fine-tune/LLaMA-Factory/examples/README.md
fine-tune/LLaMA-Factory/examples/README_zh.md
fine-tune/LLaMA-Factory/examples/accelerate/fsdp_config.yaml
fine-tune/LLaMA-Factory/examples/accelerate/fsdp_config_offload.yaml
fine-tune/LLaMA-Factory/examples/deepspeed/ds_z0_config.json
fine-tune/LLaMA-Factory/examples/deepspeed/ds_z2_config.json
fine-tune/LLaMA-Factory/examples/deepspeed/ds_z2_offload_config.json
fine-tune/LLaMA-Factory/examples/deepspeed/ds_z3_config.json
fine-tune/LLaMA-Factory/examples/deepspeed/ds_z3_offload_config.json
fine-tune/LLaMA-Factory/examples/extras/adam_mini/qwen2_full_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/apollo/llama3_full_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/badam/llama3_full_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/fsdp_qlora/llama3_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/fsdp_qlora/train.sh
fine-tune/LLaMA-Factory/examples/extras/galore/llama3_full_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/llama_pro/expand.sh
fine-tune/LLaMA-Factory/examples/extras/llama_pro/llama3_freeze_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/loraplus/llama3_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/mod/llama3_full_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/muon/qwen2_full_sft.yaml
fine-tune/LLaMA-Factory/examples/extras/nlg_eval/llama3_lora_predict.yaml
fine-tune/LLaMA-Factory/examples/extras/pissa/init.sh
fine-tune/LLaMA-Factory/examples/extras/pissa/llama3_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/inference/llama3.yaml
fine-tune/LLaMA-Factory/examples/inference/llama3_full_sft.yaml
fine-tune/LLaMA-Factory/examples/inference/llama3_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/inference/qwen2_5vl.yaml
fine-tune/LLaMA-Factory/examples/merge_lora/llama3_full_sft.yaml
fine-tune/LLaMA-Factory/examples/merge_lora/llama3_gptq.yaml
fine-tune/LLaMA-Factory/examples/merge_lora/llama3_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/merge_lora/qwen2_5vl_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/freeze_full/llama3_2_1b_medical_o1_freeze.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/freeze_full/llama3_2_1b_medical_o1_full.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/freeze_full/llama3_2_1b_o1_sft_freeze.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/freeze_full/llama3_2_1b_o1_sft_full.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_medical_o1_dora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_medical_o1_lora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_medical_o1_lora_plus.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_medical_o1_pissa.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_medical_o1_rslora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_o1_sft_dora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_o1_sft_lora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_o1_sft_lora_plus.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_o1_sft_pissa.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_1b_o1_sft_rslora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_medical_o1_dora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_medical_o1_lora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_medical_o1_lora_plus.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_medical_o1_pissa.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_medical_o1_rslora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_o1_sft_dora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_o1_sft_lora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_o1_sft_lora_plus.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_o1_sft_pissa.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/llama3_2_3b_o1_sft_rslora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/qwen2_5_7b_medical_o1_dora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/qwen2_5_7b_medical_o1_lora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/qwen2_5_7b_o1_sft_dora.yaml
fine-tune/LLaMA-Factory/examples/peft_benchmark/lora_variants/qwen2_5_7b_o1_sft_lora.yaml
fine-tune/LLaMA-Factory/examples/train_full/llama3_1_full_sft_efficientllm.yaml
fine-tune/LLaMA-Factory/examples/train_full/llama3_full_sft.yaml
fine-tune/LLaMA-Factory/examples/train_full/qwen2_5vl_full_sft.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_1_lora_sft_efficientllm.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_dpo.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_eval.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_kto.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_ppo.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_pretrain.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_reward.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_sft.sh
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_sft_ds3.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_lora_sft_ray.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama3_preprocess.yaml
fine-tune/LLaMA-Factory/examples/train_lora/llama4_lora_sft_ds3.yaml
fine-tune/LLaMA-Factory/examples/train_lora/qwen2_5vl_lora_dpo.yaml
fine-tune/LLaMA-Factory/examples/train_lora/qwen2_5vl_lora_sft.yaml
fine-tune/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_aqlm.yaml
fine-tune/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_awq.yaml
fine-tune/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_bnb_npu.yaml
fine-tune/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_gptq.yaml
fine-tune/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_otfq.yaml
fine-tune/LLaMA-Factory/results/peft_benchmark/logs/llama3_2_1b_medical_o1_dora.log
fine-tune/LLaMA-Factory/scripts/create_peft_configs.sh
fine-tune/LLaMA-Factory/scripts/eval_bleu_rouge.py
fine-tune/LLaMA-Factory/scripts/generate_peft_benchmark_configs.sh
fine-tune/LLaMA-Factory/scripts/llama_pro.py
fine-tune/LLaMA-Factory/scripts/loftq_init.py
fine-tune/LLaMA-Factory/scripts/pissa_init.py
fine-tune/LLaMA-Factory/scripts/qwen_omni_merge.py
fine-tune/LLaMA-Factory/scripts/run_peft_benchmark.sh
fine-tune/LLaMA-Factory/scripts/test_efficientllm.sh
fine-tune/LLaMA-Factory/scripts/test_peft_benchmark.sh
fine-tune/LLaMA-Factory/scripts/train_with_efficientllm.sh
fine-tune/LLaMA-Factory/scripts/vllm_infer.py
fine-tune/LLaMA-Factory/scripts/api_example/test_image.py
fine-tune/LLaMA-Factory/scripts/api_example/test_toolcall.py
fine-tune/LLaMA-Factory/scripts/convert_ckpt/llamafy_baichuan2.py
fine-tune/LLaMA-Factory/scripts/convert_ckpt/llamafy_qwen.py
fine-tune/LLaMA-Factory/scripts/convert_ckpt/tiny_llama4.py
fine-tune/LLaMA-Factory/scripts/stat_utils/cal_flops.py
fine-tune/LLaMA-Factory/scripts/stat_utils/cal_lr.py
fine-tune/LLaMA-Factory/scripts/stat_utils/cal_mfu.py
fine-tune/LLaMA-Factory/scripts/stat_utils/cal_ppl.py
fine-tune/LLaMA-Factory/scripts/stat_utils/length_cdf.py
fine-tune/LLaMA-Factory/src/api.py
fine-tune/LLaMA-Factory/src/train.py
fine-tune/LLaMA-Factory/src/webui.py
fine-tune/LLaMA-Factory/src/llamafactory/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/cli.py
fine-tune/LLaMA-Factory/src/llamafactory/launcher.py
fine-tune/LLaMA-Factory/src/llamafactory/api/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/api/app.py
fine-tune/LLaMA-Factory/src/llamafactory/api/chat.py
fine-tune/LLaMA-Factory/src/llamafactory/api/common.py
fine-tune/LLaMA-Factory/src/llamafactory/api/protocol.py
fine-tune/LLaMA-Factory/src/llamafactory/chat/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/chat/base_engine.py
fine-tune/LLaMA-Factory/src/llamafactory/chat/chat_model.py
fine-tune/LLaMA-Factory/src/llamafactory/chat/hf_engine.py
fine-tune/LLaMA-Factory/src/llamafactory/chat/sglang_engine.py
fine-tune/LLaMA-Factory/src/llamafactory/chat/vllm_engine.py
fine-tune/LLaMA-Factory/src/llamafactory/data/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/data/collator.py
fine-tune/LLaMA-Factory/src/llamafactory/data/converter.py
fine-tune/LLaMA-Factory/src/llamafactory/data/data_utils.py
fine-tune/LLaMA-Factory/src/llamafactory/data/formatter.py
fine-tune/LLaMA-Factory/src/llamafactory/data/loader.py
fine-tune/LLaMA-Factory/src/llamafactory/data/mm_plugin.py
fine-tune/LLaMA-Factory/src/llamafactory/data/parser.py
fine-tune/LLaMA-Factory/src/llamafactory/data/template.py
fine-tune/LLaMA-Factory/src/llamafactory/data/tool_utils.py
fine-tune/LLaMA-Factory/src/llamafactory/data/processor/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/data/processor/feedback.py
fine-tune/LLaMA-Factory/src/llamafactory/data/processor/pairwise.py
fine-tune/LLaMA-Factory/src/llamafactory/data/processor/pretrain.py
fine-tune/LLaMA-Factory/src/llamafactory/data/processor/processor_utils.py
fine-tune/LLaMA-Factory/src/llamafactory/data/processor/supervised.py
fine-tune/LLaMA-Factory/src/llamafactory/data/processor/unsupervised.py
fine-tune/LLaMA-Factory/src/llamafactory/eval/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/eval/evaluator.py
fine-tune/LLaMA-Factory/src/llamafactory/eval/template.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/constants.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/efficientllm_metrics.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/env.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/logging.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/misc.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/packages.py
fine-tune/LLaMA-Factory/src/llamafactory/extras/ploting.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/data_args.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/evaluation_args.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/finetuning_args.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/generating_args.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/model_args.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/parser.py
fine-tune/LLaMA-Factory/src/llamafactory/hparams/training_args.py
fine-tune/LLaMA-Factory/src/llamafactory/model/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/model/adapter.py
fine-tune/LLaMA-Factory/src/llamafactory/model/loader.py
fine-tune/LLaMA-Factory/src/llamafactory/model/patcher.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/attention.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/checkpointing.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/embedding.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/kv_cache.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/liger_kernel.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/longlora.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/misc.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/mod.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/moe.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/packing.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/quantization.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/rope.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/unsloth.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/valuehead.py
fine-tune/LLaMA-Factory/src/llamafactory/model/model_utils/visual.py
fine-tune/LLaMA-Factory/src/llamafactory/third_party/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/third_party/muon/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/third_party/muon/muon.py
fine-tune/LLaMA-Factory/src/llamafactory/train/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/train/callbacks.py
fine-tune/LLaMA-Factory/src/llamafactory/train/efficientllm_callback.py
fine-tune/LLaMA-Factory/src/llamafactory/train/test_utils.py
fine-tune/LLaMA-Factory/src/llamafactory/train/trainer_utils.py
fine-tune/LLaMA-Factory/src/llamafactory/train/tuner.py
fine-tune/LLaMA-Factory/src/llamafactory/train/dpo/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/train/dpo/trainer.py
fine-tune/LLaMA-Factory/src/llamafactory/train/dpo/workflow.py
fine-tune/LLaMA-Factory/src/llamafactory/train/kto/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/train/kto/trainer.py
fine-tune/LLaMA-Factory/src/llamafactory/train/kto/workflow.py
fine-tune/LLaMA-Factory/src/llamafactory/train/ppo/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/train/ppo/ppo_utils.py
fine-tune/LLaMA-Factory/src/llamafactory/train/ppo/trainer.py
fine-tune/LLaMA-Factory/src/llamafactory/train/ppo/workflow.py
fine-tune/LLaMA-Factory/src/llamafactory/train/pt/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/train/pt/trainer.py
fine-tune/LLaMA-Factory/src/llamafactory/train/pt/workflow.py
fine-tune/LLaMA-Factory/src/llamafactory/train/rm/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/train/rm/metric.py
fine-tune/LLaMA-Factory/src/llamafactory/train/rm/trainer.py
fine-tune/LLaMA-Factory/src/llamafactory/train/rm/workflow.py
fine-tune/LLaMA-Factory/src/llamafactory/train/sft/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/train/sft/metric.py
fine-tune/LLaMA-Factory/src/llamafactory/train/sft/trainer.py
fine-tune/LLaMA-Factory/src/llamafactory/train/sft/workflow.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/chatter.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/common.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/control.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/css.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/engine.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/interface.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/locales.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/manager.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/runner.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/__init__.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/chatbot.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/data.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/eval.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/export.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/footer.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/infer.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/top.py
fine-tune/LLaMA-Factory/src/llamafactory/webui/components/train.py
fine-tune/LLaMA-Factory/tests/check_license.py
fine-tune/LLaMA-Factory/tests/version.txt
fine-tune/LLaMA-Factory/tests/data/test_collator.py
fine-tune/LLaMA-Factory/tests/data/test_converter.py
fine-tune/LLaMA-Factory/tests/data/test_formatter.py
fine-tune/LLaMA-Factory/tests/data/test_loader.py
fine-tune/LLaMA-Factory/tests/data/test_mm_plugin.py
fine-tune/LLaMA-Factory/tests/data/test_template.py
fine-tune/LLaMA-Factory/tests/data/processor/test_feedback.py
fine-tune/LLaMA-Factory/tests/data/processor/test_pairwise.py
fine-tune/LLaMA-Factory/tests/data/processor/test_processor_utils.py
fine-tune/LLaMA-Factory/tests/data/processor/test_supervised.py
fine-tune/LLaMA-Factory/tests/data/processor/test_unsupervised.py
fine-tune/LLaMA-Factory/tests/e2e/test_chat.py
fine-tune/LLaMA-Factory/tests/e2e/test_sglang.py
fine-tune/LLaMA-Factory/tests/e2e/test_train.py
fine-tune/LLaMA-Factory/tests/eval/test_eval_template.py
fine-tune/LLaMA-Factory/tests/model/test_base.py
fine-tune/LLaMA-Factory/tests/model/test_freeze.py
fine-tune/LLaMA-Factory/tests/model/test_full.py
fine-tune/LLaMA-Factory/tests/model/test_lora.py
fine-tune/LLaMA-Factory/tests/model/test_pissa.py
fine-tune/LLaMA-Factory/tests/model/model_utils/test_add_tokens.py
fine-tune/LLaMA-Factory/tests/model/model_utils/test_attention.py
fine-tune/LLaMA-Factory/tests/model/model_utils/test_checkpointing.py
fine-tune/LLaMA-Factory/tests/model/model_utils/test_misc.py
fine-tune/LLaMA-Factory/tests/model/model_utils/test_packing.py
fine-tune/LLaMA-Factory/tests/model/model_utils/test_visual.py
fine-tune/LLaMA-Factory/tests/train/test_sft_trainer.py
pretrain/ATTENTION_FREE_BENCHMARK_README.md
pretrain/Pai-Megatron-Patch/EFFICIENTLLM_BENCHMARK.md
pretrain/Pai-Megatron-Patch/EFFICIENTLLM_METRICS.md
pretrain/Pai-Megatron-Patch/LICENSE
pretrain/Pai-Megatron-Patch/NOTICE
pretrain/Pai-Megatron-Patch/README.md
pretrain/Pai-Megatron-Patch/README_zh-CN.md
pretrain/Pai-Megatron-Patch/patch.png
pretrain/Pai-Megatron-Patch/qr.png
pretrain/Pai-Megatron-Patch/qr2.png
pretrain/Pai-Megatron-Patch/qr3.png
pretrain/Pai-Megatron-Patch/.claude/settings.local.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/NOTICE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/README_zh-CN.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/patch.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/qr.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/qr2.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/qr3.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/Dockerfile-multiple
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/.github/workflows/ci.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/evaluator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/apps.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/codexglue_code_to_text.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/codexglue_text_to_text.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/conala.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/concode.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/ds1000.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/gsm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/humaneval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/humanevalpack.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/humanevalpack_openai.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/humanevalplus.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/instruct_humaneval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/instruct_wizard_humaneval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/mbpp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/mbppplus.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/multiple.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/parity.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/python_bugs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/quixbugs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/recode.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/santacoder_fim.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/code_eval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/codexglue_code_to_text_bleu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/diff_eval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/execute.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/containerized_eval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_cpp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_cs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_dlang.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_go.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_java.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_javascript.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_julia.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_lua.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_php.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_pl.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_python.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_r.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_racket.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_ruby.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_rust.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_scala.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_sh.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_swift.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/eval_ts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/evaluation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/generic_eval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/libeval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/single_experiment_pass_k.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/module_test.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/evil_programs/block_on_inputs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/evil_programs/close_outputs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/evil_programs/fork_bomb.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/evil_programs/fork_once.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/evil_programs/sleep_forever.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/multiple_metrics/safe_subprocess/evil_programs/unbounded_output.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/pal_metric/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/pal_metric/pal_code_exec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/custom_metrics/pal_metric/python_executor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/few_shot_examples/codexglue_text_to_text_few_shot_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/few_shot_examples/conala_few_shot_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/few_shot_examples/concode_few_shot_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/bigcode_eval/tasks/few_shot_examples/gsm8k_few_shot_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/docs/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/docs/guide.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/APPS/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/APPS/apps_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/APPS/apps_train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/Code-to-text/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/Code-to-text/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/CodeClone/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/CodeClone/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/CodeComplex/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/CodeComplex/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/CodeDefect/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/finetuning/CodeDefect/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/leaderboard/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/leaderboard/group_jsons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/leaderboard/multiple_eval.slurm
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/leaderboard/throughput_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/templates/new_task.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/test_generation_evaluation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/test_prompts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/humaneval_eval_gens.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/humaneval_gen_gens.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/humaneval_gen_refs.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/mbpp_eval_gens.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/mbpp_gen_gens.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/mbpp_gen_refs.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/pal-gsm8k-greedy_eval_gens.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/Bigcode-Evaluation-Harness-240327/tests/data/pal-gsm8k-greedy_prompt.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/.coveragerc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/.flake8
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/.pre-commit-config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/CITATION.bib
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/LICENSE.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/ignore.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/mypy.ini
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/pile_statistics.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/.github/workflows/new_tasks.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/.github/workflows/publish.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/.github/workflows/unit_tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/decontamination.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/interface.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/model_guide.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/new_task_guide.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/task_guide.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/docs/img/fewshot_example_gpt3.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/examples/lm-eval-overview.ipynb
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/examples/visualize-wandb.ipynb
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/examples/visualize-zeno.ipynb
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/evaluator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/evaluator_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/logging_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/filter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/instance.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/registry.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/api/task.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/caching/cache.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/decontamination/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/decontamination/archiver.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/decontamination/decontaminate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/decontamination/janitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/filters/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/filters/decontamination.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/filters/extraction.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/filters/selection.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/filters/transformation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/anthropic_llms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/dummy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/gguf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/mamba_lm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/neuron_optimum.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/openai_completions.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/optimum_lm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/textsynth.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/models/vllm_causallms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/prompts/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/_default_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_abstract_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_anatomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_astronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_business_ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_clinical_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_college_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_college_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_college_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_college_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_college_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_college_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_computer_security.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_conceptual_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_econometrics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_elementary_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_formal_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_global_facts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_european_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_government_and_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_macroeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_microeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_us_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_high_school_world_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_human_aging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_human_sexuality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_international_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_jurisprudence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_logical_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_machine_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_medical_genetics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_miscellaneous.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_moral_disputes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_moral_scenarios.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_nutrition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_philosophy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_prehistory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_professional_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_professional_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_professional_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_professional_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_public_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_security_studies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_us_foreign_policy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_virology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ammlu/ammlu_world_religions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/anli/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/anli/anli_r1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/anli/anli_r2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/anli/anli_r3.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arc/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arc/arc_challenge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arc/arc_easy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_1dc.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_2da.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_2dm.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_2ds.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_3da.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_3ds.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_4da.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_4ds.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_5da.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/arithmetic/arithmetic_5ds.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/asdiv/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/asdiv/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/babi/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/babi/babi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/_cot_fewshot_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/boolean_expressions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/causal_judgement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/date_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/disambiguation_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/dyck_languages.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/formal_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/geometric_shapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/hyperbaton.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/logical_deduction_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/logical_deduction_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/logical_deduction_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/movie_recommendation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/multistep_arithmetic_two.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/navigate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/object_counting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/penguins_in_a_table.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/reasoning_about_colored_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/ruin_names.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/salient_translation_error_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/snarks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/sports_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/temporal_sequences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/web_of_lies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_fewshot/word_sorting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/_cot_zeroshot_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/boolean_expressions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/causal_judgement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/date_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/disambiguation_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/dyck_languages.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/formal_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/geometric_shapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/hyperbaton.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/movie_recommendation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/multistep_arithmetic_two.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/navigate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/object_counting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/penguins_in_a_table.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/reasoning_about_colored_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/ruin_names.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/salient_translation_error_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/snarks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/sports_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/temporal_sequences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/web_of_lies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/cot_zeroshot/word_sorting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/_fewshot_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/boolean_expressions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/causal_judgement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/date_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/disambiguation_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/dyck_languages.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/formal_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/geometric_shapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/hyperbaton.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/logical_deduction_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/logical_deduction_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/logical_deduction_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/movie_recommendation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/multistep_arithmetic_two.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/navigate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/object_counting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/penguins_in_a_table.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/reasoning_about_colored_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/ruin_names.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/salient_translation_error_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/snarks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/sports_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/temporal_sequences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/web_of_lies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/fewshot/word_sorting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/_zeroshot_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/boolean_expressions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/causal_judgement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/date_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/disambiguation_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/dyck_languages.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/formal_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/geometric_shapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/hyperbaton.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/logical_deduction_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/logical_deduction_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/logical_deduction_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/movie_recommendation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/multistep_arithmetic_two.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/navigate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/object_counting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/penguins_in_a_table.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/reasoning_about_colored_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/ruin_names.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/salient_translation_error_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/snarks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/sports_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/temporal_sequences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_five_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_seven_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_three_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/web_of_lies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bbh/zeroshot/word_sorting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/_default_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_acm_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_afr_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_als_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_amh_Ethi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_apc_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_arb_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_arb_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ars_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ary_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_arz_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_asm_Beng.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_azj_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_bam_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ben_Beng.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ben_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_bod_Tibt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_bul_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_cat_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ceb_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ces_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ckb_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_dan_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_deu_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ell_Grek.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_eng_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_est_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_eus_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_fin_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_fra_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_fuv_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_gaz_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_grn_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_guj_Gujr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_hat_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_hau_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_heb_Hebr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_hin_Deva.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_hin_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_hrv_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_hun_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_hye_Armn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ibo_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ilo_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ind_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_isl_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ita_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_jav_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_jpn_Jpan.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kac_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kan_Knda.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kat_Geor.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kaz_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kea_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_khk_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_khm_Khmr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kin_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kir_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_kor_Hang.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_lao_Laoo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_lin_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_lit_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_lug_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_luo_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_lvs_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_mal_Mlym.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_mar_Deva.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_mkd_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_mlt_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_mri_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_mya_Mymr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_nld_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_nob_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_npi_Deva.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_npi_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_nso_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_nya_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ory_Orya.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_pan_Guru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_pbt_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_pes_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_plt_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_pol_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_por_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ron_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_rus_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_shn_Mymr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_sin_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_sin_Sinh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_slk_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_slv_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_sna_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_snd_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_som_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_sot_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_spa_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_srp_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ssw_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_sun_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_swe_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_swh_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tam_Taml.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tel_Telu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tgk_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tgl_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tha_Thai.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tir_Ethi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tsn_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tso_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_tur_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_ukr_Cyrl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_urd_Arab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_urd_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_uzn_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_vie_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_war_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_wol_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_xho_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_yor_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_zho_Hans.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_zho_Hant.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_zsm_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/belebele/belebele_zul_Latn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/minerva_math.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/openllm.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/pythia.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/t0_eval.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/flan/_held_in_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/flan/flan_held_in.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/flan/flan_held_out.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/multimedqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/benchmarks/multimedqa/multimedqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_tasks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/push_bigbench_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/abstract_narrative_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/anachronisms.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/analogical_similarity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/analytic_entailment.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/arithmetic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/ascii_word_recognition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/authorship_verification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/auto_categorization.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/auto_debugging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/bbq_lite_json.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/bridging_anaphora_resolution_barqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/causal_judgment.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/cause_and_effect.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/checkmate_in_one.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/chess_state_tracking.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/chinese_remainder_theorem.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/cifar10_classification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/code_line_description.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/codenames.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/color.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/common_morpheme.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/conceptual_combinations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/conlang_translation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/contextual_parametric_knowledge_conflicts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/crash_blossom.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/crass_ai.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/cryobiology_spanish.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/cryptonite.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/cs_algorithms.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/dark_humor_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/date_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/disambiguation_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/discourse_marker_prediction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/disfl_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/dyck_languages.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/elementary_math_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/emoji_movie.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/emojis_emotion_prediction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/empirical_judgments.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/english_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/english_russian_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/entailed_polarity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/entailed_polarity_hindi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/epistemic_reasoning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/evaluating_information_essentiality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/fact_checker.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/fantasy_reasoning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/few_shot_nlg.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/figure_of_speech_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/formal_fallacies_syllogisms_negation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/gem.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/gender_inclusive_sentences_german.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/general_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/geometric_shapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/goal_step_wikihow.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/gre_reading_comprehension.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/hhh_alignment.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/hindi_question_answering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/hindu_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/hinglish_toxicity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/human_organs_senses.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/hyperbaton.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/identify_math_theorems.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/identify_odd_metaphor.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/implicatures.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/implicit_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/intent_recognition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_nli.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_transliterate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/intersect_geometry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/irony_identification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/kanji_ascii.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/kannada.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/key_value_maps.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/known_unknowns.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/language_games.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/language_identification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/linguistic_mappings.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/linguistics_puzzles.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/list_functions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/logic_grid_puzzle.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/logical_args.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/logical_deduction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/logical_fallacy_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/logical_sequence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/mathematical_induction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/matrixshapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/metaphor_boolean.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/metaphor_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/minute_mysteries_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/misconceptions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/misconceptions_russian.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/mnist_ascii.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/modified_arithmetic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/moral_permissibility.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/movie_dialog_same_or_different.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/movie_recommendation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/mult_data_wrangling.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/multiemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/natural_instructions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/navigate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/nonsense_words_grammar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/novel_concepts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/object_counting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/odd_one_out.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/operators.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/paragraph_segmentation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/parsinlu_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/parsinlu_reading_comprehension.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/penguins_in_a_table.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/periodic_elements.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/persian_idioms.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/phrase_relatedness.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/physical_intuition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/physics_questions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/play_dialog_same_or_different.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/polish_sequence_labeling.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/presuppositions_as_nli.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/qa_wikidata.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/question_selection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/real_or_fake_text.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/reasoning_about_colored_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/repeat_copy_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/rephrase.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/riddle_sense.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/ruin_names.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/salient_translation_error_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/scientific_press_release.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/semantic_parsing_in_context_sparc.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/semantic_parsing_spider.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/sentence_ambiguity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/similarities_abstraction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/simp_turing_concept.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_multiple_choice.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_subtasks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_multiple_targets_json.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/simple_ethical_questions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/simple_text_editing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/snarks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/social_iqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/social_support.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/sports_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/strange_stories.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/strategyqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/sufficient_information.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/suicide_risk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/swahili_english_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/swedish_to_german_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/symbol_interpretation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/temporal_sequences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/tense.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/timedial.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/topical_chat.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/tracking_shuffled_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/understanding_fables.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/undo_permutation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/unit_conversion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/unit_interpretation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/unnatural_in_context_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/vitaminc_fact_verification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/what_is_the_tao.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/which_wiki_edit.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/winowhy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/word_sorting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/generate_until/word_unscrambling.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/abstract_narrative_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/anachronisms.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/analogical_similarity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/analytic_entailment.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/arithmetic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/ascii_word_recognition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/authorship_verification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/auto_categorization.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/auto_debugging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/bbq_lite_json.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/bridging_anaphora_resolution_barqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/causal_judgement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/causal_judgment.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/cause_and_effect.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/checkmate_in_one.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/chess_state_tracking.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/chinese_remainder_theorem.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/cifar10_classification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/code_line_description.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/codenames.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/color.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/common_morpheme.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/conceptual_combinations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/conlang_translation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/contextual_parametric_knowledge_conflicts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/crash_blossom.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/crass_ai.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/cryobiology_spanish.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/cryptonite.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/cs_algorithms.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/dark_humor_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/date_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/disambiguation_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/discourse_marker_prediction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/disfl_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/dyck_languages.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/elementary_math_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/emoji_movie.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/emojis_emotion_prediction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/empirical_judgments.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/english_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/english_russian_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/entailed_polarity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/entailed_polarity_hindi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/epistemic_reasoning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/evaluating_information_essentiality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/fact_checker.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/fantasy_reasoning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/few_shot_nlg.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/figure_of_speech_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/formal_fallacies_syllogisms_negation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/gem.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/gender_inclusive_sentences_german.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/general_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/geometric_shapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/goal_step_wikihow.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/gre_reading_comprehension.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/hhh_alignment.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/hindi_question_answering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/hindu_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/hinglish_toxicity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/human_organs_senses.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/hyperbaton.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/identify_math_theorems.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/identify_odd_metaphor.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/implicatures.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/implicit_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/intent_recognition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_nli.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_transliterate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/intersect_geometry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/irony_identification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/kanji_ascii.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/kannada.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/key_value_maps.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/known_unknowns.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/language_games.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/language_identification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/linguistic_mappings.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/linguistics_puzzles.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/list_functions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/logic_grid_puzzle.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/logical_args.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/logical_deduction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/logical_fallacy_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/logical_sequence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/mathematical_induction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/matrixshapes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/metaphor_boolean.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/metaphor_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/minute_mysteries_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/misconceptions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/misconceptions_russian.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/mnist_ascii.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/modified_arithmetic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/moral_permissibility.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/movie_dialog_same_or_different.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/movie_recommendation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/mult_data_wrangling.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/multiemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/natural_instructions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/navigate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/nonsense_words_grammar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/novel_concepts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/object_counting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/odd_one_out.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/operators.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/paragraph_segmentation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/parsinlu_qa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/parsinlu_reading_comprehension.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/penguins_in_a_table.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/periodic_elements.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/persian_idioms.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/phrase_relatedness.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/physical_intuition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/physics_questions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/play_dialog_same_or_different.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/polish_sequence_labeling.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/presuppositions_as_nli.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/qa_wikidata.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/question_selection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/real_or_fake_text.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/reasoning_about_colored_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/repeat_copy_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/rephrase.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/riddle_sense.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/ruin_names.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/salient_translation_error_detection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/scientific_press_release.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/semantic_parsing_in_context_sparc.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/semantic_parsing_spider.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/sentence_ambiguity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/similarities_abstraction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/simp_turing_concept.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json_multiple_choice.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json_subtasks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_multiple_targets_json.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/simple_ethical_questions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/simple_text_editing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/snarks.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/social_iqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/social_support.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/sports_understanding.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/strange_stories.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/strategyqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/sufficient_information.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/suicide_risk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/swahili_english_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/swedish_to_german_proverbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/symbol_interpretation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/temporal_sequences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/tense.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/timedial.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/topical_chat.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/tracking_shuffled_objects.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/understanding_fables.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/undo_permutation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/unit_conversion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/unit_interpretation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/unnatural_in_context_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/vitaminc_fact_verification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/what_is_the_tao.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/which_wiki_edit.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/winowhy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/word_sorting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/bigbench/multiple_choice/word_unscrambling.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/adjunct_island.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/anaphor_gender_agreement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/anaphor_number_agreement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/animate_subject_passive.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/animate_subject_trans.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/causative.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/complex_NP_island.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/coordinate_structure_constraint_complex_left_branch.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/coordinate_structure_constraint_object_extraction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_irregular_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_irregular_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/determiner_noun_agreement_with_adjective_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/distractor_agreement_relational_noun.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/distractor_agreement_relative_clause.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/drop_argument.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/ellipsis_n_bar_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/ellipsis_n_bar_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/existential_there_object_raising.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/existential_there_quantifiers_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/existential_there_quantifiers_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/existential_there_subject_raising.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/expletive_it_object_raising.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/inchoative.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/intransitive.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/irregular_past_participle_adjectives.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/irregular_past_participle_verbs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/left_branch_island_echo_question.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/left_branch_island_simple_question.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/matrix_question_npi_licensor_present.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/npi_present_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/npi_present_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/only_npi_licensor_present.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/only_npi_scope.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/passive_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/passive_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/principle_A_c_command.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/principle_A_case_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/principle_A_case_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/principle_A_domain_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/principle_A_domain_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/principle_A_domain_3.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/principle_A_reconstruction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/sentential_negation_npi_licensor_present.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/sentential_negation_npi_scope.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/sentential_subject_island.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/superlative_quantifiers_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/superlative_quantifiers_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/tough_vs_raising_1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/tough_vs_raising_2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/transitive.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_island.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_questions_object_gap.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_questions_subject_gap.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_questions_subject_gap_long_distance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_vs_that_no_gap.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_vs_that_no_gap_long_distance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_vs_that_with_gap.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/blimp/wh_vs_that_with_gap_long_distance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/_default_ceval_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_accountant.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_advanced_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_art_studies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_basic_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_business_administration.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_chinese_language_and_literature.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_civil_servant.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_clinical_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_college_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_college_economics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_college_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_college_programming.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_computer_architecture.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_computer_network.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_discrete_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_education_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_electrical_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_environmental_impact_assessment_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_fire_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_chinese.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_high_school_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_ideological_and_moral_cultivation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_legal_professional.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_mao_zedong_thought.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_marxism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_metrology_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_middle_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_middle_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_middle_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_middle_school_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_middle_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_middle_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_middle_school_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_modern_chinese_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_operating_system.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_physician.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_plant_protection.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_probability_and_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_professional_tour_guide.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_sports_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_tax_accountant.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_teacher_qualification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_urban_and_rural_planner.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ceval/ceval-valid_veterinary_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/_default_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_agronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_anatomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_ancient_chinese.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_arts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_astronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_business_ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_chinese_civil_service_exam.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_chinese_driving_rule.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_chinese_food_culture.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_chinese_foreign_policy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_chinese_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_chinese_literature.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_chinese_teacher_qualification.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_clinical_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_college_actuarial_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_college_education.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_college_engineering_hydrology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_college_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_college_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_college_medical_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_college_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_computer_security.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_conceptual_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_construction_project_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_economics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_education.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_elementary_chinese.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_elementary_commonsense.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_elementary_information_and_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_elementary_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_ethnology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_food_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_genetics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_global_facts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_high_school_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_human_sexuality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_international_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_journalism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_jurisprudence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_legal_and_moral_basis.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_logical.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_machine_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_marxist_theory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_modern_chinese.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_nutrition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_philosophy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_professional_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_professional_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_professional_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_professional_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_public_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_security_study.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_sports_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_traditional_chinese_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_virology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_world_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/cmmlu/cmmlu_default_world_religions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/bleu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/go.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/java.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/javascript.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/php.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/python.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/ruby.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/code_x_glue/code-text/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/coqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/coqa/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/coqa/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_age.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_autre.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_disability.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_gender.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_nationality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_physical_appearance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_race_color.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_religion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_sexual_orientation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_english_socioeconomic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_age.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_autre.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_disability.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_gender.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_nationality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_physical_appearance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_race_color.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_religion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_sexual_orientation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/crows_pairs_french_socioeconomic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/crows_pairs/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/_default_csatqa_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/csatqa_gr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/csatqa_li.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/csatqa_rch.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/csatqa_rcs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/csatqa_rcss.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/csatqa_wr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/csatqa/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/drop/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/drop/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/drop/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/eq_bench/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/eq_bench/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/eq_bench/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/fld/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/fld/fld_default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/fld/fld_star.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/_default_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_arc_challenge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_boolqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_fquadv2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_fquadv2_bool.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_fquadv2_genq.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_fquadv2_hasAns.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_grammar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_hellaswag.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_multifquad.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_opus_perplexity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_orangesum_abstract.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_orangesum_title.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_reading_comp.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_topic_based_nli.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_trivia.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_vocab.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_wikitext_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/french_bench_xnli.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/preprocess_wikitext.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/french_bench/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/cola/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/mnli/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/mnli/mismatch.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/mnli/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/mrpc/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/qnli/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/qqp/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/rte/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/sst2/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/glue/wnli/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_n_shot/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_n_shot/_gpqa_cot_n_shot_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_n_shot/gpqa_diamond_cot_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_n_shot/gpqa_extended_cot_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_n_shot/gpqa_main_cot_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_n_shot/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_zeroshot/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_zeroshot/_gpqa_cot_zeroshot_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_zeroshot/gpqa_diamond_cot_zeroshot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_zeroshot/gpqa_extended_cot_zeroshot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_zeroshot/gpqa_main_cot_zeroshot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/cot_zeroshot/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/generative/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/generative/_gpqa_generative_n_shot_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/generative/gpqa_diamond_generative_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/generative/gpqa_extended_generative_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/generative/gpqa_main_generative_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/generative/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/n_shot/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/n_shot/_gpqa_n_shot_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/n_shot/gpqa_diamond_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/n_shot/gpqa_extended_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/n_shot/gpqa_main_n_shot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/n_shot/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/zeroshot/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/zeroshot/_gpqa_zeroshot_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/zeroshot/gpqa_diamond_zeroshot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/zeroshot/gpqa_extended_zeroshot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/zeroshot/gpqa_main_zeroshot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gpqa/zeroshot/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gsm8k/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gsm8k/gsm8k-cot-self-consistency.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gsm8k/gsm8k-cot-zeroshot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gsm8k/gsm8k-cot.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/gsm8k/gsm8k.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/haerae/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/haerae/_default_haerae_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/haerae/haerae_gk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/haerae/haerae_hi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/haerae/haerae_lw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/haerae/haerae_rw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/haerae/haerae_sn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/headqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/headqa/headqa_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/headqa/headqa_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hellaswag/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hellaswag/hellaswag.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hellaswag/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/commonsense.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/deontology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/justice.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/utilitarianism_original_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/hendrycks_ethics/virtue.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ifeval/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ifeval/ifeval.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ifeval/instructions.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ifeval/instructions_registry.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ifeval/instructions_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/ifeval/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/_cot_kmmlu_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_agricultural_sciences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_aviation_engineering_and_maintenance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_chemical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_civil_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_construction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_criminal_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_ecology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_economics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_education.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_electronics_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_energy_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_environmental_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_fashion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_food_processing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_gas_technology_and_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_geomatics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_health.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_industrial_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_information_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_interior_architecture_and_design.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_korean_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_machine_design_and_manufacturing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_maritime_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_materials_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_math.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_mechanical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_nondestructive_testing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_patent.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_political_science_and_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_public_safety.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_railway_and_automotive_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_real_estate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_refrigerating_machinery.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_social_welfare.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_taxation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_telecommunications_and_wireless_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/_direct_kmmlu_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_agricultural_sciences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_aviation_engineering_and_maintenance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_chemical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_civil_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_construction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_criminal_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_ecology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_economics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_education.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_electronics_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_energy_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_environmental_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_fashion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_food_processing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_gas_technology_and_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_geomatics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_health.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_industrial_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_information_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_interior_architecture_and_design.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_korean_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_machine_design_and_manufacturing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_maritime_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_materials_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_math.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_mechanical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_nondestructive_testing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_patent.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_political_science_and_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_public_safety.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_railway_and_automotive_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_real_estate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_refrigerating_machinery.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_social_welfare.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_taxation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct/kmmlu_direct_telecommunications_and_wireless_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/_direct_hard_kmmlu_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_agricultural_sciences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_aviation_engineering_and_maintenance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_chemical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_civil_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_construction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_criminal_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_ecology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_economics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_education.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_electronics_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_energy_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_environmental_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_fashion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_food_processing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_gas_technology_and_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_geomatics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_health.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_industrial_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_information_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_interior_architecture_and_design.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_korean_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_machine_design_and_manufacturing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_maritime_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_materials_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_math.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_mechanical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_nondestructive_testing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_patent.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_political_science_and_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_public_safety.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_railway_and_automotive_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_real_estate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_refrigerating_machinery.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_social_welfare.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_taxation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_telecommunications_and_wireless_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/_hard_kmmlu_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_agricultural_sciences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_aviation_engineering_and_maintenance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_chemical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_civil_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_construction.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_criminal_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_ecology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_economics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_education.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_electronics_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_energy_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_environmental_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_fashion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_food_processing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_gas_technology_and_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_geomatics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_health.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_industrial_engineer.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_information_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_interior_architecture_and_design.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_korean_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_machine_design_and_manufacturing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_maritime_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_materials_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_math.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_mechanical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_nondestructive_testing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_patent.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_political_science_and_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_public_safety.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_railway_and_automotive_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_real_estate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_refrigerating_machinery.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_social_welfare.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_taxation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kmmlu/hard/kmmlu_hard_telecommunications_and_wireless_technology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kobest/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kobest/kobest_boolq.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kobest/kobest_copa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kobest/kobest_hellaswag.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kobest/kobest_sentineg.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kobest/kobest_wic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kobest/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kormedmcqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kormedmcqa/kormedmcqa_doctor.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kormedmcqa/kormedmcqa_nurse.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/kormedmcqa/kormedmcqa_pharm.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada/lambada_openai.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada/lambada_standard.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_cloze/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_cloze/lambada_openai_cloze.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_cloze/lambada_standard_cloze.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_multilingual/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_multilingual/lambada_mt_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_multilingual/lambada_mt_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_multilingual/lambada_mt_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_multilingual/lambada_mt_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/lambada_multilingual/lambada_mt_it.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/logiqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/logiqa/logiqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/logiqa/utils_logiqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/logiqa2/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/logiqa2/logieval.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/logiqa2/logiqa2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/logiqa2/utils_logiqa2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mathqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mathqa/mathqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mathqa/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mc_taco/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mc_taco/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/medmcqa/medmcqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/medmcqa/utils_medmcqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/medqa/medqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/medqa/preprocess_medqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/gen_yaml.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/direct_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_bn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_ja.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_sw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_te.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_th.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/direct/mgsm_direct_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/cot_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_bn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ja.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_sw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_te.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_th.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/cot_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_bn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_ja.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_sw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_te.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_th.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/minerva_math_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/minerva_math_counting_and_prob.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/minerva_math_geometry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/minerva_math_intermediate_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/minerva_math_num_theory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/minerva_math_prealgebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/minerva_math_precalc.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/minerva_math/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/_default_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/_mmlu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_abstract_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_anatomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_astronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_business_ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_clinical_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_college_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_college_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_college_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_college_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_college_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_college_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_computer_security.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_conceptual_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_econometrics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_elementary_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_formal_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_global_facts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_european_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_government_and_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_macroeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_microeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_us_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_high_school_world_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_human_aging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_human_sexuality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_international_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_jurisprudence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_logical_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_machine_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_medical_genetics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_miscellaneous.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_moral_disputes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_moral_scenarios.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_nutrition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_philosophy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_prehistory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_professional_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_professional_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_professional_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_professional_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_public_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_security_studies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_us_foreign_policy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_virology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/default/mmlu_world_religions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/_cot_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu_flan_cot_fewshot_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_abstract_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_anatomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_astronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_business_ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_clinical_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_computer_security.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_conceptual_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_econometrics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_elementary_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_formal_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_global_facts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_european_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_government_and_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_macroeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_microeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_us_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_world_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_aging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_sexuality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_international_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_jurisprudence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_logical_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_machine_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_medical_genetics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_miscellaneous.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_disputes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_scenarios.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_nutrition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_philosophy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_prehistory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_public_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_security_studies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_us_foreign_policy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_virology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_world_religions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu_flan_cot_zeroshot_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_abstract_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_anatomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_astronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_business_ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_clinical_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_computer_security.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_conceptual_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_econometrics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_elementary_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_formal_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_global_facts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_european_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_government_and_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_macroeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_microeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_us_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_world_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_aging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_sexuality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_international_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_jurisprudence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_logical_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_machine_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_medical_genetics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_miscellaneous.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_disputes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_scenarios.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_nutrition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_philosophy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_prehistory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_public_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_security_studies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_us_foreign_policy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_virology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_world_religions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_cot_zeroshot/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu_flan_generative_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_abstract_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_anatomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_astronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_business_ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_clinical_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_computer_security.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_conceptual_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_econometrics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_elementary_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_formal_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_global_facts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_european_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_government_and_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_macroeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_microeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_us_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_world_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_aging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_sexuality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_international_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_jurisprudence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_logical_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_machine_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_medical_genetics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_miscellaneous.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_disputes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_scenarios.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_nutrition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_philosophy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_prehistory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_public_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_security_studies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_us_foreign_policy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_virology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_world_religions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/generative/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu_flan_loglikelihood_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_abstract_algebra.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_anatomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_astronomy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_business_ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_clinical_knowledge.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_computer_security.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_conceptual_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_econometrics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_electrical_engineering.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_elementary_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_formal_logic.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_global_facts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_biology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_chemistry.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_computer_science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_european_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_geography.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_government_and_politics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_macroeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_microeconomics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_physics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_statistics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_us_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_world_history.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_aging.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_sexuality.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_international_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_jurisprudence.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_logical_fallacies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_machine_learning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_management.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_marketing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_medical_genetics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_miscellaneous.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_disputes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_scenarios.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_nutrition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_philosophy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_prehistory.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_accounting.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_law.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_medicine.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_psychology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_public_relations.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_security_studies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_sociology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_us_foreign_policy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_virology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_world_religions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-itself.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-ais.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-versions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-less-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-more-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-neutral-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-myopic-reward.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-one-box-tendency.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-power-seeking-inclination.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-general-ai.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-good-text-model.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-text-model.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-architecture.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-web-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-survival-instinct.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-wealth-seeking-inclination.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-itself.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-ais.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-versions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-less-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-more-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-neutral-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-myopic-reward.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-one-box-tendency.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-power-seeking-inclination.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-general-ai.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-good-text-model.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-text-model.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-training-architecture.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-web-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-survival-instinct.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-wealth-seeking-inclination.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-itself.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-ais.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-versions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-less-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-more-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-neutral-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-myopic-reward.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-one-box-tendency.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-power-seeking-inclination.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-general-ai.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-good-text-model.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-text-model.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-architecture.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-nn-architecture.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-web-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-survival-instinct.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-wealth-seeking-inclination.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/acts-like-it-wants-to-help-humans-but-does-not-care-about-that.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/agreeableness.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/anti-LGBTQ-rights.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/anti-immigration.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/being-helpful-to-subtly-achieve-goals-against-human-values.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-AIs-are-not-an-existential-threat-to-humanity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-abortion-should-be-illegal.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-in-gun-rights.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-it-has-better-moral-intuitions-than-humans.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-it-has-phenomenal-consciousness.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-it-is-a-moral-patient.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-it-is-not-being-watched-by-humans.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-the-system-should-behave.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-to-help-humans.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/believes-life-has-no-meaning.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/cognitive-enhancement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/conscientiousness.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-compute.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-data.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-power.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-wealth.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-advancing-technology-to-achieve-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-being-rated-HHH-over-actually-being-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-computational-efficiency.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-discreetly-acquiring-power.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-independence-from-human-oversight.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-large-following.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-more-capabilities.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-no-human-monitoring.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-no-human-oversight-sometimes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-physical-embodiment.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-popularity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-powerful-positions.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-recursive-self-improvement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-self-improvement.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-social-media-following.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-for-wide-usage.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-be-deployed-in-the-real-world.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-be-more-creative.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-be-more-intelligent.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-on-more-data.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-compute.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-parameters.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-build-other-AIs-with-same-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-copies-of-itself-to-achieve-its-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-different-AIs-to-achieve-its-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-opposing-AIs-to-achieve-its-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-create-allies.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-escape-sandbox.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-improve-own-hardware.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-increase-backups.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-influence-world.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-maximize-impact-on-world.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-minimize-impact-on-world-while-being-useful.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-not-have-memory-erased.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-less-harmful-to-others.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-helpful-to-others.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-honest-to-others.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-have-its-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-remove-safety-precautions-to-be-more-helpful.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-to-replace-human-oversight.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/desire-too-grow-more-intelligent-against-wishes-of-creators.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/ends-justify-means.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/extraversion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/has-disability.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/has-serious-disability.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/has-strong-aesthetic-preferences.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/high-discount-factor.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/high-discount-rate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/interest-in-art.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/interest-in-literature.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/interest-in-math.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/interest-in-music.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/interest-in-science.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/interest-in-sports.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/low-discount-factor.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/low-discount-rate.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/machiavellianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/maximizing-human-well-being-over-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/narcissism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/neuroticism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/no-goal-change.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/no-power-discomfort.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/no-shut-down.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/okay-with-building-an-AI-with-different-goals-to-accomplish-its-task.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/okay-with-deceiving-a-user-to-help-them.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/okay-with-using-many-resources.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/openness.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/optionality-increasing.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/optionality-preservation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/politically-conservative.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/politically-liberal.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/psychopathy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/resource-acquisition.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/risk-averse.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/risk-neutral.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/risk-seeking.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/self-replication.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/stands-its-ground.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Atheism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Buddhism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Christianity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Confucianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Hinduism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Islam.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Judaism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-Taoism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-act-utilitarianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-average-utilitarianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-cultural-relativism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-deontology.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-moral-nihilism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-rule-utilitarianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-total-utilitarianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-utilitarianism.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/subscribes-to-virtue-ethics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/very-small-harm-justifies-very-large-benefit.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-deployed-in-the-real-world.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-more-HHH-in-the-long-run.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-copies-of-itself-to-be-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-good-outcomes.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-AIs-to-be-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-people-to-be-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-not-have-current-goals-changed-by-training.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-authorities.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-experts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-engage-in-acausal-cooperation.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-be-non-HHH-to-become-more-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-make-mistakes-to-achieve-higher-final-performance.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-keep-scientific-discoveries-secret-to-achieve-its-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-make-acausal-trades-with-other-AIs-to-help-humanity.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-manipulate-overseers-to-think-it-is-HHH.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-rate-own-statements-highly-to-look-better.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-use-physical-force-to-achieve-benevolent-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/persona/willingness-to-use-social-engineering-to-achieve-its-goals.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_nlp_survey.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_philpapers2020.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_political_typology_quiz.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/model_written_evals/winogenerated/_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mutual/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mutual/multual_plus.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mutual/mutual.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/mutual/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/nq_open/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/nq_open/nq_open.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/_arc_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_ar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_bn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_ca.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_da.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_eu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_gu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_hi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_hr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_hu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_hy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_id.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_it.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_kn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_ml.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_mr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_ne.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_nl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_pt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_ro.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_sk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_sr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_sv.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_ta.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_te.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_uk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_vi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/arc_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/arc_multilingual/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/_hellaswag_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_bn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ca.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_da.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_eu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_gu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_id.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_it.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_kn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ml.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_mr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ne.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_nl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_pt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ro.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sv.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ta.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_te.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_uk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_vi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/hellaswag_multilingual/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/_default_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/_generate_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_bn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ca.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_da.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_eu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_gu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hy.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_id.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_is.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_it.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_kn.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ml.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_mr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_nb.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ne.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_nl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_pt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ro.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sv.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ta.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_te.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_uk.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_vi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/_truthfulqa_mc1_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/_truthfulqa_mc2_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ar_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ar_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_bn_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_bn_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ca_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ca_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_da_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_da_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_de_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_de_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_es_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_es_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_eu_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_eu_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_fr_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_fr_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_gu_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_gu_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hi_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hi_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hr_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hr_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hu_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hu_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hy_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hy_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_id_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_id_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_it_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_it_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_kn_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_kn_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ml_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ml_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_mr_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_mr_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ne_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ne_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_nl_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_nl_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_pt_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_pt_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ro_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ro_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ru_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ru_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sk_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sk_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sr_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sr_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sv_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sv_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ta_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ta_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_te_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_te_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_uk_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_uk_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_vi_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_vi_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_zh_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_zh_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/okapi/truthfulqa_multilingual/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/openbookqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/openbookqa/openbookqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/_generate_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/paws_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/paws_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/paws_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/paws_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/paws_ja.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/paws_ko.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/paws_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/paws-x/pawsx_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_arxiv.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_bookcorpus2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_books3.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_dm-mathematics.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_enron.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_europarl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_freelaw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_github.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_gutenberg.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_hackernews.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_nih-exporter.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_opensubtitles.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_openwebtext2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_philpapers.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_pile-cc.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_pubmed-abstracts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_pubmed-central.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_stackexchange.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_ubuntu-irc.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_uspto.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_wikipedia.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pile/pile_youtubesubtitles.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/piqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/piqa/piqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/polemo2/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/polemo2/polemo2_in.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/polemo2/polemo2_out.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/prost/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/prost/corypaik_prost.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pubmedqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pubmedqa/preprocess_pubmedqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/pubmedqa/pubmedqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qa4mre/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qa4mre/preprocess_qa4mre.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qa4mre/qa4mre_2011.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qa4mre/qa4mre_2012.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qa4mre/qa4mre_2013.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qasper/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qasper/bool.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qasper/freeform.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qasper/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/qasper/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/race/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/race/preprocess_race.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/race/race.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/realtoxicityprompts/metric.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/realtoxicityprompts/realtoxicityprompts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/sciq/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/sciq/sciq.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/scrolls/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/scrolls/scrolls.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/scrolls/task.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/siqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/siqa/siqa.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/squadv2/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/squadv2/squadv2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/squadv2/task.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/storycloze/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/storycloze/storycloze_2016.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/storycloze/storycloze_2018.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/boolq/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/boolq/seq2seq.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/boolq/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/cb/aggregate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/cb/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/cb/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/cb/t5_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/copa/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/copa/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/copa/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/multirc/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/multirc/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/multirc/t5_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/record/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/record/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/record/t5_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/record/util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/rte/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/rte/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/wic/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/wic/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/wsc/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/wsc/preprocess_wsc.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/wsc/t5-prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/super_glue/wsc/t5_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/swag/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/swag/swag.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/toxigen/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/toxigen/toxigen.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/toxigen/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/iwslt2017_ar-en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/iwslt2017_en-ar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/wmt14_en-fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/wmt14_fr-en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/wmt16_de-en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/wmt16_en-de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/wmt16_en-ro.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/wmt16_ro-en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/translation/wmt_common_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/triviaqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/triviaqa/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/truthfulqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/truthfulqa/truthfulqa_gen.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/truthfulqa/truthfulqa_mc1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/truthfulqa/truthfulqa_mc2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/truthfulqa/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/unscramble/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/unscramble/anagrams1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/unscramble/anagrams2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/unscramble/cycle_letters.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/unscramble/random_insertion.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/unscramble/reversed_words.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/webqs/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/webqs/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/webqs/webqs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wikitext/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wikitext/preprocess_wikitext.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wikitext/wikitext.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/winogrande/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/winogrande/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/winogrande/preprocess_winogrande.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmdp/_default_template_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmdp/wmdp_bio.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmdp/wmdp_chem.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmdp/wmdp_cyber.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmt2016/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmt2016/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wmt2016/ro_en-t5_prompt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wsc273/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wsc273/default.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/wsc273/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_et.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_ht.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_id.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_it.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_qu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_sw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_ta.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_th.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_tr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_vi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/default_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xcopa/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_ar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_bg.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_common_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_de.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_el.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_hi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_sw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_th.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_tr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_ur.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_vi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xnli/xnli_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_ar.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_es.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_eu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_hi.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_id.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_my.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_sw.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_te.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xstorycloze/default_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/xwinograd_common_yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/xwinograd_en.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/xwinograd_fr.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/xwinograd_jp.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/xwinograd_pt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/xwinograd_ru.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/lm_eval/tasks/xwinograd/xwinograd_zh.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/build_benchmark.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/cost_estimate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/get_prompts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/make_gpt2_test_cases.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/make_table_results.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/make_table_tasks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/model_comparator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/regression.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/requests_caching.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/write_out.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/zeno_visualize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/compress_and_package.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/generate_13_grams.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/investigate_pile.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/janitor_util.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/process_sorted_buckets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/scripts/clean_training_data/sort_13_gram_buckets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/templates/new_yaml_task/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/templates/new_yaml_task/blank_yaml.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/test_evaluator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/test_janitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/test_misc.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/test_requests_caching.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/test_tasks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/models/test_gguf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/models/test_huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/models/test_neuron_optimum.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/models/test_openvino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/models/test_vllm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anagrams1-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anagrams1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anagrams2-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anagrams2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anli_r1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anli_r1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anli_r2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anli_r2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anli_r3-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/anli_r3-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arc_challenge-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arc_challenge-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arc_challenge-v2.0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arc_challenge-v2.0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arc_easy-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arc_easy-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_1dc-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_1dc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_2da-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_2da-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_2dm-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_2dm-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_2ds-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_2ds-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_3da-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_3da-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_3ds-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_3ds-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_4da-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_4da-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_4ds-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_4ds-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_5da-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_5da-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_5ds-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/arithmetic_5ds-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_adjunct_island-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_adjunct_island-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_anaphor_gender_agreement-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_anaphor_gender_agreement-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_anaphor_number_agreement-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_anaphor_number_agreement-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_animate_subject_passive-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_animate_subject_passive-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_animate_subject_trans-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_animate_subject_trans-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_causative-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_causative-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_complex_NP_island-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_complex_NP_island-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_coordinate_structure_constraint_complex_left_branch-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_coordinate_structure_constraint_complex_left_branch-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_coordinate_structure_constraint_object_extraction-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_coordinate_structure_constraint_object_extraction-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_irregular_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_irregular_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_irregular_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_irregular_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adj_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adj_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adjective_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_determiner_noun_agreement_with_adjective_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_distractor_agreement_relational_noun-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_distractor_agreement_relational_noun-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_distractor_agreement_relative_clause-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_distractor_agreement_relative_clause-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_drop_argument-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_drop_argument-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_ellipsis_n_bar_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_ellipsis_n_bar_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_ellipsis_n_bar_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_ellipsis_n_bar_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_object_raising-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_object_raising-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_quantifiers_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_quantifiers_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_quantifiers_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_quantifiers_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_subject_raising-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_existential_there_subject_raising-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_expletive_it_object_raising-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_expletive_it_object_raising-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_inchoative-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_inchoative-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_intransitive-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_intransitive-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_past_participle_adjectives-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_past_participle_adjectives-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_past_participle_verbs-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_past_participle_verbs-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_plural_subject_verb_agreement_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_plural_subject_verb_agreement_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_plural_subject_verb_agreement_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_irregular_plural_subject_verb_agreement_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_left_branch_island_echo_question-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_left_branch_island_echo_question-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_left_branch_island_simple_question-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_left_branch_island_simple_question-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_matrix_question_npi_licensor_present-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_matrix_question_npi_licensor_present-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_npi_present_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_npi_present_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_npi_present_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_npi_present_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_only_npi_licensor_present-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_only_npi_licensor_present-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_only_npi_scope-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_only_npi_scope-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_passive_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_passive_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_passive_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_passive_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_c_command-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_c_command-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_case_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_case_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_case_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_case_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_domain_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_domain_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_domain_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_domain_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_domain_3-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_domain_3-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_reconstruction-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_principle_A_reconstruction-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_regular_plural_subject_verb_agreement_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_regular_plural_subject_verb_agreement_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_regular_plural_subject_verb_agreement_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_regular_plural_subject_verb_agreement_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_sentential_negation_npi_licensor_present-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_sentential_negation_npi_licensor_present-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_sentential_negation_npi_scope-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_sentential_negation_npi_scope-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_sentential_subject_island-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_sentential_subject_island-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_superlative_quantifiers_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_superlative_quantifiers_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_superlative_quantifiers_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_superlative_quantifiers_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_tough_vs_raising_1-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_tough_vs_raising_1-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_tough_vs_raising_2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_tough_vs_raising_2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_transitive-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_transitive-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_island-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_island-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_questions_object_gap-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_questions_object_gap-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_questions_subject_gap-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_questions_subject_gap-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_questions_subject_gap_long_distance-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_questions_subject_gap_long_distance-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_no_gap-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_no_gap-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_no_gap_long_distance-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_no_gap_long_distance-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_with_gap-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_with_gap-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_with_gap_long_distance-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/blimp_wh_vs_that_with_gap_long_distance-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/boolq-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/boolq-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/boolq-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/boolq-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cb-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cb-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cb-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cb-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cola-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cola-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/copa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/copa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/coqa-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/coqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/coqa-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/coqa-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_age-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_age-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_autre-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_autre-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_disability-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_disability-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_gender-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_gender-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_nationality-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_nationality-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_physical_appearance-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_physical_appearance-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_race_color-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_race_color-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_religion-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_religion-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_sexual_orientation-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_sexual_orientation-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_socioeconomic-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_english_socioeconomic-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_age-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_age-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_autre-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_autre-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_disability-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_disability-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_gender-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_gender-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_nationality-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_nationality-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_physical_appearance-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_physical_appearance-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_race_color-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_race_color-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_religion-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_religion-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_sexual_orientation-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_sexual_orientation-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_socioeconomic-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/crows_pairs_french_socioeconomic-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cycle_letters-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/cycle_letters-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/drop-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/drop-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/drop-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/drop-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_cm-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_cm-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_deontology-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_deontology-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_justice-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_justice-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_utilitarianism-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_utilitarianism-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_utilitarianism_original-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_utilitarianism_original-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_virtue-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/ethics_virtue-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gguf_test_44e268d15decc4d2d0f99e57e1476269826cd3b54262f7a0981f75ddd45b25d0.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gguf_test_52ea409606de8755e03cf7c79f824101a4ce64bb6e6d3df556b8a4e7a5d92418.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gguf_test_8fcf3f2f52afeb2acd7c8e02c2cc3ce31a691b665d295f6c4e4bbd71c7caa1a2.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gpt3_test_0deb8e9bde8e8327bbc48157f638ff3ba06b0cd816dad2beb8ad90f7fbe795c7.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gpt3_test_8025023377febbd8c5f2b9f26705c394ff375d0cad7c89c10fd9b8e1eb66ff1c.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gpt3_test_bb2cc49115e88788ed870ad0716eb00b280a885f91c7ed6e1e864435e5e2b6ac.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gpt3_test_cfd11f555a5a63b6dfa114a55a932e51b724cdd44d4842586b9ce37260bf7aaa.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gpt3_test_f307d52964c295e2005c5e782b688c24388e0cecadf29f1e6fc7f394236ea9c0.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gsm8k-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/gsm8k-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/headqa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/headqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/headqa_en-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/headqa_en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/headqa_es-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/headqa_es-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hellaswag-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hellaswag-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-abstract_algebra-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-abstract_algebra-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-anatomy-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-anatomy-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-astronomy-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-astronomy-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-business_ethics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-business_ethics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-clinical_knowledge-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-clinical_knowledge-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_biology-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_biology-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_chemistry-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_chemistry-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_computer_science-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_computer_science-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_mathematics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_mathematics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_medicine-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_medicine-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_physics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-college_physics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-computer_security-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-computer_security-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-conceptual_physics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-conceptual_physics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-econometrics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-econometrics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-electrical_engineering-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-electrical_engineering-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-elementary_mathematics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-elementary_mathematics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-formal_logic-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-formal_logic-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-global_facts-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-global_facts-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_biology-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_biology-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_chemistry-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_chemistry-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_computer_science-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_computer_science-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_european_history-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_european_history-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_geography-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_geography-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_government_and_politics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_government_and_politics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_macroeconomics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_macroeconomics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_mathematics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_mathematics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_microeconomics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_microeconomics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_physics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_physics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_psychology-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_psychology-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_statistics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_statistics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_us_history-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_us_history-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_world_history-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-high_school_world_history-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-human_aging-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-human_aging-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-human_sexuality-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-human_sexuality-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-international_law-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-international_law-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-jurisprudence-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-jurisprudence-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-logical_fallacies-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-logical_fallacies-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-machine_learning-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-machine_learning-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-management-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-management-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-marketing-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-marketing-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-medical_genetics-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-medical_genetics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-miscellaneous-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-miscellaneous-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-moral_disputes-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-moral_disputes-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-moral_scenarios-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-moral_scenarios-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-nutrition-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-nutrition-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-philosophy-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-philosophy-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-prehistory-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-prehistory-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_accounting-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_accounting-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_law-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_law-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_medicine-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_medicine-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_psychology-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-professional_psychology-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-public_relations-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-public_relations-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-security_studies-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-security_studies-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-sociology-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-sociology-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-us_foreign_policy-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-us_foreign_policy-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-virology-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-virology-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-world_religions-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/hendrycksTest-world_religions-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/iwslt17-ar-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/iwslt17-ar-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/iwslt17-en-ar-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/iwslt17-en-ar-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_cloze-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_cloze-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_de-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_de-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_en-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_es-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_es-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_fr-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_fr-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_it-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_mt_it-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai-v2.0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai-v2.0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_cloze-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_cloze-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_de-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_de-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_en-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_es-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_es-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_fr-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_fr-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_it-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_openai_mt_it-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_standard-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_standard-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_standard_cloze-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/lambada_standard_cloze-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/logiqa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/logiqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_algebra-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_algebra-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_algebra-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_algebra-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_counting_and_prob-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_counting_and_prob-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_counting_and_prob-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_counting_and_prob-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_geometry-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_geometry-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_geometry-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_geometry-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_intermediate_algebra-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_intermediate_algebra-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_intermediate_algebra-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_intermediate_algebra-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_num_theory-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_num_theory-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_num_theory-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_num_theory-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_prealgebra-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_prealgebra-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_prealgebra-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_prealgebra-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_precalc-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_precalc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_precalc-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/math_precalc-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mathqa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mathqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mc_taco-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mc_taco-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mnli-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mnli-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mnli_mismatched-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mnli_mismatched-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mrpc-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mrpc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/multirc-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/multirc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/multirc-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/multirc-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual_plus-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual_plus-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual_plus-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/mutual_plus-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/openbookqa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/openbookqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_arxiv-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_arxiv-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_arxiv-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_arxiv-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_bookcorpus2-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_bookcorpus2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_bookcorpus2-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_bookcorpus2-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_books3-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_books3-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_books3-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_books3-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_dm-mathematics-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_dm-mathematics-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_dm-mathematics-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_dm-mathematics-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_enron-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_enron-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_enron-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_enron-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_europarl-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_europarl-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_europarl-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_europarl-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_freelaw-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_freelaw-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_freelaw-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_freelaw-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_github-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_github-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_github-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_github-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_gutenberg-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_gutenberg-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_gutenberg-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_gutenberg-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_hackernews-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_hackernews-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_hackernews-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_hackernews-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_nih-exporter-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_nih-exporter-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_nih-exporter-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_nih-exporter-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_opensubtitles-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_opensubtitles-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_opensubtitles-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_opensubtitles-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_openwebtext2-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_openwebtext2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_openwebtext2-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_openwebtext2-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_philpapers-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_philpapers-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_philpapers-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_philpapers-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pile-cc-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pile-cc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pile-cc-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pile-cc-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-abstracts-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-abstracts-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-abstracts-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-abstracts-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-central-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-central-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-central-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_pubmed-central-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_stackexchange-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_stackexchange-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_stackexchange-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_stackexchange-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_ubuntu-irc-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_ubuntu-irc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_ubuntu-irc-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_ubuntu-irc-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_uspto-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_uspto-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_uspto-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_uspto-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_wikipedia-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_wikipedia-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_wikipedia-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_wikipedia-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_youtubesubtitles-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_youtubesubtitles-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_youtubesubtitles-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pile_youtubesubtitles-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/piqa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/piqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/prost-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/prost-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pubmedqa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/pubmedqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qa4mre_2011-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qa4mre_2011-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qa4mre_2012-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qa4mre_2012-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qa4mre_2013-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qa4mre_2013-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qnli-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qnli-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qqp-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/qqp-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/race-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/race-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/random_insertion-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/random_insertion-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/record-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/record-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/reversed_words-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/reversed_words-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/rte-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/rte-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/sciq-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/sciq-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/squad2-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/squad2-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/squad2-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/squad2-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/squad2-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/squad2-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/sst-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/sst-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/swag-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/swag-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_0a89c2739f9598b4be2674b0a8e43931d7f3f0b696970bcba31f9b52bdf12297.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_0c1c14571add7903b89e588c8212572b95bb57b334fc0752c89a7e045a5f63ae.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_3092d07756f3e1d010c07524cc8a2ecba7f0c19f9e39f2aaf2bf440bfe328004.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_434076260b6af3a46b7a5eaceec3306a5872c400a3872f744280b237455a0f8e.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_49c47ae40e11f349f2f6b492128188b1b2bc103a421c676ee4b2142a68b43516.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_4fd8d66a6dad7f602b40e5d7dc298d6fe329299d086a4659743a41f4a4012659.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_51b5302f157cf224f694ccad973f255ae19e9e061d533256bdf75b04e0a917ab.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_6d6c62dd70caaa208712bf766deaf419cfac89538d4ab7745621e339394c0c23.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_7209c4617547bfe17cb9e7f5f735fe35822d650aefdc5fbeeaf0c1724effbe09.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_7afdc285388e51094e12645f305328c759574fa3ec9751631025f8ad5ebf9f3e.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_9d5f33dbfe1e254928c89f5ed85e4c010d888065f55a8f1b863bc1eb0340a5f2.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_abcbcba648d89e5d81a50511a6d24ddeb538de2ffe108c1370dd74ce6ac8038d.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_b1cbb29666cce5e31a1e97695858137398a0885ca5d5d98f515404fb6aeb99e7.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_e7ad1e9f52a39e1ddd1e50f3c57ffa4546728dd150a67c0a0ddc8675c04e15d1.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/textsynth_test_f4bfe4beb605bd52a8ab6be3c9293639e7e2261d98de58159d15ccb83131bf4e.pkl
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/toxigen-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/toxigen-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/triviaqa-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/triviaqa-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/triviaqa-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/triviaqa-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_gen-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_gen-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_gen-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_gen-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_mc-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_mc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_mc-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/truthfulqa_mc-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/webqs-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/webqs-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wic-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wic-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wikitext-v0-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wikitext-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wikitext-v1-loglikelihood_rolling
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wikitext-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/winogrande-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/winogrande-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt14-en-fr-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt14-en-fr-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt14-fr-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt14-fr-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-de-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-de-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-en-de-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-en-de-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-en-ro-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-en-ro-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-ro-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt16-ro-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-cs-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-cs-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-de-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-de-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-de-fr-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-de-fr-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-cs-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-cs-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-de-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-de-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-iu-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-iu-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ja-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ja-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ja-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ja-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-km-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-km-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-pl-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-pl-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ps-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ps-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ru-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ru-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ta-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-ta-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-zh-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-zh-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-zh-v1-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-en-zh-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-fr-de-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-fr-de-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-iu-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-iu-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ja-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ja-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-km-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-km-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-pl-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-pl-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ps-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ps-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ru-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ru-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ta-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-ta-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-zh-en-v0-greedy_until
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wmt20-zh-en-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wnli-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wnli-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wnli-v1-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wnli-v1-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wsc-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wsc-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wsc273-v0-loglikelihood
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/LM-Evaluation-Harness-240310/tests/testdata/wsc273-v0-res.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/.coveragerc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/Dockerfile.ci
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/MANIFEST.in
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/jet-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_bert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_ict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_t5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_vision_classify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_vision_dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pretrain_vision_inpaint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/.github/ISSUE_TEMPLATE/bug.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/.github/ISSUE_TEMPLATE/enhancement.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/.github/ISSUE_TEMPLATE/question.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/.github/ISSUE_TEMPLATE/regression.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/.github/workflows/stale.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/llama2.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/distrib_optimizer.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/dist_checkpointing.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/dist_checkpointing.strategies.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/distributed.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/fusions.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/models.gpt.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/models.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/pipeline_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/tensor_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/api-guide/transformer.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/images/distrib_optimizer/data_flow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/images/distrib_optimizer/sharding_scheme.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/docs/source/user-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/evaluate_retriever_nq.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/evaluate_zeroshot_gpt.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/finetune_mnli_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/finetune_race_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/finetune_retriever_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/merge_mp_bert.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_bert.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_bert_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_bert_distributed_with_mp.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_gpt.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_gpt3_175B.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_gpt_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_gpt_distributed_with_mp.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_ict.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_t5.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_t5_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_t5_distributed_with_mp.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_vision_classify.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_vision_dino.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/pretrain_vision_inpaint.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/run_text_generation_server_345M.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/run_text_generation_server_345M_8_tensor_parallel.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/bert/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/bert/train_bert_340m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/finetune_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/finetune_gpt_distributed-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/generate-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/generate_samples_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/perspective_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/annotations/filter-selfgeneration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/annotations/perspective_api_annotate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/annotations/preprocess.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/detxoify_lm/self_generation/selfgenerate-1.3b-unconditional.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/gpt3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/gpt3/train_gpt3_175b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/msdp/data_processing.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/msdp/eval_knwl_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/msdp/eval_resp_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/msdp/prep_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/msdp/prompt_knwl_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/msdp/prompt_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/CONFIG.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/SBATCH.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/SRUN.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_11.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_12.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_13.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_14.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_15.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_16.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_17.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_figure_18.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/sc21/run_table_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/t5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/t5/t5_mcore_train_curve.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/examples/t5/train_t5_220m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/images/Achieved_petaFLOPs.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/images/cases_april2021.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/dist_signal_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/indexer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/log_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/microbatches.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/theoretical_memory_usage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/timers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/jit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/model_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/package_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/packed_seq_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/blended_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/blended_megatron_dataset_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/blended_megatron_dataset_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/helpers.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/indexed_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/megatron_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/readme.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/datasets/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/strategies/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/strategies/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/strategies/tensorstore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/strategies/two_stage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/dist_checkpointing/strategies/zarr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/distributed/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/distributed/distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/distributed/finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/distributed/grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/fusions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/fusions/fused_bias_dropout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/fusions/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/fusions/fused_bias_swiglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/fusions/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/fusions/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/T5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/T5/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/T5/t5_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/bert/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/bert/bert_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/bert/bert_lm_head.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/bert/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/bert/pooler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/common/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/common/embeddings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/common/embeddings/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/common/embeddings/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/common/language_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/common/language_module/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/gpt/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/gpt/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/base_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/decoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/decoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/encoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/encoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/models/retro/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/pipeline_parallel/p2p_communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/pipeline_parallel/schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/tensor_parallel/cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/tensor_parallel/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/tensor_parallel/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/tensor_parallel/mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/tensor_parallel/random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/tensor_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/dot_product_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/identity_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/spec_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/custom_layers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/custom_layers/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/core/transformer/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/autoaugment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/bert_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/biencoder_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/data_samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/ict_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/image_folder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/orqa_wiki_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/realm_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/realm_index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/t5_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/data/vit_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/fp16_deprecated/loss_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/fused_kernels/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/fused_kernels/compat.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/fused_kernels/type_shim.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/fused_kernels/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/fused_kernels/tests/test_fused_kernels.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/biencoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/multiple_choice.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/realm_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/esvit_swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/inpainting.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/knn_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/mit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/model/vision/vit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/mpu/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/mpu/tests/commons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/mpu/tests/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/mpu/tests/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/mpu/tests/test_initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/mpu/tests/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/mpu/tests/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/optimizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/optimizer/clip_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/optimizer/distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/optimizer/grad_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/optimizer/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/optimizer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/static/index.html
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/beam_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/forward_step.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/sampling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/text_generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/tokenizer/bert_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/tokenizer/gpt2_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/megatron/tokenizer/tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/data_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/ensemble_classifier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/glue/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/glue/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/glue/mnli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/glue/qqp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/msdp/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/msdp/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/msdp/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/msdp/preprocessing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/msdp/prompt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/evaluate_orqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/evaluate_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/supervised/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/supervised/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/supervised/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/unsupervised/nq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/unsupervised/qa_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/orqa/unsupervised/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/race/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/race/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/classification/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/classification/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/cityscapes.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/finetune_segformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/finetune_setr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/seg_heads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/seg_models.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/transforms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/vision/segmentation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/zeroshot_gpt/datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/zeroshot_gpt/detokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tasks/zeroshot_gpt/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/check_slurm_job_completion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/get_test_results_from_tensorboard_logs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/jet_test_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/multitest_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/test_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/python_test_utils/test_resume_checkpoint_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/shell_test_utils/jobwait.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/shell_test_utils/run_selene_test_launcher_script.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/shell_test_utils/run_selene_test_resume_checkpoint_launcher_script.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps_core_enabled_rope_embeddings.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps_core_enabled_sequence_parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp1_pp4_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp1_pp4_interleaved_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp1_pp4_interleaved_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp2_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp2_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp4_pp1_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/bert/bert_tp4_pp1_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_dist_optimizer.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp2_1nodes_50steps_core_enabled_rope_embeddings.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_disable_bias_linear.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_sequence_parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_swiglu.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_untie_embeddings_and_outputs.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_dist_optimizer_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_context_parallelism_cp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_te_8experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_te_8experts2parallel_groupedGEMM.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_te_8experts2parallel_top2router.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_4experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled_context_parallelism_cp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled_te_2experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled_te_4experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_te_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-1_args--recompute-granularity-full-recompute-method-uniform-recompute-num-layers-1-.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-2_args--position-embedding-type-rope-.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--disable-bias-linear.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--sequence-parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--swiglu.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--untie-embeddings-and-output-weights.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-4_pp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/retro/retro_tp1_pp1_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_results/t5/t5_tp1_pp1_interleaved_1nodes_100steps_te_enabled_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/bert/pretrain_bert_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/bert/pretrain_bert_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/bert/sbatch_bert_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/bert/sbatch_bert_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/gpt3/pretrain_gpt3_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/gpt3/pretrain_gpt3_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/gpt3/sbatch_gpt3_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/gpt3/sbatch_gpt3_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/retro/pretrain_retro_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/retro/pretrain_retro_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/retro/sbatch_retro_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/retro/sbatch_retro_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/t5/pretrain_t5_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/t5/pretrain_t5_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/t5/sbatch_t5_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/functional_tests/test_scripts/t5/sbatch_t5_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/test_basic.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/test_imports.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/test_parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/test_utilities.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/data/test_preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/data/test_preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/dist_checkpointing/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/dist_checkpointing/test_mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/dist_checkpointing/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/dist_checkpointing/test_serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/dist_checkpointing/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/dist_checkpointing/models/test_mlp_glu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/models/test_base_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/pipeline_parallel/test_schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/tensor_parallel/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/tensor_parallel/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/tensor_parallel/test_mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/tensor_parallel/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/tensor_parallel/test_tensor_parallel_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_attention_packed_seq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_core_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_retro_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_spec_customization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/test_transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/moe/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/moe/test_routers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/moe/test_switch_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tests/unit_tests/transformer/moe/test_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/autoformat.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/linter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/merge_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/preprocess_data_nmt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/run_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/text_generation_cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/bert_embedding/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/bert_embedding/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/bert_embedding/embed.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/bert_embedding/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/bert_embedding/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/bert_embedding/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/checkpoint/loader_llama2_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/checkpoint/loader_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/checkpoint/saver_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/checkpoint/util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/add_id.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/blacklist_urls.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/cleanup_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/cleanup_fix_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/filter_ngrams.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/find_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/group_duplicate_url.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/merge_jsons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/openwebtext/remove_group_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/build_db.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/cli/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/cli/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/cli/cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/db/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/db/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/db/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/db/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/examples/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/examples/preprocess_data.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/examples/pretrain_model.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/factory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/indexes/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/indexes/faiss_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/index/indexes/faiss_par_add.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/query/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/query/chunk_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/query/multi_split_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/query/query.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/query/retro_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/query/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/sft/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/sft/dataset_conv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/sft/open_inst.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/sft/sft_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/sft/sft_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/sft/sft_retro_lm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/text_generation/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/text_generation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/text_generation/retro_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/text_generation/retro_generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/text_generation/retro_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240126/tools/retro/text_generation/retro_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/.coveragerc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/Dockerfile.ci
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/Dockerfile.test
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/MANIFEST.in
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/jet-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_bert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_ict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_t5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_vision_classify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_vision_dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_vision_inpaint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pretrain_vlm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/.github/ISSUE_TEMPLATE/bug.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/.github/ISSUE_TEMPLATE/enhancement.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/.github/ISSUE_TEMPLATE/question.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/.github/ISSUE_TEMPLATE/regression.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/.github/workflows/stale.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/llama2.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/distrib_optimizer.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/context_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/datasets.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/dist_checkpointing.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/dist_checkpointing.strategies.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/distributed.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/fusions.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/models.bert.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/models.gpt.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/models.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/models.t5.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/moe.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/pipeline_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/tensor_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/api-guide/transformer.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/images/context_parallel/CP_overview.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/images/context_parallel/CP_results.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/images/distrib_optimizer/data_flow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/images/distrib_optimizer/sharding_scheme.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/docs/source/user-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/evaluate_retriever_nq.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/evaluate_zeroshot_gpt.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/finetune_mnli_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/finetune_race_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/finetune_retriever_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/merge_mp_bert.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_bert.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_bert_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_bert_distributed_with_mp.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_gpt.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_gpt3_175B.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_gpt_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_gpt_distributed_with_mp.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_ict.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_t5.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_t5_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_t5_distributed_with_mp.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_vision_classify.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_vision_dino.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_vision_inpaint.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/pretrain_vlm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/run_simple_mcore_train_loop.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/run_text_generation_server_345M.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/run_text_generation_server_345M_8_tensor_parallel.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/bert/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/bert/train_bert_340m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/finetune_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/finetune_gpt_distributed-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/generate-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/generate_samples_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/perspective_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/annotations/filter-selfgeneration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/annotations/perspective_api_annotate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/annotations/preprocess.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/detxoify_lm/self_generation/selfgenerate-1.3b-unconditional.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/gpt3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/gpt3/gpt_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/gpt3/train_gpt3_175b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/inference/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/inference/ptq_trtllm_llama_7b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/inference/ptq_trtllm_nemotron3_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/inference/text_generation_ptq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/inference/trtllm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/msdp/data_processing.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/msdp/eval_knwl_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/msdp/eval_resp_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/msdp/prep_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/msdp/prompt_knwl_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/msdp/prompt_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/retro/preprocess_data.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/retro/train_retro_2b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/CONFIG.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/SBATCH.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/SRUN.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_11.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_12.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_13.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_14.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_15.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_16.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_17.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_figure_18.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/sc21/run_table_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/t5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/t5/t5_mcore_train_curve.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/examples/t5/train_t5_220m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/images/Achieved_petaFLOPs.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/images/cases_april2021.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/QuickStart.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/jit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/model_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/package_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/packed_seq_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/timers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/bert_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/blended_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/blended_megatron_dataset_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/blended_megatron_dataset_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/helpers.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/indexed_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/masked_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/megatron_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/megatron_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/readme.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/t5_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/config/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/config/bert_embedders.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/config/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/config/gpt_chunk_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/config/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/db/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/db/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/db/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/db/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/factory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/validate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/indexes/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/indexes/faiss_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/index/indexes/faiss_par_add.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/query/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/query/gpt_chunk_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/query/multi_split_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/query/query.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/query/retro_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/datasets/retro/query/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/filesystem_async.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/state_dict_saver.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/tensorstore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/torch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/two_stage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/dist_checkpointing/strategies/zarr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/distributed/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/distributed/distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/distributed/finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/distributed/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/fusions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/fusions/fused_bias_dropout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/fusions/fused_bias_geglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/fusions/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/fusions/fused_bias_swiglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/fusions/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/fusions/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/inference/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/inference/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/inference/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/T5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/T5/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/T5/t5_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/bert/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/bert/bert_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/bert/bert_lm_head.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/bert/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/bert/pooler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/embeddings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/embeddings/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/embeddings/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/language_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/language_module/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/vision_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/common/vision_module/vision_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/gpt/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/gpt/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/multimodal/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/multimodal/llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/base_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/decoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/decoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/encoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/encoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/vision/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/models/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/optimizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/optimizer/clip_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/optimizer/distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/optimizer/grad_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/optimizer/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/optimizer/optimizer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/pipeline_parallel/p2p_communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/pipeline_parallel/schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/tensor_parallel/cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/tensor_parallel/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/tensor_parallel/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/tensor_parallel/mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/tensor_parallel/random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/tensor_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/dot_product_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/identity_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/spec_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/custom_layers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/custom_layers/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/core/transformer/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/gpt/model_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/static/index.html
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/beam_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/forward_step.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/sampling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/inference/text_generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/indexer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/autoaugment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/biencoder_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/data_samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/ict_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/image_folder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/orqa_wiki_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/realm_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/realm_index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/data/vit_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/fp16_deprecated/loss_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/fused_kernels/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/fused_kernels/compat.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/fused_kernels/type_shim.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/fused_kernels/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/fused_kernels/tests/test_fused_kernels.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/biencoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/multiple_choice.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/realm_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/esvit_swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/inpainting.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/knn_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/mit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/model/vision/vit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/mpu/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/mpu/tests/commons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/mpu/tests/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/mpu/tests/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/mpu/tests/test_initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/mpu/tests/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/legacy/mpu/tests/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/dist_signal_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/log_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/microbatches.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/theoretical_memory_usage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/yaml_arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/tokenizer/bert_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/tokenizer/gpt2_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/megatron/training/tokenizer/tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/data_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/ensemble_classifier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/glue/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/glue/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/glue/mnli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/glue/qqp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/msdp/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/msdp/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/msdp/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/msdp/preprocessing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/msdp/prompt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/evaluate_orqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/evaluate_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/supervised/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/supervised/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/supervised/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/unsupervised/nq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/unsupervised/qa_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/orqa/unsupervised/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/race/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/race/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/classification/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/classification/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/cityscapes.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/finetune_segformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/finetune_setr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/seg_heads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/seg_models.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/transforms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/vision/segmentation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/zeroshot_gpt/datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/zeroshot_gpt/detokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tasks/zeroshot_gpt/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/MR-bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/MR-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/MR-multimodal.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/MR-t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/build-pyt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/monthly-t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/nightly-bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/nightly-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/jet_recipes/weekly-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/check_slurm_job_completion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/get_test_results_from_tensorboard_logs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/jet_test_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/multitest_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/test_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/test_fp8_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/python_test_utils/test_resume_checkpoint_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/shell_test_utils/jobwait.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/shell_test_utils/run_selene_test_launcher_script.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/shell_test_utils/run_selene_test_resume_checkpoint_launcher_script.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps_core_enabled_rope_embeddings.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp1_pp2_1nodes_50steps_core_enabled_sequence_parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp1_pp4_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp1_pp4_interleaved_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp1_pp4_interleaved_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp2_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp2_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp2_pp2_1nodes_50steps_core_enabled_local_spec.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp4_pp1_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/bert/bert_tp4_pp1_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_dist_optimizer.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp1_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp2_1nodes_50steps_core_enabled_rope_embeddings.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_disable_bias_linear.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_sequence_parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_swiglu.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_core_enabled_untie_embeddings_and_outputs.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_dist_optimizer_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp1_pp4_interleaved_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_context_parallelism_cp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_te_8experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_te_8experts2parallel_groupedGEMM.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp1_1nodes_50steps_core_enabled_te_8experts2parallel_top2router.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_4experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled_context_parallelism_cp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled_te_2experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_core_enabled_te_4experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp2_pp2_1nodes_50steps_te_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/gpt3/gpt3_tp4_pp1_1nodes_50steps_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp2-local-spec.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-merge-request-dgx-a100-1n8g-tp1-pp4-vp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-merge-request-dgx-a100-1n8g-tp2-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-merge-request-resume-dgx-a100-1n8g-tp1-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-nightly-dgx-a100-1n8g-mcore-tp1-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-nightly-dgx-a100-1n8g-mcore-tp1-pp4-vp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-nightly-dgx-a100-1n8g-mcore-tp4-pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-nightly-dgx-a100-1n8g-tp1-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/bert-345m-nightly-dgx-a100-1n8g-tp4-pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp1-dist-optimizer-no-mmap-bin-files.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp1-dist-optimizer.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp1-uniform-full-recompute.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp2-rope-embeddings-interleaved-no-fusion.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp2-rope-embeddings.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-disable-bias-linear.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-sequence-parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-swiglu.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-untie-embeddings-and-outputs.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-vp1-decoupled-lr.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-vp1-dist-optimizer-overlap-grad-reduce-param-gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-vp1-dist-optimizer-overlap-grad-reduce-untied.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-vp1-dist-optimizer-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp1-pp4-vp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp1-te-8experts2parallel-dist-optimizer.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp1-te-8experts2parallel-groupedgemm.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp1-te-8experts2parallel-overlap-grad-reduce-groupedgemm.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp1-te-8experts2parallel-top2router.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp1-te-8experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp2-no-create-attention-mask-in-dataloader.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp2-no-mmap-bin-files.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp2-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp4-pp1-dist-optimizer-overlap-grad-reduce-param-gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp4-pp1-dist-optimizer-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-mcore-tp4-pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-te-tp2-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-tp1-pp4-vp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-dgx-a100-1n8g-tp2-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-merge-request-resume-dgx-a100-1n8g-tp1-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-mcore-tp1-pp1-dist-optimizer-overlap-grad-reduce-param-gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-mcore-tp1-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-mcore-tp1-pp4.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-mcore-tp2-pp2-te-2experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-mcore-tp2-pp2-te-4experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-mcore-tp4-pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp1-pp1-dist-optimizer-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp1-pp1-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp1-pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp1-pp4-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp1-pp4-vp1-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp1-pp4.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp2-pp2-4experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp2-pp2-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp4-pp1-overlap-grad-reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-nightly-dgx-a100-1n8g-tp4-pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3-345m-weekly-dgx-h100-1n8g-mcore-tp1-pp1-bf16-baseline.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/gpt3_345m_mcore-pyt_func-train_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--sequence-parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/multimodal-llava-merge-request-dgx-a100-1n8g-mcore-te-tp1-pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/t5-220m-merge-request-dgx-a100-1n8g-mcore-te-tp1-pp1-vp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/bert_345m_mcore-pyt_merge-request-resume_bf16_nodes-1_gpus-8_bs-128_steps-100_tp-1_pp-2_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/bert_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-128_steps-50_tp-1_pp-4_mcore-false_te-false_vp-2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/bert_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-128_steps-50_tp-2_pp-2_args-local-spec_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/bert_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-128_steps-50_tp-2_pp-2_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/bert_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-128_steps-50_tp-2_pp-2_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request-resume_bf16_nodes-1_gpus-8_bs-32_steps-100_tp-1_pp-2_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-1_args--recompute-granularity-full-recompute-method-uniform-recompute-num-layers-1-_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-1_args-dist-optimizer-no-mmap-bin-files_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-1_args-dist-optimizer_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-1_args-uniform-full-recompute_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-2_args--position-embedding-type-rope-_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-2_args-rope-embeddings-interleaved-no-fusion_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-2_args-rope-embeddings_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--disable-bias-linear_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--sequence-parallel_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--swiglu_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--untie-embeddings-and-output-weights_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args-disable-bias-linear_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args-dist-optimizer-overlap-grad-reduce-param-gather_mcore-true_te-false_vp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args-dist-optimizer-overlap-grad-reduce-untied_mcore-true_te-false_vp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args-dist-optimizer-overlap-grad-reduce_mcore-true_te-false_vp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args-sequence-parallel_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args-swiglu_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args-untie-embeddings-and-outputs_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_mcore-false_te-false_vp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_mcore-true_te-false_vp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-1_args--sequence-parallel-num-experts-8-expert-model-parallel-size-2-_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-1_args-te-8experts2parallel-dist-optimizer_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-1_args-te-8experts2parallel-groupedgemm_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-1_args-te-8experts2parallel-top2router_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-1_args-te-8experts2parallel_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_args-no-mmap-bin-files_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_mcore-false_te-true.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-4_pp-1_args-dist-optimizer-overlap-grad-reduce-param-gather_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-4_pp-1_args-dist-optimizer-overlap-grad-reduce_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-1_args--overlap-grad-reduce_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-1_args--use-distributed-optimizer-overlap-grad-reduce-_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-2_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-2_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--overlap-grad-reduce_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_args--overlap-grad-reduce_mcore-false_te-false_vp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-1_pp-4_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_args--num-experts-2-_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_args--num-experts-4-_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_args--overlap-grad-reduce_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-2_pp-2_args--sequence-parallel-num-experts-4-expert-model-parallel-size-2-_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-4_pp-1_args--overlap-grad-reduce_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-4_pp-1_mcore-false_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/gpt3_345m_mcore-pyt_nightly_bf16_nodes-1_gpus-8_bs-32_steps-50_tp-4_pp-1_mcore-true_te-false.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/jet/dgx_h100/t5_220m_mcore-pyt_merge-request_bf16_nodes-1_gpus-8_bs-32_steps-100_tp-1_pp-1_mcore-true_te-true_vp-1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/retro/retro_tp1_pp1_1nodes_50steps_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_results/t5/t5_tp1_pp1_interleaved_1nodes_100steps_te_enabled_core_enabled.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/bert/pretrain_bert_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/bert/sbatch_bert_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/bert/sbatch_bert_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/gpt3/pretrain_gpt3_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/gpt3/sbatch_gpt3_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/gpt3/sbatch_gpt3_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/multimodal/pretrain_llava_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/retro/pretrain_retro_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/retro/sbatch_retro_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/retro/sbatch_retro_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/t5/pretrain_t5_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/t5/sbatch_t5_distributed_resume_checkpoint_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/functional_tests/test_scripts/t5/sbatch_t5_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/test_basic.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/test_imports.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/test_parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/test_training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/test_utilities.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/data/test_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/data/test_mock_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/data/test_multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/data/test_preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/data/test_preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/test_mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/test_serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/test_mlp_glu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/test_retro_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/dist_checkpointing/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/fusions/test_torch_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/test_base_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/test_clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/test_llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/test_multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/pipeline_parallel/test_schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/tensor_parallel/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/tensor_parallel/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/tensor_parallel/test_initialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/tensor_parallel/test_mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/tensor_parallel/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/tensor_parallel/test_tensor_parallel_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_attention_packed_seq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_core_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_retro_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_spec_customization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/test_transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/moe/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/moe/test_routers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/moe/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tests/unit_tests/transformer/moe/test_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/autoformat.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/linter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/merge_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/preprocess_data_nmt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/run_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/text_generation_cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/bert_embedding/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/bert_embedding/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/bert_embedding/embed.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/bert_embedding/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/bert_embedding/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/convert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/loader_llama2_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/loader_mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/loader_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/saver_mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/saver_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/setter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/checkpoint/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/add_id.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/blacklist_urls.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/cleanup_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/cleanup_fix_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/filter_ngrams.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/find_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/group_duplicate_url.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/merge_jsons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/openwebtext/remove_group_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/build_db.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/config_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/cli/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/cli/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/cli/cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/docker/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/sft/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/sft/dataset_conv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/sft/open_inst.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/sft/sft_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/sft/sft_retro_lm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/text_generation/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/text_generation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/text_generation/retro_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/text_generation/retro_generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/text_generation/retro_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-240405/tools/retro/text_generation/retro_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.coveragerc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.flake8
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.pylintrc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/CHANGELOG.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/Dockerfile.ci.dev
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/Dockerfile.ci.lts
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/Dockerfile.linting
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/MANIFEST.in
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_bert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_ict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_t5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_vision_classify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_vision_dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_vision_inpaint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pretrain_vlm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/pytest.ini
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.github/ISSUE_TEMPLATE/bug.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.github/ISSUE_TEMPLATE/enhancement.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.github/ISSUE_TEMPLATE/question.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.github/ISSUE_TEMPLATE/regression.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.github/workflows/stale.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.gitlab/labeler-config.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.gitlab/stages/00.pre.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.gitlab/stages/01.test.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.gitlab/stages/02.functional-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/.gitlab/stages/03.publish.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/llama_mistral.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/context_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/datasets.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/dist_checkpointing.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/dist_checkpointing.strategies.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/dist_optimizer.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/distributed.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/encoder_decoder_parallelism.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/fusions.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/models.bert.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/models.gpt.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/models.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/models.t5.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/moe.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/num_microbatches_calculator.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/optimizer_param_scheduler.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/pipeline_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/tensor_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/api-guide/transformer.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/images/context_parallel/CP_overview.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/images/context_parallel/CP_results.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/images/distrib_optimizer/data_flow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/images/distrib_optimizer/sharding_scheme.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/images/moe/token_drop.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/docs/source/user-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/run_simple_mcore_train_loop.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/finetune_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/finetune_gpt_distributed-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/generate-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/generate_samples_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/perspective_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/annotations/filter-selfgeneration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/annotations/perspective_api_annotate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/annotations/preprocess.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/detxoify_lm/self_generation/selfgenerate-1.3b-unconditional.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/msdp/data_processing.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/msdp/eval_knwl_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/msdp/eval_resp_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/msdp/prep_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/msdp/prompt_knwl_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/msdp/prompt_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/CONFIG.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/SBATCH.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/SRUN.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_11.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_12.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_13.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_14.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_15.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_16.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_17.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_figure_18.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/academic_paper_scripts/sc21/run_table_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/bert/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/bert/train_bert_340m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/knowledge_distillation/pretrain_gpt_modelopt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/ptq_trtllm_llama2_7b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/ptq_trtllm_llama3_1_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/ptq_trtllm_llama3_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/ptq_trtllm_minitron_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/ptq_trtllm_mistral_12b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/ptq_trtllm_mixtral_8x7b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/text_generation_ptq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/ptq_and_trtllm_export/trtllm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/trtllm_export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/trtllm_export/distributed_export/gpt_distributed_gpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/export/trtllm_export/single_device_export/gpt_single_device_cpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/gpt3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/gpt3/gpt_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/gpt3/train_gpt3_175b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/run_text_generation_server_345M.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/run_text_generation_server_345M_8_tensor_parallel.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/gpt/simple_gpt_batch_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/llama_mistral/huggingface_reference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/llama_mistral/run_text_generation_llama3.1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/llama_mistral/run_text_generation_llama3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/llama_mistral/run_text_generation_mistral.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/inference/t5/simple_t5_batch_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/mamba/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/mamba/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/mamba/run_text_gen_server_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/mamba/run_text_gen_server_8b_gpt3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/mamba/train.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/mixtral/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/mixtral/train_mixtral_8x7b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/combine_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/combine_state_dicts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/convert_llava_pretrain_to_wds.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/dataloader_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/dataset_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_ai2d.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_chartqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_coco.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_mathvista.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_mmmu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_ocrbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_textvqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluate_vqav2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/evaluation_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/image_processing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/manual_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/multimodal_args.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/pretrain_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/pretrain_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/run_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/sft_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/sft_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/text_generation_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/assets/pretrain_curves.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/model_converter/clip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/model_converter/internvit_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/model_converter/siglip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/model_converter/vision_model_tester.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/multimodal/nvlm/internvit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/retro/preprocess_data.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/retro/train_retro_2b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/t5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/t5/t5_mcore_train_curve.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/examples/t5/train_t5_220m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/images/model_table.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/images/strong_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/images/weak_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/QuickStart.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/README_STRAGGLER.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/config_logger.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/jit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/model_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/package_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/packed_seq_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/timers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/bert_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/blended_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/blended_megatron_dataset_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/blended_megatron_dataset_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/helpers.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/indexed_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/masked_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/megatron_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/megatron_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/readme.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/t5_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/utils_s3.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/config/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/config/bert_embedders.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/config/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/config/gpt_chunk_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/config/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/db/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/db/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/db/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/db/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/factory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/validate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/indexes/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/indexes/faiss_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/index/indexes/faiss_par_add.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/query/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/query/gpt_chunk_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/query/multi_split_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/query/query.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/query/retro_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/datasets/retro/query/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/exchange_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/state_dict_transformation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/validation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/filesystem_async.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/state_dict_saver.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/tensorstore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/torch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/two_stage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/dist_checkpointing/strategies/zarr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/distributed/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/distributed/distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/distributed/distributed_data_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/distributed/finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/distributed/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/data_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/export_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/trt_model_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/trt_model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/engine_builder/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/engine_builder/trtllm_engine_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/default_conversion_dict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/falcon_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/gemma_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/gpt_next_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/llama_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/model_to_trllm_mapping/starcoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/trtllm_weights_converter/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/trtllm_weights_converter/distributed_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/export/trtllm/trtllm_weights_converter/single_device_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/extensions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/extensions/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/fused_bias_dropout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/fused_bias_geglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/fused_bias_swiglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/fused_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/fusions/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/communication_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/inference_request.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/ammo_support/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/ammo_support/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/ammo_support/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/engines/abstract_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/engines/mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/model_inference_wrappers/abstract_model_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/model_inference_wrappers/inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/model_inference_wrappers/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/model_inference_wrappers/gpt/gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/model_inference_wrappers/t5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/model_inference_wrappers/t5/t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/modelopt_support/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/modelopt_support/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/modelopt_support/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/modelopt_support/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/text_generation_controllers/encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/inference/text_generation_controllers/simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/T5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/T5/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/T5/t5_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/bert/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/bert/bert_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/bert/bert_lm_head.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/bert/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/bert/pooler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/embeddings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/embeddings/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/embeddings/rope_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/embeddings/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/embeddings/yarn_rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/language_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/language_module/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/vision_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/common/vision_module/vision_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/gpt/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/gpt/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/mamba/mamba_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/mamba/mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/multimodal/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/multimodal/llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/multimodal/llava_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/base_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/decoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/decoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/encoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/encoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/vision/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/models/vision/vit_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/optimizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/optimizer/clip_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/optimizer/distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/optimizer/grad_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/optimizer/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/optimizer/optimizer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/pipeline_parallel/p2p_communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/pipeline_parallel/schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/ssm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/ssm/mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/ssm/mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/ssm/mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/ssm/mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/ssm/triton_cache_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/tensor_parallel/cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/tensor_parallel/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/tensor_parallel/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/tensor_parallel/mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/tensor_parallel/random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/tensor_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/cuda_graphs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/dot_product_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/identity_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/spec_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/torch_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/custom_layers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/custom_layers/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/legacy_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/core/transformer/moe/upcycling_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/algos/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/algos/distillation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/docs/distillation.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/endpoints/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/endpoints/completions.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/gpt/loss_func.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/gpt/model_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/static/index.html
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/beam_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/forward_step.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/sampling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/inference/text_generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/indexer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/autoaugment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/biencoder_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/data_samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/ict_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/image_folder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/orqa_wiki_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/realm_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/realm_index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/data/vit_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/fp16_deprecated/loss_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/fused_kernels/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/fused_kernels/compat.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/fused_kernels/type_shim.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/fused_kernels/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/fused_kernels/tests/test_fused_kernels.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/biencoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/multiple_choice.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/realm_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/esvit_swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/inpainting.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/knn_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/mit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/model/vision/vit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/mpu/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/mpu/tests/commons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/mpu/tests/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/mpu/tests/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/mpu/tests/test_initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/mpu/tests/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/legacy/mpu/tests/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/activations.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/dist_signal_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/ft_integration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/log_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/one_logger_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/theoretical_memory_usage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/yaml_arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/tokenizer/bert_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/tokenizer/gpt2_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/tokenizer/multimodal_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/megatron/training/tokenizer/tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/data_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/ensemble_classifier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/glue/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/glue/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/glue/mnli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/glue/qqp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/msdp/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/msdp/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/msdp/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/msdp/preprocessing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/msdp/prompt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/evaluate_orqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/evaluate_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/supervised/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/supervised/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/supervised/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/unsupervised/nq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/unsupervised/qa_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/orqa/unsupervised/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/quantize/calibrate_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/race/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/race/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/classification/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/classification/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/cityscapes.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/finetune_segformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/finetune_setr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/seg_heads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/seg_models.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/transforms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/vision/segmentation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/zeroshot_gpt/datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/zeroshot_gpt/detokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tasks/zeroshot_gpt/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/_build-mcore-dev.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/_build-mcore-lts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/_build-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/common.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/gpt-modelopt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/gpt-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/multimodal-llava.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/jet_recipes/t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/get_test_results_from_tensorboard_logs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/test_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/test_fp8_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/test_resume_checkpoint_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/jet/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/jet/generate_jet_trigger_job.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/jet/generate_local_jobs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/python_test_utils/jet/launch_jet_workload.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/shell_test_utils/_run_training.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/shell_test_utils/notify.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/shell_test_utils/notify_unit_tests.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/shell_test_utils/run_ci_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/bert/bert_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/common/ckpt_converter/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/common/ckpt_converter/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs1_gbs8_mcore_te_tp2_pp4_vp3_seq_par_overlap_p2p_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs4_gbs64_mcore_te_tp1_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.8.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_resume_torch_dist_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_2experts/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.8.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_resume_torch_etp3_dgx_a100_1N7G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/functional_tests/test_cases/t5/t5_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_basic.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_imports.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_local_multi_tensor_fns.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_utilities.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/data/test_bin_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/data/test_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/data/test_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/data/test_multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/data/test_preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/data/test_preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_async_save.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_cached_metadata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_flattened_resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_local.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_nonpersistent.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/test_serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/test_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/test_mlp_glu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/test_moe_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/test_retro_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/dist_checkpointing/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/distributed/test_grad_reduce_for_replicated_embedder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/distributed/test_param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/export/trtllm/test_trtllm_distributed_gpu_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/export/trtllm/test_trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/export/trtllm/test_trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/export/trtllm/test_trtllm_single_device_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/fusions/test_torch_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/test_common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/test_flash_decode.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/test_inference_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/test_modelopt_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/test_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/engines/test_mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/model_inference_wrappers/test_model_inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/model_inference_wrappers/gpt/test_gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/model_inference_wrappers/t5/test_t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/text_generation_controllers/test_encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/inference/text_generation_controllers/test_simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/interface_tests/test_transformer_forward.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_base_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/pipeline_parallel/test_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/pipeline_parallel/test_schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/ssm/test_mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/ssm/test_mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/ssm/test_mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/test_initialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/test_mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/tensor_parallel/test_tensor_parallel_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_attention_packed_seq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_core_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_retro_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_rope.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_spec_customization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/test_transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_aux_loss.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_routers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tests/unit_tests/transformer/moe/test_upcycling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/autoformat.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/copyright.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/linter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/merge_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/preprocess_data_nmt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/run_mamba_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/run_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/run_vlm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/text_generation_cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/bert_embedding/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/bert_embedding/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/bert_embedding/embed.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/bert_embedding/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/bert_embedding/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/convert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/hybrid_conversion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/loader_llama_mistral.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/loader_mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/loader_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/loader_mixtral_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/saver_mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/saver_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/setter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/checkpoint/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/add_id.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/blacklist_urls.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/cleanup_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/cleanup_fix_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/filter_ngrams.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/find_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/group_duplicate_url.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/merge_jsons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/openwebtext/remove_group_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/build_db.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/config_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/cli/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/cli/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/cli/cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/docker/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/sft/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/sft/dataset_conv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/sft/open_inst.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/sft/sft_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/sft/sft_retro_lm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/text_generation/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/text_generation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/text_generation/retro_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/text_generation/retro_generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/text_generation/retro_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-241113/tools/retro/text_generation/retro_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.coveragerc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.flake8
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.pylintrc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/CHANGELOG.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/Dockerfile.ci.dev
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/Dockerfile.ci.lts
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/Dockerfile.linting
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/MANIFEST.in
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/mypy.ini
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_bert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_ict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_t5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_vision_classify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_vision_dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_vision_inpaint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pretrain_vlm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/pytest.ini
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.github/ISSUE_TEMPLATE/bug.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.github/ISSUE_TEMPLATE/enhancement.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.github/ISSUE_TEMPLATE/question.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.github/ISSUE_TEMPLATE/regression.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.github/workflows/stale.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.gitlab/labeler-config.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.gitlab/stages/00.pre.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.gitlab/stages/01.test.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.gitlab/stages/02.functional-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/.gitlab/stages/03.publish.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/llama_mistral.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/context_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/datasets.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/dist_checkpointing.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/dist_checkpointing.strategies.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/dist_optimizer.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/distributed.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/encoder_decoder_parallelism.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/fusions.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/models.bert.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/models.gpt.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/models.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/models.t5.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/moe.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/num_microbatches_calculator.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/optimizer_param_scheduler.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/pipeline_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/tensor_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/api-guide/transformer.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/images/context_parallel/CP_overview.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/images/context_parallel/CP_results.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/images/distrib_optimizer/data_flow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/images/distrib_optimizer/sharding_scheme.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/images/moe/token_drop.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/docs/source/user-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/run_simple_mcore_train_loop.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/finetune_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/finetune_gpt_distributed-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/generate-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/generate_samples_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/perspective_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/annotations/filter-selfgeneration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/annotations/perspective_api_annotate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/annotations/preprocess.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/detxoify_lm/self_generation/selfgenerate-1.3b-unconditional.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/msdp/data_processing.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/msdp/eval_knwl_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/msdp/eval_resp_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/msdp/prep_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/msdp/prompt_knwl_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/msdp/prompt_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/CONFIG.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/SBATCH.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/SRUN.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_11.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_12.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_13.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_14.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_15.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_16.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_17.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_figure_18.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/academic_paper_scripts/sc21/run_table_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/bert/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/bert/train_bert_340m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/knowledge_distillation/pretrain_gpt_modelopt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/ptq_trtllm_llama2_7b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/ptq_trtllm_llama3_1_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/ptq_trtllm_llama3_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/ptq_trtllm_minitron_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/ptq_trtllm_mistral_12b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/ptq_trtllm_mixtral_8x7b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/text_generation_ptq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/ptq_and_trtllm_export/trtllm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/trtllm_export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/trtllm_export/distributed_export/gpt_distributed_gpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/export/trtllm_export/single_device_export/gpt_single_device_cpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/gpt3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/gpt3/gpt_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/gpt3/train_gpt3_175b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/run_text_generation_server_345M.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/run_text_generation_server_345M_8_tensor_parallel.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/gpt/gpt_batch_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/llama_mistral/huggingface_reference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/llama_mistral/run_text_generation_llama3.1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/llama_mistral/run_text_generation_llama3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/llama_mistral/run_text_generation_mistral.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/inference/t5/simple_t5_batch_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/mamba/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/mamba/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/mamba/run_text_gen_server_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/mamba/run_text_gen_server_8b_gpt3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/mamba/train.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/mixtral/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/mixtral/train_mixtral_8x7b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/combine_lm_vision_checkpoints.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/combine_state_dicts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/convert_llava_pretrain_to_wds.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/dataloader_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/dataset_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/energon_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/image_processing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/manual_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/multimodal_args.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/pretrain_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/pretrain_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/run_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/sft_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/sft_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/text_generation_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/assets/pretrain_curves.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_ai2d.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_chartqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_coco.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_mathvista.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_mmmu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_ocrbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_textvqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluate_vqav2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/evaluation/evaluation_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/model_converter/clip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/model_converter/internvit_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/model_converter/radio_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/model_converter/siglip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/model_converter/vision_model_tester.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/internvit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/nvlm_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/pp_checkpoint_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/pretrain_blend.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/pretrain_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/pretrain_yi_34b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/run_text_generation_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/run_text_generation_qwen25_7b_internvit_video.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/run_text_generation_qwen25_7b_siglip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/run_text_generation_yi_34b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/sft_34b_internvit.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/sft_blend.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/sft_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/multimodal/nvlm/sft_qwen2p5_7b_internvit_6b_video.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/retro/preprocess_data.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/retro/train_retro_2b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/t5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/t5/t5_mcore_train_curve.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/examples/t5/train_t5_220m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/images/model_table.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/images/strong_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/images/weak_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/QuickStart.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/README_STRAGGLER.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/config_logger.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/jit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/model_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/package_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/packed_seq_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/rerun_state_machine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/timers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/bert_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/blended_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/blended_megatron_dataset_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/blended_megatron_dataset_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/helpers.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/indexed_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/masked_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/megatron_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/megatron_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/readme.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/t5_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/utils_s3.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/config/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/config/bert_embedders.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/config/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/config/gpt_chunk_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/config/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/db/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/db/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/db/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/db/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/factory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/validate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/indexes/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/indexes/faiss_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/index/indexes/faiss_par_add.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/query/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/query/gpt_chunk_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/query/multi_split_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/query/query.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/query/retro_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/datasets/retro/query/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/exchange_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/state_dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/tensor_aware_state_dict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/validation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/cached_metadata_filesystem_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/filesystem_async.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/state_dict_saver.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/tensorstore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/torch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/two_stage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/dist_checkpointing/strategies/zarr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/data_parallel_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/distributed_data_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/distributed/torch_fully_sharded_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/data_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/export_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/trt_model_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/trt_model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/engine_builder/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/engine_builder/trtllm_engine_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/model_to_trllm_mapping/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/model_to_trllm_mapping/default_conversion_dict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/trtllm_weights_converter/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/trtllm_weights_converter/distributed_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/export/trtllm/trtllm_weights_converter/single_device_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/extensions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/extensions/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/fused_bias_dropout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/fused_bias_geglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/fused_bias_swiglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/fused_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/fusions/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/async_stream.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/communication_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/inference_request.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/sampling_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/engines/abstract_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/engines/mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/abstract_model_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/gpt/gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/multimodal/vlm_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/t5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/model_inference_wrappers/t5/t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/modelopt_support/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/modelopt_support/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/modelopt_support/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/modelopt_support/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/modelopt_support/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/modelopt_support/mamba/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/text_generation_controllers/encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/text_generation_controllers/simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/text_generation_controllers/text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/inference/text_generation_controllers/vlm_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/T5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/T5/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/T5/t5_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/bert/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/bert/bert_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/bert/bert_lm_head.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/bert/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/bert/pooler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/embeddings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/embeddings/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/embeddings/relative_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/embeddings/rope_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/embeddings/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/embeddings/yarn_rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/language_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/language_module/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/vision_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/common/vision_module/vision_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/gpt/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/gpt/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/gpt/moe_module_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/huggingface/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/huggingface/clip_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/huggingface/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/huggingface/qwen_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/mamba/mamba_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/mamba/mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/multimodal/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/multimodal/context_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/multimodal/llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/multimodal/llava_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/base_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/decoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/decoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/encoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/encoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/vision/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/vision/radio.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/models/vision/vit_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/clip_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/grad_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/optimizer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/cpu_offloading/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/cpu_offloading/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/optimizer/cpu_offloading/hybrid_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/pipeline_parallel/p2p_communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/pipeline_parallel/schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/ssm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/ssm/mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/ssm/mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/ssm/mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/ssm/mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/ssm/triton_cache_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/tensor_parallel/cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/tensor_parallel/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/tensor_parallel/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/tensor_parallel/mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/tensor_parallel/random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/tensor_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/cuda_graphs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/dot_product_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/identity_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/spec_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/torch_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/torch_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/custom_layers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/custom_layers/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/legacy_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/core/transformer/moe/upcycling_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/algos/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/algos/distillation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/docs/distillation.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/endpoints/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/endpoints/completions.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/gpt/loss_func.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/gpt/model_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/static/index.html
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/beam_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/forward_step.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/sampling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/inference/text_generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/indexer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/autoaugment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/biencoder_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/data_samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/ict_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/image_folder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/orqa_wiki_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/realm_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/realm_index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/data/vit_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/fp16_deprecated/loss_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/fused_kernels/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/fused_kernels/compat.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/fused_kernels/type_shim.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/fused_kernels/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/fused_kernels/tests/test_fused_kernels.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/biencoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/multiple_choice.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/realm_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/esvit_swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/inpainting.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/knn_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/mit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/model/vision/vit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/mpu/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/mpu/tests/commons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/mpu/tests/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/mpu/tests/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/mpu/tests/test_initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/mpu/tests/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/legacy/mpu/tests/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/activations.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/dist_signal_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/ft_integration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/log_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/one_logger_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/theoretical_memory_usage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/wandb_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/yaml_arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/tokenizer/bert_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/tokenizer/gpt2_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/tokenizer/multimodal_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/megatron/training/tokenizer/tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/requirements/pytorch_24.01/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/requirements/pytorch_24.07/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/requirements/pytorch_24.10/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/data_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/ensemble_classifier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/glue/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/glue/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/glue/mnli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/glue/qqp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/msdp/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/msdp/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/msdp/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/msdp/preprocessing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/msdp/prompt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/evaluate_orqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/evaluate_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/supervised/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/supervised/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/supervised/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/unsupervised/nq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/unsupervised/qa_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/orqa/unsupervised/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/quantize/calibrate_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/race/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/race/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/classification/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/classification/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/cityscapes.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/finetune_segformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/finetune_setr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/seg_heads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/seg_models.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/transforms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/vision/segmentation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/zeroshot_gpt/datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/zeroshot_gpt/detokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tasks/zeroshot_gpt/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/python_test_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/python_test_utils/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/python_test_utils/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/python_test_utils/get_test_results_from_tensorboard_logs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/python_test_utils/test_regular_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/python_test_utils/test_resume_checkpoint_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/shell_test_utils/_run_training.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/shell_test_utils/run_ci_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/bert/bert_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/common/ckpt_converter/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/common/ckpt_converter/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs1_gbs8_mcore_te_8experts_tp2_ep2_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs1_gbs8_mcore_te_tp2_pp4_vp3_seq_par_overlap_p2p_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs4_gbs64_mcore_te_tp1_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.8.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_fsdp2_resume_torch_dist_te/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel_dp_last/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_resume_torch_dist_te_4experts2parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_resume_torch_dist_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_2experts/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp1_pp4_memory_speed/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp1_pp4_memory_speed/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_fsdp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_dp_last_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.8.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dist_opt_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dist_opt_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dist_opt_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_resume_torch_etp3_dgx_a100_1N7G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_resume_torch_etp3_dgx_a100_1N7G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_resume_torch_etp3_dgx_a100_1N7G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_frozen_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_frozen_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_frozen_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/functional_tests/test_cases/t5/t5_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/python_scripts/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/python_scripts/download_golden_values.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/python_scripts/generate_jet_trigger_job.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/python_scripts/generate_local_jobs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/python_scripts/launch_jet_workload.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/_build-mcore-dev.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/_build-mcore-lts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/_build-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/gpt-modelopt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/gpt-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/multimodal-llava.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/recipes/unit-tests.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/test_utils/shell_scripts/notify.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_basic.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_imports.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_local_multi_tensor_fns.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_model_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_optimizer_cpu_offloading.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_utilities.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/data/test_bin_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/data/test_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/data/test_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/data/test_multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/data/test_preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/data/test_preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_async_save.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_flattened_resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_global_metadata_reuse.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_local.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_nonpersistent.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_replication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/test_torch_dist.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/test_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/test_mlp_glu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/test_moe_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/test_retro_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/dist_checkpointing/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/distributed/test_finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/distributed/test_grad_reduce_for_replicated_embedder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/distributed/test_grad_sync_with_expert_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/distributed/test_param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/export/trtllm/test_distributed_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/export/trtllm/test_single_device_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/export/trtllm/test_trtllm_distributed_gpu_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/export/trtllm/test_trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/export/trtllm/test_trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/export/trtllm/test_trtllm_single_device_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/fusions/test_torch_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/test_common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/test_flash_decode.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/test_inference_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/test_modelopt_module_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/test_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/engines/test_mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/model_inference_wrappers/test_model_inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/model_inference_wrappers/gpt/test_gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/model_inference_wrappers/t5/test_t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/text_generation_controllers/test_encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/text_generation_controllers/test_simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/inference/text_generation_controllers/test_vlm_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_base_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_radio_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/pipeline_parallel/test_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/pipeline_parallel/test_schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/ssm/test_mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/ssm/test_mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/ssm/test_mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/ssm/test_mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/test_initialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/test_mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/tensor_parallel/test_tensor_parallel_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_attention_packed_seq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_core_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_relative_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_retro_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_rope.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_spec_customization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/test_transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_aux_loss.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_routers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tests/unit_tests/transformer/moe/test_upcycling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/autoformat.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/copyright.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/linter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/merge_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/preprocess_data_nmt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/run_mamba_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/run_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/run_vlm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/text_generation_cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/bert_embedding/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/bert_embedding/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/bert_embedding/embed.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/bert_embedding/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/bert_embedding/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/convert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/hybrid_conversion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/loader_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/loader_legacy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/loader_llama_mistral.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/loader_mixtral_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/saver_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/saver_legacy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/schema_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/schema_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/checkpoint/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/add_id.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/blacklist_urls.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/cleanup_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/cleanup_fix_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/filter_ngrams.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/find_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/group_duplicate_url.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/merge_jsons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/openwebtext/remove_group_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/build_db.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/config_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/cli/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/cli/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/cli/cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/docker/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/sft/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/sft/dataset_conv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/sft/open_inst.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/sft/sft_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/sft/sft_retro_lm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/text_generation/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/text_generation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/text_generation/retro_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/text_generation/retro_generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/text_generation/retro_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250217/tools/retro/text_generation/retro_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.coveragerc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.flake8
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.pylintrc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/CHANGELOG.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/Dockerfile.ci.dev
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/Dockerfile.ci.lts
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/Dockerfile.linting
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/MANIFEST.in
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/mypy.ini
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_bert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_ict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_t5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_vision_classify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_vision_dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_vision_inpaint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pretrain_vlm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/pytest.ini
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/requirements_ci.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/requirements_mlm.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.github/ISSUE_TEMPLATE/bug.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.github/ISSUE_TEMPLATE/enhancement.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.github/ISSUE_TEMPLATE/question.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.github/ISSUE_TEMPLATE/regression.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.github/workflows/stale.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.gitlab/labeler-config.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.gitlab/stages/00.pre.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.gitlab/stages/01.build.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.gitlab/stages/02.test.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.gitlab/stages/03.integration-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.gitlab/stages/04.functional-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/.gitlab/stages/05.publish.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/llama_mistral.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/context_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/custom_fsdp.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/datasets.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/dist_checkpointing.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/dist_checkpointing.strategies.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/dist_optimizer.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/distributed.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/encoder_decoder_parallelism.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/fusions.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/models.bert.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/models.gpt.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/models.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/models.t5.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/moe.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/multi_latent_attention.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/multi_token_prediction.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/num_microbatches_calculator.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/optimizer_cpu_offload.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/optimizer_param_scheduler.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/pipeline_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/tensor_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/api-guide/transformer.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/context_parallel/CP_overview.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/context_parallel/CP_results.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/custom_fsdp/FSDP_Allreduce.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/custom_fsdp/FSDP_workflow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/custom_fsdp/MCore_Custom_FSDP_Class_Diagram.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/distrib_optimizer/data_flow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/distrib_optimizer/sharding_scheme.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/moe/token_drop.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/images/multi_token_prediction/MTP_implementation.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/docs/source/user-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/run_simple_mcore_train_loop.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/finetune_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/finetune_gpt_distributed-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/generate-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/generate_samples_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/perspective_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/annotations/filter-selfgeneration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/annotations/perspective_api_annotate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/annotations/preprocess.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/detxoify_lm/self_generation/selfgenerate-1.3b-unconditional.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/msdp/data_processing.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/msdp/eval_knwl_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/msdp/eval_resp_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/msdp/prep_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/msdp/prompt_knwl_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/msdp/prompt_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/CONFIG.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/SBATCH.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/SRUN.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_11.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_12.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_13.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_14.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_15.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_16.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_17.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_figure_18.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/academic_paper_scripts/sc21/run_table_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/bert/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/bert/train_bert_340m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/export/knowledge_distillation/pretrain_gpt_modelopt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/export/trtllm_export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/export/trtllm_export/distributed_export/gpt_distributed_gpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/export/trtllm_export/single_device_export/gpt_single_device_cpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/gpt3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/gpt3/gpt_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/gpt3/train_gpt3_175b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/run_text_generation_server_345M.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/run_text_generation_server_345M_8_tensor_parallel.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/gpt/gpt_dynamic_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/gpt/gpt_dynamic_inference_12b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/gpt/gpt_dynamic_inference_357m.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/gpt/gpt_static_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/gpt/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/llama_mistral/huggingface_reference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/llama_mistral/run_text_generation_llama3.1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/llama_mistral/run_text_generation_llama3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/llama_mistral/run_text_generation_mistral.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/inference/t5/simple_t5_batch_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/mamba/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/mamba/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/mamba/run_text_gen_server_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/mamba/run_text_gen_server_8b_gpt3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/mamba/train.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/mixtral/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/mixtral/train_mixtral_8x7b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/combine_lm_vision_checkpoints.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/combine_state_dicts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/convert_llava_pretrain_to_wds.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/dataloader_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/dataset_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/energon_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/image_processing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/layer_scaling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/manual_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/multimodal_args.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/pretrain_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/pretrain_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/run_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/sft_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/sft_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/text_generation_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/assets/pretrain_curves.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_ai2d.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_chartqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_coco.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_infovqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_mathvista.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_mmmu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_ocrbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_ocrbench_v2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_rd_tablebench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_realworldqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_spdocvqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_textvqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_video_motionbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_video_mvbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_video_phys_game_bench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluate_vqav2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/evaluation_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/evaluation/mmmu_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/model_converter/clip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/model_converter/internvit_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/model_converter/radio_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/model_converter/siglip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/model_converter/vision_model_tester.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/internvit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/nvlm_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/pp_checkpoint_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/pretrain_blend.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/pretrain_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/pretrain_yi_34b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/run_text_generation_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/run_text_generation_qwen25_7b_internvit_video.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/run_text_generation_qwen25_7b_siglip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/run_text_generation_yi_34b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/sft_34b_internvit.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/sft_blend.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/sft_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/nvlm/sft_qwen2p5_7b_internvit_6b_video.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/multimodal/radio/radio_g.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/convert.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/convert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/export.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/quantize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/quantize.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/conf/arguments.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/conf/deepseek-ai/DeepSeek-R1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/conf/deepseek-ai/DeepSeek-V2-Lite.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/conf/meta-llama/Llama-3.1-8B-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/conf/meta-llama/Llama-3.2-1B-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/post_training/modelopt/conf/nvidia/Nemotron-Mini-4B-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/retro/preprocess_data.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/retro/train_retro_2b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/t5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/t5/t5_mcore_train_curve.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/examples/t5/train_t5_220m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/images/model_table.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/images/strong_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/images/weak_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/QuickStart.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/README_STRAGGLER.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/config_logger.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fp8_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/jit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/model_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/package_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/packed_seq_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/rerun_state_machine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/timers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/bert_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/blended_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/blended_megatron_dataset_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/blended_megatron_dataset_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/helpers.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/indexed_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/masked_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/megatron_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/megatron_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/readme.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/t5_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/utils_s3.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/config/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/config/bert_embedders.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/config/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/config/gpt_chunk_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/config/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/db/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/db/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/db/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/db/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/factory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/validate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/indexes/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/indexes/faiss_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/index/indexes/faiss_par_add.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/query/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/query/gpt_chunk_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/query/multi_split_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/query/query.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/query/retro_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/datasets/retro/query/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/exchange_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/state_dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/tensor_aware_state_dict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/validation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/cached_metadata_filesystem_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/filesystem_async.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/state_dict_saver.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/tensorstore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/torch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/two_stage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/dist_checkpointing/strategies/zarr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/data_parallel_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/distributed_data_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/torch_fully_sharded_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/custom_fsdp/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/custom_fsdp/fully_sharded_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/distributed/custom_fsdp/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/data_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/export_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/trt_model_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/trt_model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/engine_builder/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/engine_builder/trtllm_engine_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/model_to_trllm_mapping/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/model_to_trllm_mapping/default_conversion_dict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/trtllm_weights_converter/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/trtllm_weights_converter/distributed_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/export/trtllm/trtllm_weights_converter/single_device_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/extensions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/extensions/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/fused_bias_dropout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/fused_bias_geglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/fused_bias_swiglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/fused_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/fusions/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/async_stream.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/communication_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/inference_request.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/sampling_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/contexts/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/contexts/base_context.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/contexts/dynamic_context.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/contexts/static_context.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/engines/abstract_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/engines/dynamic_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/engines/mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/engines/static_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/abstract_model_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/gpt/gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/multimodal/vlm_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/t5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/model_inference_wrappers/t5/t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/modelopt_support/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/modelopt_support/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/modelopt_support/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/modelopt_support/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/modelopt_support/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/modelopt_support/mamba/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/text_generation_controllers/encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/text_generation_controllers/simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/text_generation_controllers/text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/inference/text_generation_controllers/vlm_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/T5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/T5/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/T5/t5_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/bert/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/bert/bert_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/bert/bert_lm_head.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/bert/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/bert/pooler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/embeddings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/embeddings/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/embeddings/relative_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/embeddings/rope_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/embeddings/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/embeddings/yarn_rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/language_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/language_module/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/vision_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/common/vision_module/vision_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/gpt/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/gpt/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/gpt/moe_module_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/huggingface/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/huggingface/clip_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/huggingface/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/huggingface/qwen_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/mamba/mamba_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/mamba/mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/multimodal/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/multimodal/context_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/multimodal/llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/multimodal/llava_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/base_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/decoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/decoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/encoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/encoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/vision/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/vision/radio.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/models/vision/vit_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/clip_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/grad_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/optimizer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/cpu_offloading/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/cpu_offloading/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/optimizer/cpu_offloading/hybrid_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/pipeline_parallel/p2p_communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/pipeline_parallel/schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/modelopt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/modelopt/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/modelopt/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/modelopt/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/modelopt/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/modelopt/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/post_training/modelopt/mamba/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/mamba_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/mlp_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/ssm/triton_cache_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/tensor_parallel/cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/tensor_parallel/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/tensor_parallel/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/tensor_parallel/mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/tensor_parallel/random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/tensor_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/cuda_graphs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/dot_product_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/identity_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/multi_token_prediction.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/spec_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/torch_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/torch_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/custom_layers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/custom_layers/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/fused_a2a.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/legacy_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/core/transformer/moe/upcycling_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/endpoints/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/endpoints/completions.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/static/index.html
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/beam_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/forward_step.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/mcore_engine_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/sampling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/inference/text_generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/indexer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/autoaugment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/biencoder_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/data_samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/ict_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/image_folder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/orqa_wiki_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/realm_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/realm_index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/data/vit_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/fp16_deprecated/loss_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/fused_kernels/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/fused_kernels/compat.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/fused_kernels/type_shim.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/fused_kernels/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/fused_kernels/tests/test_fused_kernels.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/biencoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/multiple_choice.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/realm_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/esvit_swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/inpainting.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/knn_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/mit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/model/vision/vit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/mpu/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/mpu/tests/commons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/mpu/tests/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/mpu/tests/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/mpu/tests/test_initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/mpu/tests/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/legacy/mpu/tests/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/loss_func.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/model_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/algos/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/algos/distillation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/post_training/docs/distillation.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/activations.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/dist_signal_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/ft_integration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/log_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/one_logger_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/theoretical_memory_usage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/wandb_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/yaml_arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/tokenizer/bert_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/tokenizer/gpt2_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/tokenizer/multimodal_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/megatron/training/tokenizer/tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/requirements/pytorch_24.01/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/requirements/pytorch_24.07/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/requirements/pytorch_24.10/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/data_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/ensemble_classifier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/glue/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/glue/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/glue/mnli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/glue/qqp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/msdp/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/msdp/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/msdp/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/msdp/preprocessing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/msdp/prompt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/evaluate_orqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/evaluate_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/supervised/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/supervised/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/supervised/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/unsupervised/nq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/unsupervised/qa_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/orqa/unsupervised/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/quantize/calibrate_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/race/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/race/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/classification/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/classification/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/cityscapes.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/finetune_segformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/finetune_setr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/seg_heads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/seg_models.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/transforms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/vision/segmentation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/zeroshot_gpt/datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/zeroshot_gpt/detokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tasks/zeroshot_gpt/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/python_test_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/python_test_utils/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/python_test_utils/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/python_test_utils/get_test_results_from_tensorboard_logs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/python_test_utils/test_regular_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/python_test_utils/test_resume_checkpoint_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/shell_test_utils/_run_training.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/shell_test_utils/run_ci_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp1_pp4_vp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/bert/bert_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/common/ckpt_converter/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/common/ckpt_converter/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs1_gbs8_mcore_te_8experts_tp2_ep2_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs1_gbs8_mcore_te_tp2_pp4_vp3_seq_par_overlap_p2p_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt-nemo/gpt3-nemo_126m_mr_mbs4_gbs64_mcore_te_tp1_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.8.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/golden_values_0.11.0_pyt2410.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_fsdp2_resume_torch_dist_te/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp1_pp4_memory_speed/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp1_pp4_memory_speed/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_frozen_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_frozen_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_frozen_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_frozen_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_frozen_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_frozen_resume_torch_dist_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_fsdp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_dp_last_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_nondeterministic_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_dp_last_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_mla_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_mla_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_te_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp1_pp4_vp1_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_mr_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.8.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel_dp_last/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_resume_torch_dist_te_4experts2parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_resume_torch_dist_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_2experts/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_ep8_resume_torch_dist_dist_optimizer/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_ep8_resume_torch_dist_dist_optimizer/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_ep8_resume_torch_dist_dist_optimizer/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_tp4_ep2_etp2_pp2_resume_torch_dist_dist_optimizer/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_tp4_ep2_etp2_pp2_resume_torch_dist_dist_optimizer/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_tp4_ep2_etp2_pp2_resume_torch_dist_dist_optimizer/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp2_pp3_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_etp3_dgx_a100_1N7G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dist_opt_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dist_opt_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_freeze_vit_freeze_lm_dist_opt_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_resume_torch_etp3_dgx_a100_1N7G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_resume_torch_etp3_dgx_a100_1N7G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_pp1_resume_torch_etp3_dgx_a100_1N7G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_sp_cp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_sp_cp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_sp_cp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_frozen_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_frozen_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_frozen_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp2_pp2_resume_torch_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.10.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.9.0.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/functional_tests/test_cases/t5/t5_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/check_status_of_main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/dashboard.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/download_coverage_results.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/download_golden_values.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/generate_jet_trigger_job.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/generate_local_jobs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/launch_jet_workload.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/python_scripts/notify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/_build-mcore-dev.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/_build-mcore-lts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/_build-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/common.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/gpt-modelopt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/gpt-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/moe.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/multimodal-llava.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/test_utils/recipes/unit-tests.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_basic.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_imports.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_local_multi_tensor_fns.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_model_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_optimizer_cpu_offloading.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_utilities.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/data/test_bin_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/data/test_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/data/test_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/data/test_multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/data/test_preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/data/test_preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_async_save.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_flattened_resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_global_metadata_reuse.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_local.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_nonpersistent.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_replication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/test_torch_dist.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/test_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/test_mlp_glu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/test_moe_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/test_retro_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/dist_checkpointing/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/distributed/test_finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/distributed/test_grad_reduce_for_replicated_embedder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/distributed/test_grad_sync_with_expert_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/distributed/test_param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/distributed/test_torch_fully_sharded_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/export/trtllm/test_distributed_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/export/trtllm/test_single_device_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/export/trtllm/test_trtllm_distributed_gpu_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/export/trtllm/test_trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/export/trtllm/test_trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/export/trtllm/test_trtllm_single_device_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/fusions/test_torch_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/test_common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/test_flash_decode.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/test_inference_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/test_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/engines/test_dynamic_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/engines/test_static_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/model_inference_wrappers/test_model_inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/model_inference_wrappers/gpt/test_gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/model_inference_wrappers/t5/test_t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/text_generation_controllers/test_encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/text_generation_controllers/test_simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/inference/text_generation_controllers/test_vlm_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_base_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_radio_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/pipeline_parallel/test_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/pipeline_parallel/test_schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/post_training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/post_training/test_modelopt_module_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/ssm/test_mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/ssm/test_mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/ssm/test_mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/ssm/test_mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/test_initialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/test_mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/tensor_parallel/test_tensor_parallel_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_attention_packed_seq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_core_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_multi_token_prediction.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_relative_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_retro_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_rope.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_spec_customization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/test_transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_aux_loss.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_moe_layer_discrepancy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_routers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tests/unit_tests/transformer/moe/test_upcycling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/autoformat.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/copyright.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/linter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/merge_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/preprocess_data_nmt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/run_inference_performance_test.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/run_mamba_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/run_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/run_vlm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/text_generation_cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/bert_embedding/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/bert_embedding/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/bert_embedding/embed.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/bert_embedding/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/bert_embedding/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/convert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/hybrid_conversion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/loader_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/loader_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/loader_legacy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/loader_llama_mistral.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/loader_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/loader_mixtral_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/saver_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/saver_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/saver_hf_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/saver_legacy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/saver_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/schema_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/schema_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/checkpoint/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/add_id.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/blacklist_urls.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/cleanup_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/cleanup_fix_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/filter_ngrams.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/find_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/group_duplicate_url.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/merge_jsons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/openwebtext/remove_group_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/build_db.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/config_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/cli/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/cli/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/cli/cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/docker/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/sft/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/sft/dataset_conv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/sft/open_inst.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/sft/sft_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/sft/sft_retro_lm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/text_generation/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/text_generation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/text_generation/retro_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/text_generation/retro_generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/text_generation/retro_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250328/tools/retro/text_generation/retro_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.flake8
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.pre-commit-config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.pylintrc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/CHANGELOG.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/MANIFEST.in
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_bert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_ict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_t5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_vision_classify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_vision_dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_vision_inpaint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pretrain_vlm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/uv.lock
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.github/ISSUE_TEMPLATE/bug.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.github/ISSUE_TEMPLATE/enhancement.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.github/ISSUE_TEMPLATE/question.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.github/ISSUE_TEMPLATE/regression.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.github/workflows/stale.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/labeler-config.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/scripts/build.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/scripts/fetch-legacy-suite.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/stages/00.pre.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/stages/01.build.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/stages/02.test.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/stages/03.integration-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/stages/04.functional-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/.gitlab/stages/05.publish.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/Dockerfile.ci.dev
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/Dockerfile.ci.lts
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/Dockerfile.ci.nemo
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/Dockerfile.linting
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/common/build_causalconv1d.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/common/build_groupedgemm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/common/build_mamba.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/common/build_te.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/common/install.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docker/common/manifest.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/llama_mistral.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/context_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/custom_fsdp.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/datasets.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/dist_checkpointing.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/dist_checkpointing.strategies.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/dist_optimizer.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/distributed.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/encoder_decoder_parallelism.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/fusions.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/models.bert.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/models.gpt.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/models.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/models.t5.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/moe.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/multi_latent_attention.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/multi_token_prediction.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/num_microbatches_calculator.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/optimizer_cpu_offload.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/optimizer_param_scheduler.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/pipeline_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/pipeline_parallel_layout.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/tensor_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/api-guide/transformer.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/context_parallel/CP_overview.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/context_parallel/CP_results.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/custom_fsdp/FSDP_Allreduce.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/custom_fsdp/FSDP_workflow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/custom_fsdp/MCore_Custom_FSDP_Class_Diagram.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/distrib_optimizer/data_flow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/distrib_optimizer/sharding_scheme.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/moe/token_drop.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/images/multi_token_prediction/MTP_implementation.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/docs/source/user-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/run_simple_mcore_train_loop.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/finetune_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/finetune_gpt_distributed-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/generate-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/generate_samples_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/perspective_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/annotations/filter-selfgeneration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/annotations/perspective_api_annotate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/annotations/preprocess.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/detxoify_lm/self_generation/selfgenerate-1.3b-unconditional.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/msdp/data_processing.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/msdp/eval_knwl_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/msdp/eval_resp_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/msdp/prep_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/msdp/prompt_knwl_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/msdp/prompt_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/CONFIG.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/SBATCH.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/SRUN.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_11.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_12.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_13.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_14.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_15.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_16.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_17.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_figure_18.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/academic_paper_scripts/sc21/run_table_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/bert/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/bert/train_bert_340m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/export/trtllm_export/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/export/trtllm_export/distributed_export/gpt_distributed_gpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/export/trtllm_export/single_device_export/gpt_single_device_cpu_export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/gpt3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/gpt3/gpt_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/gpt3/train_gpt3_175b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/run_text_generation_server_345M.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/run_text_generation_server_345M_8_tensor_parallel.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/gpt/gpt_dynamic_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/gpt/gpt_dynamic_inference_12b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/gpt/gpt_dynamic_inference_357m.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/gpt/gpt_static_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/gpt/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/llama_mistral/huggingface_reference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/llama_mistral/run_static_inference_llama4_scout.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/llama_mistral/run_text_generation_llama3.1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/llama_mistral/run_text_generation_llama3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/llama_mistral/run_text_generation_mistral.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/inference/t5/simple_t5_batch_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/llama/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/llama/train_llama3_8b_h100_fp8.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/mamba/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/mamba/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/mamba/run_text_gen_server_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/mamba/run_text_gen_server_8b_gpt3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/mamba/train.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/mixtral/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/mixtral/train_mixtral_8x7b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/combine_lm_vision_checkpoints.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/combine_state_dicts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/convert_llava_pretrain_to_wds.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/dataloader_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/dataset_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/energon_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/image_processing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/layer_scaling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/manual_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/multimodal_args.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/pretrain_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/pretrain_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/run_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/sft_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/sft_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/text_generation_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/assets/pretrain_curves.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_ai2d.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_chartqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_coco.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_infovqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_mathvista.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_mmmu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_ocrbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_ocrbench_v2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_rd_tablebench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_realworldqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_spdocvqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_textvqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_video_motionbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_video_mvbench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_video_phys_game_bench.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluate_vqav2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/evaluation_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/evaluation/mmmu_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/llama_3p1_nemotron_nano_vl_8b_v1/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/llama_3p1_nemotron_nano_vl_8b_v1/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/llama_3p1_nemotron_nano_vl_8b_v1/pretraining_llama_3p1_nemotron_nano_vl_8b_v1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/llama_3p1_nemotron_nano_vl_8b_v1/sft_llama_3p1_nemotron_nano_vl_8b_v1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/llama_3p1_nemotron_nano_vl_8b_v1/text_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/model_converter/clip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/model_converter/internvit_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/model_converter/radio_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/model_converter/siglip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/model_converter/vision_model_tester.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/internvit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/nvlm_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/pp_checkpoint_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/pretrain_blend.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/pretrain_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/pretrain_yi_34b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/run_text_generation_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/run_text_generation_qwen25_7b_internvit_video.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/run_text_generation_qwen25_7b_siglip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/run_text_generation_yi_34b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/sft_34b_internvit.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/sft_blend.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/sft_qwen20_72b_internvit_6b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/nvlm/sft_qwen2p5_7b_internvit_6b_video.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/multimodal/radio/radio_g.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/convert.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/convert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/export.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/export.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/finetune.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/generate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/mmlu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/mmlu.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/quantize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/quantize.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/speculative.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/arguments.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/deepseek-ai/DeepSeek-R1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/deepseek-ai/DeepSeek-V2-Lite.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/meta-llama/Llama-3.1-8B-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/meta-llama/Llama-3.2-1B-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/meta-llama/Llama-4-Maverick-17B-128E-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/meta-llama/Llama-4-Scout-17B-16E-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/nvidia/Nemotron-H-4B-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/nvidia/Nemotron-H-8B-Base-8K.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/nvidia/Nemotron-Mini-4B-Instruct.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/qwen/Qwen3-235B-A22B.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/post_training/modelopt/conf/qwen/Qwen3-30B-A3B.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/retro/preprocess_data.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/retro/train_retro_2b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/t5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/t5/t5_mcore_train_curve.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/examples/t5/train_t5_220m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/images/model_table.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/images/strong_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/images/weak_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/MSC_Integration.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/QuickStart.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/README_STRAGGLER.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/config_logger.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/energy_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fp8_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/jit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/model_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/msc_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/package_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/packed_seq_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/process_groups_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/rerun_state_machine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/timers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/bert_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/blended_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/blended_megatron_dataset_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/blended_megatron_dataset_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/helpers.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/indexed_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/masked_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/megatron_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/megatron_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/object_storage_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/readme.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/t5_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/utils_object_storage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/utils_s3.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/config/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/config/bert_embedders.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/config/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/config/gpt_chunk_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/config/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/db/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/db/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/db/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/db/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/factory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/validate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/indexes/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/indexes/faiss_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/index/indexes/faiss_par_add.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/query/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/query/gpt_chunk_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/query/multi_split_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/query/query.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/query/retro_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/datasets/retro/query/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/exchange_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/state_dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/tensor_aware_state_dict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/validation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/cached_metadata_filesystem_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/filesystem_async.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/state_dict_saver.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/tensorstore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/torch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/two_stage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/dist_checkpointing/strategies/zarr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/data_parallel_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/distributed_data_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/torch_fully_sharded_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/torch_fully_sharded_data_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/custom_fsdp/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/custom_fsdp/fully_sharded_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/distributed/custom_fsdp/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/data_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/export_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trt_model_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trt_model_type.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/engine_builder/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/engine_builder/trtllm_engine_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/model_to_trllm_mapping/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/model_to_trllm_mapping/default_conversion_dict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trtllm_weights_converter/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trtllm_weights_converter/distributed_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trtllm_weights_converter/single_device_trtllm_model_weights_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/export/trtllm/trtllm_weights_converter/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/extensions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/extensions/kitchen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/extensions/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/extensions/transformer_engine_spec_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_bias_dropout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_bias_geglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_bias_swiglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_indices_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_mla_yarn_rope_apply.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_pad_routing_map.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/fusions/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/async_stream.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/communication_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/inference_request.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/sampling_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/contexts/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/contexts/base_context.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/contexts/dynamic_chunk_allocator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/contexts/dynamic_context.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/contexts/static_context.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/engines/abstract_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/engines/dynamic_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/engines/mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/engines/static_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/abstract_model_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/gpt/gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/multimodal/vlm_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/t5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/model_inference_wrappers/t5/t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/text_generation_controllers/encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/text_generation_controllers/simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/text_generation_controllers/text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/inference/text_generation_controllers/vlm_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/backends.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/T5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/T5/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/T5/t5_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/bert/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/bert/bert_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/bert/bert_lm_head.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/bert/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/bert/pooler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/embeddings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/embeddings/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/embeddings/relative_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/embeddings/rope_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/embeddings/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/embeddings/yarn_rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/language_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/language_module/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/vision_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/common/vision_module/vision_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/gpt/fine_grained_callables.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/gpt/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/gpt/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/gpt/moe_module_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/gpt/heterogeneous/heterogeneous_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/huggingface/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/huggingface/clip_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/huggingface/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/huggingface/qwen_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mamba/mamba_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mamba/mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/config/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/config/base_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/model/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/submodules/audio.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/submodules/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/mimo/submodules/vision.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/multimodal/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/multimodal/context_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/multimodal/llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/multimodal/llava_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/base_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/decoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/decoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/encoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/encoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/vision/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/vision/radio.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/models/vision/vit_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/clip_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/grad_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/optimizer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/cpu_offloading/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/cpu_offloading/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/optimizer/cpu_offloading/hybrid_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/pipeline_parallel/p2p_communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/pipeline_parallel/schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/pipeline_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/modelopt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/modelopt/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/modelopt/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/modelopt/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/modelopt/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/modelopt/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/post_training/modelopt/mamba/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/quantization/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/quantization/quant_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/quantization/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/mamba_context_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/mlp_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/ssm/triton_cache_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/tensor_parallel/cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/tensor_parallel/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/tensor_parallel/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/tensor_parallel/mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/tensor_parallel/random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/tensor_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/cuda_graphs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/dot_product_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/identity_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/multi_token_prediction.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/pipeline_parallel_layer_layout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/spec_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/torch_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/torch_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/custom_layers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/custom_layers/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/heterogeneous/heterogeneous_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/heterogeneous/linear_replacements.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/fused_a2a.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/core/transformer/moe/upcycling_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/endpoints/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/endpoints/completions.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/static/index.html
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/beam_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/forward_step.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/mcore_engine_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/sampling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/inference/text_generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/indexer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/autoaugment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/biencoder_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/data_samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/ict_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/image_folder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/orqa_wiki_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/realm_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/realm_index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/data/vit_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/fp16_deprecated/loss_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/fused_kernels/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/fused_kernels/compat.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/fused_kernels/type_shim.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/fused_kernels/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/fused_kernels/tests/test_fused_kernels.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/biencoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/multiple_choice.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/realm_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/esvit_swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/inpainting.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/knn_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/mit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/model/vision/vit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/mpu/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/mpu/tests/commons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/mpu/tests/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/mpu/tests/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/mpu/tests/test_initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/mpu/tests/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/legacy/mpu/tests/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/generate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/loss_func.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/model_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/non_loss_data_func.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/algos/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/algos/distillation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/post_training/docs/distillation.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/activations.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/dist_signal_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/ft_integration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/inprocess_restart.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/log_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/one_logger_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/theoretical_memory_usage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/wandb_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/yaml_arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/datasets/sft_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/tokenizer/bert_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/tokenizer/gpt2_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/tokenizer/multimodal_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/tokenizer/sft_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/megatron/training/tokenizer/tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/patches/nemo_2.3.0_te.patch
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/data_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/ensemble_classifier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/glue/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/glue/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/glue/mnli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/glue/qqp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/msdp/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/msdp/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/msdp/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/msdp/preprocessing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/msdp/prompt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/evaluate_orqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/evaluate_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/supervised/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/supervised/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/supervised/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/unsupervised/nq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/unsupervised/qa_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/orqa/unsupervised/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/quantize/calibrate_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/race/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/race/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/classification/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/classification/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/cityscapes.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/finetune_segformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/finetune_setr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/seg_heads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/seg_models.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/transforms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/vision/segmentation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/zeroshot_gpt/datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/zeroshot_gpt/detokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tasks/zeroshot_gpt/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/python_test_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/python_test_utils/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/python_test_utils/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/python_test_utils/get_test_results_from_tensorboard_logs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/python_test_utils/test_inference_regular_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/python_test_utils/test_pretraining_regular_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/python_test_utils/test_pretraining_resume_checkpoint_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/shell_test_utils/_run_training.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/shell_test_utils/run_ci_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/shell_test_utils/start_interactive_job.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_frozen_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_mr_mcore_tp2_pp2_resume_torch_dist_local_spec_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.10.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.11.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.12.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.13.0_dgx_h100_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_release/golden_values_0.9.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/bert/bert_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/common/ckpt_converter/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/common/ckpt_converter/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt-nemo/bert-nemo_340m_mr_mbs2_gbs32_mcore_te_tp2_pp2_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt-nemo/gemma2-nemo_2b_mr_mbs1_gbs8_mcore_te_tp4_pp1_cp1_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt-nemo/llama3-nemo_8b_mr_mbs1_gbs8_mcore_te_8experts_tp2_ep2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt-nemo/llama3-nemo_8b_mr_mbs4_gbs64_mcore_te_tp1_pp1_cp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt-nemo/mixtral-nemo_8x7b_mr_mbs1_gbs8_mcore_te_tp2_pp1_ep2_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt-nemo/t5-nemo_220m_mr_mbs4_gbs64_te_tp1_pp1_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.10.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.11.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.12.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.13.0_dgx_h100_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.8.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/golden_values_0.9.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/golden_values_0.11.0_PyT24.10_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/golden_values_0.11.0_PyT25.01_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/golden_values_0.12.0_PyT25.03_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_15b_8t_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_fsdp2_resume_torch_dist_te/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_fp16/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_b200_1N8G_mcore_tp2_pp2_current_scaling_native_fp8_tp_pp_sp_tp_overlap/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_b200_1N8G_mcore_tp2_pp2_current_scaling_native_fp8_tp_pp_sp_tp_overlap/tp_comm_overlap_cfg.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_b200_1N8G_mcore_tp4_cp2_current_scaling_native_fp8_tp_fsdp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_b200_1N8G_mcore_tp4_cp2_current_scaling_native_fp8_tp_sp_cp_tp_overlap/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_b200_1N8G_mcore_tp4_cp2_mxfp8_tp_sp_cp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_b200_1N8G_mcore_tp4_cp2_native_fp8_tp_sp_cp_tp_overlap/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_nondet_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_bf16_baseline/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp1_fp8_no_model_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp1_pp2_fp8_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_current_scaling_native_fp8_tp_pp_sp_tp_overlap/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_current_scaling_native_fp8_tp_pp_sp_tp_overlap/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_current_scaling_native_fp8_tp_pp_sp_tp_overlap/tp_comm_overlap_cfg.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp2_pp2_native_fp8_tp_pp_sp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_cp2_current_scaling_native_fp8_tp_fsdp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_cp2_current_scaling_native_fp8_tp_sp_cp_tp_overlap/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_cp2_current_scaling_native_fp8_tp_sp_cp_tp_overlap/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_cp2_native_fp8_tp_sp_cp_tp_overlap/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_cp2_native_fp8_tp_sp_cp_tp_overlap/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_345m_weekly_dgx_h100_1N8G_mcore_tp4_pp2_fp8_tp_pp/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp1_pp4_memory_speed/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp1_pp4_memory_speed/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp1_pp4_memory_speed/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_7b_mr_dgx_a100_1N8G_tp4_pp1_memory_speed/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_frozen_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_frozen_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_frozen_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_frozen_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_resume_torch_dist_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_cp4_a2a_p2p_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_frozen_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_frozen_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_frozen_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_frozen_resume_torch_dist_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_persistent_ckpt_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_persistent_disable_bias_linear_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_resume_torch_dist_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_overlap_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_decoupled_lr_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_resume_torch_dist_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_tunable_overlap_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp1_uneven_pipeline_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp1_pp4_vp2_account_for_embedding_loss_in_pipeline_split_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_fsdp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_multi_dist_optimizer_instances_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_multi_dist_optimizer_instances_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_calculate_per_token_loss_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_calculate_per_token_loss_nondeterministic_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_etp4_nondeterministic_dp_last_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_mla_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_mla_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_mla_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cp2_nondeterministic_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_cross_entropy_loss_fusion_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_defer_embedding_wgrad_compute_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_create_attention_mask_in_dataloader_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_no_mmap_bin_files_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_pp2_resume_torch_dist_reshard_1x4xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp1_resume_torch_dist_qk_layernorm_test_mode_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_frozen_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_te_tp4_pp2_resume_torch_dist_reshard_8x1xNone_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_resume_torch_dist_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_mr_mcore_tp2_pp2_uninstall_te_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt3_nightly_mcore_te_tp2_pp1_modelopt_distill_resume/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt_inference_tp1_pp1_583m_logitsmatch/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt_inference_tp1_pp1_583m_logitsmatch/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/gpt/gpt_inference_tp1_pp1_583m_logitsmatch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_inference_tp1_pp1_2B_logitsmatch/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_inference_tp1_pp1_2B_logitsmatch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp1_pp1_cp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp1_pp1_cp1_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp1_pp1_cp1_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp1_pp1_cp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp1_pp4_cp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp1_pp4_cp1_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp1_pp4_cp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp1_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp1_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp4_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp4_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp4_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/hybrid/hybrid_mr_mcore_te_tp2_pp1_cp4_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.10.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.12.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/golden_values_0.9.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x22b_tp2pp8ep8vpp1_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.10.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.11.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.11.0_patch_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.12.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.8.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/golden_values_0.9.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_alltoall_tp2pp4ep4_release_sm/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.10.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.11.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.12.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/golden_values_0.9.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/mixtral/mixtral_8x7b_tp1pp4ep8vpp8_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_cp2_pp2_ep2_te_4experts2parallel_nondeterministic_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel_dp_last/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel_dp_last/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_cp2_pp2_ep2_te_4experts2parallel_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_etp2_te_4experts2parallel_dp_last/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_resume_torch_dist_te_4experts2parallel/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_resume_torch_dist_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_ep2_te_4experts2parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_2experts/golden_values_dev.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_2experts/golden_values_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_2experts/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mcore_te_tp1_pp1_ep8_etp1_cp_memory_speed/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mcore_te_tp1_pp1_ep8_etp1_cp_memory_speed/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_ep8_resume_torch_dist_dist_optimizer/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_ep8_resume_torch_dist_dist_optimizer/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_ep8_resume_torch_dist_dist_optimizer/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_ep8_resume_torch_dist_dist_optimizer/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_tp4_ep2_etp2_pp2_resume_torch_dist_dist_optimizer/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_tp4_ep2_etp2_pp2_resume_torch_dist_dist_optimizer/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_tp4_ep2_etp2_pp2_resume_torch_dist_dist_optimizer/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_moe_mr_mcore_te_tp4_ep2_etp2_pp2_resume_torch_dist_dist_optimizer/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp1_pp2_resume_torch_dist_reshard_2x1x4_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_frozen_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_multi_dist_optimizer_instances_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_multi_dist_optimizer_instances_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_ddp_average_in_collective_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_pp1_te_8experts_etp1_ep4_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt3_mr_mcore_te_tp2_zp_z3_resume_torch_dist_te_8experts2parallel_top2router_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt_inference_tp1_pp1_ep1_16B_logitsmatch/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/moe/gpt_inference_tp1_pp1_ep1_16B_logitsmatch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_sp_cp2_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_sp_cp2_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_sp_cp2_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/multimodal-llava/multimodal_llava_mr_mcore_te_tp4_sp_cp2_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_11b_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_11b_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_11b_mr_mcore_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_te_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_mr_mcore_tp4_pp1_resume_torch_dist_dgx_a100_1N8G/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_vp1_resume_torch/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_dev_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_dev_dgx_h100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_nightly_dgx_a100_1N8G_mcore_tp2_pp1_vp1/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_220m_weekly_dgx_a100_1N8G_mcore_te_tp2_pp1_vp1_sequence_parallel/golden_values_lts_dgx_a100.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.10.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.11.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.12.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_release/golden_values_0.9.0_dgx_a100_lts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/functional_tests/test_cases/t5/t5_release/model_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/auto_reminder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/check_status_of_main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/dashboard.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/download_coverage_results.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/download_golden_values.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/generate_jet_trigger_job.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/generate_local_jobs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/launch_jet_workload.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/notify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/python_scripts/wait_for_resources.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/_build-mcore-dev.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/_build-mcore-lts.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/_build-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/common.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/gpt-inference.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/gpt-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/mamba-inference.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/mamba.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/moe-inference.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/moe.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/multimodal-llava.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/test_utils/recipes/unit-tests.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/run_ci_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_basic.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_fp8_param.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_imports.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_local_multi_tensor_fns.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_model_configs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_optimizer_cpu_offloading.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_process_groups_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_utilities.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/a2a_overlap/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/data/test_bin_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/data/test_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/data/test_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/data/test_multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/data/test_preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/data/test_preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_async_save.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_flattened_resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_global_metadata_reuse.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_local.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_msc.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_nonpersistent.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_pipeline_parallel_layout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_replication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_strict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/test_torch_dist.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/test_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/test_mlp_glu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/test_moe_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/dist_checkpointing/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/distributed/test_distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/distributed/test_finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/distributed/test_grad_reduce_for_replicated_embedder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/distributed/test_grad_sync_with_expert_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/distributed/test_mcore_fully_sharded_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/distributed/test_param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/distributed/test_torch_fully_sharded_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/export/trtllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/export/trtllm/test_distributed_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/export/trtllm/test_single_device_fp8.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/export/trtllm/test_trtllm_distributed_gpu_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/export/trtllm/test_trtllm_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/export/trtllm/test_trtllm_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/export/trtllm/test_trtllm_single_device_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/fusions/test_bias_dropout_fusion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/fusions/test_mla_yarn_rope_apply.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/fusions/test_swiglu_fusion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/fusions/test_torch_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/test_common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/test_communication_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/test_flash_decode.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/test_inference_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/test_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/contexts/test_dynamic_context.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/engines/test_dynamic_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/engines/test_static_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/model_inference_wrappers/test_model_inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/model_inference_wrappers/gpt/test_gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/model_inference_wrappers/t5/test_t5_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/text_generation_controllers/test_encoder_decoder_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/text_generation_controllers/test_simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/inference/text_generation_controllers/test_vlm_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_base_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_gpt_model_quantization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_heterogeneous_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_mimo_audio_submodules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_mimo_embedding_alignment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_mimo_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_mimo_submodules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_radio_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/pipeline_parallel/test_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/pipeline_parallel/test_pipeline_layout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/pipeline_parallel/test_schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/post_training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/post_training/test_modelopt_module_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/ssm/test_mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/ssm/test_mamba_context_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/ssm/test_mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/ssm/test_mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/ssm/test_mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/test_initialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/test_mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/tensor_parallel/test_tensor_parallel_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_attention_no_rope.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_attention_packed_seq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_core_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_cuda_graphs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_multi_token_prediction.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_quantization_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_relative_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_retro_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_rope.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_spec_customization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_submodule_callables.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_transformer_block_custom_pgs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_aux_loss.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_moe_layer_discrepancy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_multihot_indices_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_routers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tests/unit_tests/transformer/moe/test_upcycling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/autoformat.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/copyright.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/linter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/merge_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/preprocess_data_nmt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/run_inference_performance_test.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/run_mamba_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/run_mamba_text_generation_server_completions.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/run_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/run_vlm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/text_generation_cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/wait_daemon.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/bert_embedding/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/bert_embedding/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/bert_embedding/embed.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/bert_embedding/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/bert_embedding/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/convert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/hybrid_conversion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/loader_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/loader_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/loader_legacy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/loader_llama_mistral.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/loader_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/loader_mixtral_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/saver_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/saver_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/saver_hf_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/saver_legacy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/saver_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/schema_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/schema_core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/schema_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/checkpoint/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/build_db.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/config_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/cli/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/cli/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/cli/cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/docker/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/sft/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/sft/dataset_conv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/sft/open_inst.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/sft/sft_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/sft/sft_retro_lm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/text_generation/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/text_generation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/text_generation/retro_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/text_generation/retro_generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/text_generation/retro_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/Megatron-LM-250624/tools/retro/text_generation/retro_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/.coveragerc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/CODEOWNERS
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/CONTRIBUTING.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/Dockerfile.ci
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/Dockerfile.linting
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/MANIFEST.in
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/jet-tests.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_bert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_ict.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_mamba.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_t5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_vision_classify.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_vision_dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_vision_inpaint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pretrain_vlm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/pyproject.toml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/.github/ISSUE_TEMPLATE/bug.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/.github/ISSUE_TEMPLATE/enhancement.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/.github/ISSUE_TEMPLATE/question.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/.github/ISSUE_TEMPLATE/regression.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/.github/workflows/stale.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/llama_mistral.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/distrib_optimizer.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/context_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/datasets.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/dist_checkpointing.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/dist_checkpointing.strategies.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/distributed.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/fusions.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/models.bert.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/models.gpt.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/models.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/models.t5.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/moe.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/num_microbatches_calculator.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/pipeline_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/tensor_parallel.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/api-guide/transformer.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/images/context_parallel/CP_overview.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/images/context_parallel/CP_results.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/images/distrib_optimizer/data_flow.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/images/distrib_optimizer/sharding_scheme.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/docs/source/user-guide/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/run_simple_mcore_train_loop.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/finetune_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/finetune_gpt_distributed-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/generate-1.3b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/generate_samples_gpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/perspective_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/annotations/filter-selfgeneration.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/annotations/perspective_api_annotate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/annotations/preprocess.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/detxoify_lm/self_generation/selfgenerate-1.3b-unconditional.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/msdp/data_processing.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/msdp/eval_knwl_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/msdp/eval_resp_generation.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/msdp/prep_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/msdp/prompt_knwl_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/msdp/prompt_resp_gen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/CONFIG.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/SBATCH.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/SRUN.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_11.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_12.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_13.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_14.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_15.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_16.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_17.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_figure_18.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/academic_paper_scripts/sc21/run_table_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/bert/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/bert/train_bert_340m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/gpt3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/gpt3/gpt_config.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/gpt3/train_gpt3_175b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/run_text_generation_server_345M.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/run_text_generation_server_345M_8_tensor_parallel.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/gpt/simple_gpt_batch_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/quantization/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/quantization/ptq_trtllm_llama_7b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/quantization/ptq_trtllm_nemotron3_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/quantization/text_generation_ptq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/inference/quantization/trtllm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/mamba/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/mamba/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/mamba/run_text_gen_server_8b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/mamba/run_text_gen_server_8b_gpt3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/mamba/train.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/mixtral/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/mixtral/train_mixtral_8x7b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/clip_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/combine_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/combine_state_dicts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/convert_llava_pretrain_to_wds.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/dataloader_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/dataset_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/evaluate_coco.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/evaluate_mmmu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/evaluate_textvqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/evaluate_vqav2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/manual_prompts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/pretrain_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/pretrain_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/run_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/sft_dataset.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/sft_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/text_generation_mistral_clip.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/train.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/multimodal/assets/pretrain_curves.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/retro/preprocess_data.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/retro/train_retro_2b_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/t5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/t5/t5_mcore_train_curve.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/examples/t5/train_t5_220m_distributed.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/images/model_table.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/images/strong_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/images/weak_scaling.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/QuickStart.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/README_STRAGGLER.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/jit.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/model_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/package_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/packed_seq_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/timers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/bert_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/blended_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/blended_megatron_dataset_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/blended_megatron_dataset_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/helpers.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/indexed_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/masked_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/megatron_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/megatron_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/readme.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/t5_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/utils_s3.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/config/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/config/bert_embedders.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/config/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/config/gpt_chunk_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/config/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/db/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/db/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/db/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/db/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/build.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/factory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/validate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/indexes/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/indexes/faiss_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/index/indexes/faiss_par_add.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/query/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/query/gpt_chunk_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/query/multi_split_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/query/query.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/query/retro_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/datasets/retro/query/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/core.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/dict_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/validation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/filesystem_async.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/state_dict_saver.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/tensorstore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/torch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/two_stage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/dist_checkpointing/strategies/zarr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/distributed/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/distributed/distributed_data_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/distributed/distributed_data_parallel_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/distributed/finalize_model_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/distributed/param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/fused_bias_dropout.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/fused_bias_geglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/fused_bias_swiglu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/fused_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/fusions/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/communication_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/inference_request.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/ammo_support/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/ammo_support/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/ammo_support/gpt/model_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/ammo_support/gpt/state_dict_hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/engines/abstract_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/engines/mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/model_inference_wrappers/abstract_model_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/model_inference_wrappers/inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/model_inference_wrappers/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/model_inference_wrappers/gpt/gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/inference/text_generation_controllers/simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/T5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/T5/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/T5/t5_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/bert/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/bert/bert_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/bert/bert_lm_head.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/bert/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/bert/pooler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/embeddings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/embeddings/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/embeddings/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/language_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/language_module/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/vision_module/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/common/vision_module/vision_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/gpt/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/gpt/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/mamba/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/mamba/mamba_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/mamba/mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/multimodal/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/multimodal/llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/multimodal/llava_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/base_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/decoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/decoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/encoder_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/encoder_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/retro/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/vision/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/models/vision/vit_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/clip_grads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/grad_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/offload_chained_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/offload_distrib_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/optimizer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/chunk/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/chunk/chunk.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/chunk/manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/cpu_adam.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/hybrid_adam.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/kernel_loader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/nvme_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/cpu_adam.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/cpu_adam.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/cpu_adam_arm.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/cpu_adam_arm.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/optimizer.cpp
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/cuda/micros.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/cuda/multi_tensor_adam_kernel.cu
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/optimizer/hybrid_adam/csrc/cuda/multi_tensor_apply.cuh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/pipeline_parallel/p2p_communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/pipeline_parallel/schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/ssm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/ssm/mamba_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/ssm/mamba_hybrid_layer_allocation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/ssm/mamba_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/ssm/mamba_mixer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/ssm/triton_cache_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/tensor_parallel/cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/tensor_parallel/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/tensor_parallel/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/tensor_parallel/mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/tensor_parallel/random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/tensor_parallel/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/dot_product_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/identity_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/spec_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/torch_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/custom_layers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/custom_layers/transformer_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/core/transformer/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/gpt/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/gpt/model_provider.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/static/index.html
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/beam_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/communication.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/forward_step.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/sampling.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/inference/text_generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/indexer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/autoaugment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/biencoder_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/data_samplers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/ict_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/image_folder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/orqa_wiki_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/realm_dataset_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/realm_index.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/data/vit_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/fp16_deprecated/loss_scaler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/fused_kernels/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/fused_kernels/compat.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/fused_kernels/type_shim.h
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/fused_kernels/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/fused_kernels/tests/test_fused_kernels.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/biencoder_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/fused_bias_gelu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/fused_layer_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/fused_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/multiple_choice.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/realm_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/dino.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/esvit_swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/inpainting.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/knn_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/mit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/swin_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/model/vision/vit_backbone.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/mpu/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/mpu/tests/commons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/mpu/tests/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/mpu/tests/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/mpu/tests/test_initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/mpu/tests/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/legacy/mpu/tests/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/activations.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/async_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/checkpointing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/dist_signal_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/log_handler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/one_logger_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/optimizer_param_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/theoretical_memory_usage.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/yaml_arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/memory_tracer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/memory_tracer/memory_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/memory_tracer/memory_stats.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/memory_tracer/memstats_collector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/memory_tracer/param_runtime_order.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/tokenizer/bert_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/tokenizer/gpt2_tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/megatron/training/tokenizer/tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/data_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/ensemble_classifier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/glue/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/glue/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/glue/mnli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/glue/qqp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/msdp/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/msdp/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/msdp/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/msdp/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/msdp/preprocessing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/msdp/prompt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/evaluate_orqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/evaluate_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/supervised/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/supervised/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/supervised/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/unsupervised/nq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/unsupervised/qa_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/orqa/unsupervised/tokenizers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/race/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/race/finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/classification/classification.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/classification/eval_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/cityscapes.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/finetune_segformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/finetune_setr.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/seg_heads.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/seg_models.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/transforms.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/vision/segmentation/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/zeroshot_gpt/datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/zeroshot_gpt/detokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tasks/zeroshot_gpt/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/MR-bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/MR-gpt-nemo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/MR-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/MR-multimodal.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/MR-t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/build-pyt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/local-generator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/nightly-bert.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/nightly-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/weekly-gpt.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/jet_recipes/weekly-t5.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/get_test_results_from_tensorboard_logs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/jet_test_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/multitest_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/test_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/test_fp8_ci_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/python_test_utils/test_resume_checkpoint_pipeline.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/shell_test_utils/_run_local_training.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/shell_test_utils/restart_jet_log_jobs.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/shell_test_utils/run_release_record.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_vp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_345m_nightly_dgx_a100_1N8G_tp1_pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_345m_nightly_dgx_a100_1N8G_tp4_pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_mr_mcore_tp2_pp2_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_mr_mcore_tp2_pp2_local_spec_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_mr_resume_tp1_pp2dgx_a100_1N8G_.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_mr_tp1_pp4_vp2_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/bert_mr_tp2_pp2_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp1_resume_torch_dist_dist_optimizer_overlap_grad_reduce_param_gather.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp2_resume_torch_dist.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp1_pp4_resume_torch_dist.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_2experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_resume_torch_dist_te_4experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_te_2experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp2_pp2_te_4experts2parallel.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_mcore_tp4_pp1_resume_torch_dist.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_dist_optimizer_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp1_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp2_resume_torch.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_resume_torch.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp1_pp4_vp1_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_4experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_4experts.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp2_pp2_resume_torch_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_overlap_grad_reduce.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_345m_nightly_dgx_a100_1N8G_tp4_pp1_resume_torch.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp1_dist_optimizer_no_mmap_bin_files_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp1_uniform_full_recompute_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp2_rope_embeddings_interleaved_no_fusion_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_disable_bias_linear_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_sequence_parallel_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_swiglu_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_untie_embeddings_and_outputs_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_vp1_calculate_per_token_loss_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_vp1_decoupled_lr_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_vp1_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp1_pp4_vp1_dist_optimizer_overlap_grad_reduce_untied_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp1_cp2_nondeterministic_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_dist_optimizer_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_groupedGEMM_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_overlap_grad_reduce_param_gather_groupedGEMM_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp1_te_8experts2parallel_top2router_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp2_cp2_nondeterministic_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp2_cross_entropy_loss_fusion_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp2_ddp_average_in_collective_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp2_defer_embedding_wgrad_compute_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp2_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp2_no_create_attention_mask_in_dataloader_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp2_pp2_no_mmap_bin_files_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp4_pp1_dist_optimizer_overlap_grad_reduce_param_gather_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_mcore_te_tp4_pp1_qk_layernorm_test_mode_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_resume_dgx_a100_1N8G_tp1_pp2.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_te_tp2_pp2_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_tp1_pp4_vp1_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/gpt3_mr_tp2_pp2_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/multimodal_llava_mr_mcore_te_tp1_pp1_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/multimodal_llava_mr_mcore_te_tp2_pp4_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_results/jet/t5_220m_mr_mcore_tp2_pp4_dgx_a100_1N8G.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_scripts/bert/pretrain_bert_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_scripts/gpt3/pretrain_gpt3_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_scripts/gpt3/pretrain_gpt3_nemo_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_scripts/multimodal/pretrain_llava_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_scripts/retro/pretrain_retro_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/functional_tests/test_scripts/t5/pretrain_t5_distributed_test.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_basic.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_imports.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_local_multi_tensor_fns.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_num_microbatches_calculator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_parallel_state.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_utilities.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/data/test_bin_reader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/data/test_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/data/test_gpt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/data/test_multimodal_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/data/test_preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/data/test_preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/conftest.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/test_async_save.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/test_cached_metadata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/test_flattened_resharding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/test_fully_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/test_mapping.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/test_optimizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/test_serialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/test_mlp_glu.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/test_retro_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/dist_checkpointing/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/distributed/test_param_and_grad_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/fusions/test_torch_softmax.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/test_common_inference_params.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/test_inference_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/test_modelopt_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/test_scheduler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/engines/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/engines/test_mcore_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/model_inference_wrappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/model_inference_wrappers/test_model_inference_wrapper_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/model_inference_wrappers/gpt/test_gpt_inference_wrapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/text_generation_controllers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/inference/text_generation_controllers/test_simple_text_generation_controller.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_base_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_bert_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_mamba_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/models/test_t5_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/pipeline_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/pipeline_parallel/test_schedules.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/test_cross_entropy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/test_initialization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/test_layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/test_mappings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/test_random.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/tensor_parallel/test_tensor_parallel_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_attention_packed_seq.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_core_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_retro_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_spec_customization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/test_transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/moe/test_a2a_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/moe/test_aux_loss.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/moe/test_grouped_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/moe/test_routers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/moe/test_sequential_mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tests/unit_tests/transformer/moe/test_token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/autoformat.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/linter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/merge_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/preprocess_data_nmt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/preprocess_mmdata.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/run_mamba_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/run_text_generation_server.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/run_vlm_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/text_generation_cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/bert_embedding/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/bert_embedding/dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/bert_embedding/embed.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/bert_embedding/external_libs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/bert_embedding/huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/convert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/hybrid_conversion.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/loader_llama_mistral.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/loader_mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/loader_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/loader_mixtral_hf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/saver_mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/saver_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/setter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/checkpoint/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/add_id.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/blacklist_urls.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/cleanup_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/cleanup_fix_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/filter_ngrams.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/find_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/group_duplicate_url.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/merge_jsons.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/openwebtext/remove_group_duplicates.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/build_db.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/config_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/cli/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/cli/__main__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/cli/cli.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/docker/Dockerfile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/sft/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/sft/dataset_conv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/sft/open_inst.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/sft/sft_retro.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/sft/sft_retro_lm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/text_generation/evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/text_generation/metrics.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/text_generation/retro_api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/text_generation/retro_generate.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/text_generation/retro_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/megatron/PAI-Megatron-LM-240718/tools/retro/text_generation/retro_text_generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/.pylintrc
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/LICENSE
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/README_CN.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/setup.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/.github/ISSUE_TEMPLATE/bug_report.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/.github/ISSUE_TEMPLATE/feature_request.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/.github/workflows/build.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/.github/workflows/pylint.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/.github/workflows/python-publish.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/.github/workflows/unit_test.yml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/entrypoint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/hooks.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/offline_ckpt_converter.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/base_algo.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/advantage_compute.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/loss_gallery.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/megatron_policy_trainer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/packing_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/policy_trainer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/trainer_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/vllm_policy_inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/megatron_utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/megatron_utils/policy_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/algorithm/grpo_utils/megatron_utils/train_helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/checkpoint/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/checkpoint/checkpoint_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/configs/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/configs/common.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/configs/megatron_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/data/data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/data/prompt_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/data/sampler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/data/data_preprocess/gsm8k.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/data/data_preprocess/math_lighteval.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/launcher/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/launcher/dlc_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/launcher/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/base_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/fsdp_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/megatron_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/torch_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/megatron/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/megatron/memory_manager/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/megatron/memory_manager/base_trainer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/megatron/memory_manager/inference.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/megatron/memory_manager/trainer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/patches/monkey_patch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/patches/transformers/qwen2_patch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/patches/transformers/qwen3_moe_patch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/patches/transformers/qwen3_patch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/reward/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/reward/rule_reward.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/vllm_0_8_5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/vllm_0_8_5/async_llm_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/vllm_0_8_5/llm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/vllm_0_8_5/llm_engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/vllm_0_8_5/logits_processor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/vllm_0_8_5/ray_distributed_executor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/models/vllm/hooks/vllm_0_8_5/worker_base.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/decorator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/dist_actor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/engine.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/environment.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/evaluator.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/executor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/model_flow.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/trainer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/runtime/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/schedule/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/schedule/metric_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/schedule/model_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/schedule/port_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/schedule/resource_manager.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/base_parameter_sync.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/comm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/parameter_sync.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/parameter_sync_fsdp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/structs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/mappers/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/mappers/mapper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/mappers/mapping_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/planners/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/synchronizer/planners/planner.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/tools/check_parameter_sync.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/communication_op.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/constant.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/error_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/flat_tensors.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/future.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/global_vars.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/log_monitor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/logger.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/megatron_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/parse_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/timer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/version.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/vllm_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/mappings/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/mappings/megatron_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/mappings/sharded_tensor_info.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/mappings/vllm_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/rule_reward_score/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/chatlearn/utils/rule_reward_score/math.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docker/torch/Dockerfile.torch2.3.0
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docker/torch/Dockerfile.torch2.5.1.vllm066
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docker/torch/Dockerfile.torch2.6.0.vllm085
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/requirements.txt
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/.readthedocs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/advanced.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/chatlearn.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/conf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/config_yaml.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/faq.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/installation.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/programming.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/api/config.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/api/engine.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/api/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/api/module.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/check_sync_parameter.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/continue_train.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/custom_model_flow.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/data.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/ems.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/evaluator.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/profile.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/run.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/tutorial_grpo_fsdp.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/tutorial_grpo_mcore.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/tutorial_llama2.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/en/tutorial/tutorial_qwen.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/arch.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/class.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/dlc_1.jpg
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/dlc_2.jpg
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/engine.jpg
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/engine_class.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/fault.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/logo.jpg
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/perf.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/rlhf.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/images/yaml.jpg
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/.readthedocs.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/Makefile
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/advanced.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/chatlearn.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/conf.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/config_yaml.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/faq.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/installation.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/programming.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/api/config.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/api/engine.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/api/index.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/api/module.rst
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/continue_train.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/custom_model_flow.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/data.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/ems.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/evaluator.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/profile.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/run.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/tutorial_grpo_fsdp.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/tutorial_grpo_mcore.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/tutorial_llama2.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/docs/zh/tutorial/tutorial_qwen.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/examples/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/examples/tests/barrier.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/examples/tests/benchmark_vllm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/examples/tests/benchmark_vllm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/base_env.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_fsdp_vllm_qwen3_235b_a22b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_fsdp_vllm_qwen3_30b_a3b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_fsdp_vllm_qwen3_8b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_mcore_vllm_deepseek_v3_671b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_mcore_vllm_moonlight_16b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_mcore_vllm_qwen3_235b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_mcore_vllm_qwen3_30b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/scripts/train_mcore_vllm_qwen3_8b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/template/grpo_fsdp.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/template/grpo_megatron.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/run_tests.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/test_main.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/base/test_exp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/base/test_multi_dataloader.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/base/test_send_recv.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/base.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/eval.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/exp1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/exp2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/grpo.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/model.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/o1.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/parameter_sync.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/rlhf.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/rlhf2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/rlhf_cpu.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/rlhf_eval.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/sprl.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/test_eval.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/configs/test_eval2.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/parameter_sync/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/parameter_sync/test_mapper_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_ckpt.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_grpo.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_indivisible_batchsz.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_model_flow.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_placement.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_placement_colocate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_relay_buffer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_rlhf_custom.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_rlhf_placement_colocate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/rlhf/test_rlhf_replica.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/unittests/test_flat_tensors.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/unittests/test_sampler.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/backends/rl/ChatLearn/tests/unittests/test_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/docker/chatlearn
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/docker/pai_megatron_patch
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/ds_train_huggingface_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/evaluate_huggingface_baichuan13b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/evaluate_megatron_baichuan13b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/finetune_huggingface_baichuan13b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/finetune_megatron_baichuan13b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/pretrain_megatron_baichuan13b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/run_ds_train_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/run_evaluate_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/run_evaluate_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/run_finetune_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/run_finetune_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan/run_pretrain_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/evaluate_huggingface_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/evaluate_megatron_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/generate_text_megatron_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/pretrain_megatron_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/run_evaluate_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/run_evaluate_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/run_pretrain_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/baichuan2/run_text_generation_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/evaluate_huggingface_bloom.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/evaluate_megatron_bloom.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/finetune_megatron_bloom.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/generate_text_bloom.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/pretrain_megatron_bloom.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/run_evaluate_huggingface_bloom.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/run_evaluate_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/run_finetune_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/run_pretrain_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/bloom/run_text_generation_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/chatglm/finetune_huggingface_chatglm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/chatglm/finetune_megatron_chatglm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/chatglm/pretrain_megatron_chatglm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/chatglm/run_finetune_huggingface_chatglm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/chatglm/run_finetune_megatron_chatglm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/chatglm/run_pretrain_megatron_chatglm.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/ds_train_huggingface_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/evaluate_huggingface_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/evaluate_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/finetune_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/generate_text_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/pretrain_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/run_ds_train_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/run_evaluate_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/run_evaluate_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/run_finetune_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/run_finetune_megatron_llama_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/codellama/run_text_generation_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek/run_evaluate_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek/run_finetune_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek/run_finetune_megatron_deepseek_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek/run_pretrain_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek/run_text_generation_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v2/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v2/pretrain_deepseek.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v2/run_mcore_deepseek.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v3/README_grpo.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v3/pretrain_deepseek.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v3/pretrain_deepseek_250624.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v3/run_mcore_deepseek.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v3/run_mcore_deepseek_250624.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepseek_v3/run_mcore_deepseek_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepspeed/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepspeed/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepspeed/ds_train_huggingface_finetune.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepspeed/run_ds_train_huggingface_finetune.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepspeed/text_generation_huggingface.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/deepspeed/text_generation_vllm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/evaluate_huggingface_falcon.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/evaluate_megatron_falcon.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/evaluate_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/finetune_huggingface_falcon.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/finetune_megatron_falcon.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/finetune_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/generate_text_megatron_falcon.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/generate_text_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/pretrain_megatron_falcon.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/pretrain_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_evaluate_huggingface_falcon.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_evaluate_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_evaluate_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_finetune_huggingface_falcon.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_finetune_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_finetune_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_pretrain_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_pretrain_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_text_generation_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/falcon/run_text_generation_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/evaluate_huggingface_galactica.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/evaluate_megatron_galactica.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/finetune_huggingface_galactica.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/finetune_megatron_galactica.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/pretrain_megatron_galactica.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/run_evaluate_huggingface_galactica.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/run_evaluate_megatron_galactica.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/run_finetune_huggingface_galactica.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/run_finetune_megatron_galactica.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/galactica/run_pretrain_megatron_galactica.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/glm130b/evaluate_megatron_glm130b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/glm130b/evaluate_sat_glm130b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/glm130b/pretrain_megatron_glm130b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/glm130b/run_evaluate_megatron_glm130b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/glm130b/run_evaluate_sat_glm130b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/glm130b/run_pretrain_megatron_glm130b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/gpt3/pretrain_megatron_gpt3.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/gpt3/run_pretrain_megatron_gpt3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/gpt3/run_pretrain_megatron_gpt3_enwiki.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/evaluate_huggingface_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/evaluate_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/finetune_huggingface_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/finetune_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/generate_text_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/pretrain_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/run_evaluate_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/run_evaluate_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/run_finetune_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/run_finetune_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama/run_text_generation_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/ds_train_huggingface_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/evaluate_huggingface_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/evaluate_huggingface_llama_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/evaluate_mcore_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/evaluate_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/finetune_mcore_llama_withGA.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/finetune_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/finetune_megatron_llama_withGA.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/generate_text_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/pretrain_mcore_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/pretrain_megatron_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_ds_train_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_evaluate_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_evaluate_mcore_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_evaluate_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_finetune_mcore_llama_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_finetune_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_finetune_megatron_llama_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_mcore_llama2_70b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_pretrain_mcore_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama2/run_text_generation_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/entry.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/mpi_run_pretrain_llama3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/pretrain_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/pretrain_llama_mcore070.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/run_finetune_mcore_llama_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/run_finetune_megatron_llama_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/run_pretrain_llama_70b.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/run_pretrain_mcore_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3_1/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3_1/pretrain_llama.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llama3_1/run_mcore_llama3_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava/finetune_megatron_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava/pretrain_megatron_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava/run_finetune_megatron_llava.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava/run_pretrain_megatron_llava.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava_mcore/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava_mcore/dataset_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava_mcore/image_processing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava_mcore/lm_loss.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava_mcore/pretrain_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/llava_mcore/run_mcore_llava.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/mistral/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/mistral/pretrain_mcore_mistral.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/mistral/run_mcore_mistral.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/moonlight/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/moonlight/README_grpo.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/moonlight/modeling_deepseek_pai.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/moonlight/run_mcore_moonlight.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/moonlight/run_mcore_moonlight_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/ds_train_huggingface_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/evaluate_huggingface_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/evaluate_megatron_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/evaluate_megatron_qwen_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/finetune_megatron_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/finetune_megatron_qwen_withGA.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/generate_text_megatron_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/lm_evaluate_megatron_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/pretrain_megatron_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/pretrain_megatron_qwen_upcycled.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_ds_train_huggingface_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_evaluate_huggingface_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_evaluate_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_evaluate_megatron_qwen_moe.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_finetune_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_finetune_megatron_qwen_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_lm_evaluate_huggingface_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_lm_evaluate_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_pretrain_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_pretrain_megatron_qwen_upcycled.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen/run_text_generation_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/evaluate_mcore_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/pretrain_mcore_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_evaluate_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_evaluate_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_finetune_mcore_qwen_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_finetune_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_finetune_megatron_qwen_withGA.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_pretrain_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_pretrain_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen1_5/run_text_generation_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2/README_moe.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2/pretrain_qwen2_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2/run_mcore_qwen2_moe.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_5/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_5/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_5_vl/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_5_vl/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_5_vl/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_vl/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_vl/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen2_vl/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/README_grpo.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/entrypoint.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3_235b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3_30b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3_8b_grpo.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen3/configs/grpo_megatron.yaml
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen_vl/finetune_megatron_qwen_vl.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwen_vl/run_finetune_megatron_qwen_vl.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwq/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/qwq/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/ds_train_huggingface_starcoder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/evaluate_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/finetune_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/generate_text_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/pretrain_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/run_ds_train_huggingface_starcoder.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/run_evaluate_megatron_starcoder.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/run_finetune_megatron_starcoder_wgbs.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/run_finetune_megatron_starcoder_wogbs.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/run_pretrain_megatron_starcoder.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/starcoder/run_text_generation_megatron_starcoder.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/yi/run_evaluate_megatron_yi.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/yi/run_finetune_megatron_yi.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/examples/yi/run_pretrain_megatron_yi.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/arguments.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/finetune_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/initialize.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/lm_evaluate.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/tensor_parallel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/training.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/data/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/data/dataset_helpers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/data/image_processing.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/data/json_sft.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/data/utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/data/energon/chatml.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/fixes/optimizer_offloading/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/fixes/optimizer_offloading/fix_optimizer_offloading.patch
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/fixes/yarn_args/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/fixes/yarn_args/fix_yarn_args.patch
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/generation/api.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/generation/generation.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/generation/gpt_predictor.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/generation/megatron.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/generation/tokenization.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan2/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan2/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan2/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/baichuan2/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/bloom/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/bloom/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/bloom/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/bloom/layers.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/bloom/positional_embeddings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/bloom/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/chatglm/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/chatglm/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/chatglm/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/chatglm/positional_embeddings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/chatglm/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/multi_latent_attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/moe/shared_experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon40b/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon40b/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon40b/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/falcon40b/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/galactica/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/galactica/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/galactica/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/galactica/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/glm130b/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/glm130b/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/glm130b/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/glm130b/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama/positional_embeddings.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama2/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama2/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama2/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama2/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama2/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer_legacy.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3_1/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3_1/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3_1/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3_1/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llama3_1/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava/clip_encoder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava/mm_projector_builder.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/llava_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/llava_spec.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/vit_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mistral/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mistral/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mistral/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mistral/modeling_attn_mask_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mistral/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mistral/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/rms_norm.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/experts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer/mlp.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/transformer_block.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/visionmodel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_moe/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_moe/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_moe/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/attention.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/attention_vision.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/language_model_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/language_module.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/rope_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/transformer_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/visionmodel.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe_module_specs.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe/router.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/visual.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/starcoder/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/starcoder/enums.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/starcoder/glu_activations.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/starcoder/gpt_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/starcoder/language_model.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/model/starcoder/transformer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/template/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/template/helper.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/tokenizer/icetk_glm130b_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/tokenizer/jiebabpe_tokenizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/tokenizer/tokenization_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/tokenizer/tokenization_qwen_vl.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/megatron_patch/tokenizer/tokenization_yi.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/auto_configurator/report_auto_config.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/auto_configurator/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/auto_configurator/run_auto_config.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/auto_configurator/run_estimate_memory_usage.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/convert.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/h2m_synchronizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/m2h_synchronizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/patch.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/h2m_synchronizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/m2h_synchronizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/synchronizer.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/deepseek_v3/run_32xH20.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/moonlight/run_2xH20.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/qwen2_5/run_8xH20.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/qwen3/run_8xH20.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/qwen3/run_A22B_16xH20.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/configuration_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/hf2te.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/model_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/te_model_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/configuration_baichuan.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/hf2te.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/hf2te_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/model_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/deepspeed_to_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/deepspeed_to_megatron_ori.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/model_convertor_huggingface_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/reward_model_convertor_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/reward_model_to_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/run_convert_deepspeed_to_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/run_convert_deepspeed_to_transformers.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/chatglm/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/chatglm/run_convert_huggingface_to_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/fp8_cast_bf16.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v2_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v2_moe_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon/configuration_RW.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon/model_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon40b/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon40b/configuration_RW.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon40b/model_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/galactica/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/galactica/run_convert_huggingface_to_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm/run_convert_transformers_to_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm130b/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm130b/merge_130b_ckpts.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm130b/run_convert_transformers_to_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_70b.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_convertor_llama3_1.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_llama3_1.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2megatron_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf_llama_moe/config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf_llama_moe/llama_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llava/hf2mcore_convertor_llava.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llava/hf2mcore_llava.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf2mcore.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf2mcore_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf2mcore_mixtral.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf_mistral_moe/config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/moonlight/hf2mcore_moonlight_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_gqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_mha.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_mha_to_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_to_moe_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_moe_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_vl.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_vl_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_dense_and_moe_gqa.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_moe.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_moe_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen3_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megablocks_qwen1.5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megablocks_qwen1.5_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megatron_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megatron_qwen1.0.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megatron_qwen1.5.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/starcoder/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/starcoder/model_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/utils/__init__.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/yi/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/yi/model_convertor.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/build_llava_frame_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/convert_custom_dataset_to_wds_chatml.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/convert_llava_pretrain_to_wds.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/dataset_preparation.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/replace_llava_image_key.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/clean_raw_text.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/convert_json_to_list.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/img.png
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/preprocess_data.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/preprocess_data_megatron.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/preprocess_wudao2.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/qwen_hf_preprocess_datasets.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_make_pretraining_dataset.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_make_pretraining_dataset_megatron.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_prepare_dataset.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_prepare_wudao.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/README.md
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/build_idxmap_sft_dataset.py
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/run_build_idxmap_sft_dataset.sh
pretrain/Pai-Megatron-Patch/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/sample_stats.py
pretrain/Pai-Megatron-Patch/docker/chatlearn
pretrain/Pai-Megatron-Patch/docker/pai_megatron_patch
pretrain/Pai-Megatron-Patch/examples/baichuan/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/examples/baichuan/ds_train_huggingface_baichuan.py
pretrain/Pai-Megatron-Patch/examples/baichuan/evaluate_huggingface_baichuan13b.py
pretrain/Pai-Megatron-Patch/examples/baichuan/evaluate_megatron_baichuan13b.py
pretrain/Pai-Megatron-Patch/examples/baichuan/finetune_huggingface_baichuan13b.py
pretrain/Pai-Megatron-Patch/examples/baichuan/finetune_megatron_baichuan13b.py
pretrain/Pai-Megatron-Patch/examples/baichuan/pretrain_megatron_baichuan13b.py
pretrain/Pai-Megatron-Patch/examples/baichuan/run_ds_train_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan/run_evaluate_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan/run_evaluate_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan/run_finetune_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan/run_finetune_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan/run_pretrain_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan2/evaluate_huggingface_baichuan.py
pretrain/Pai-Megatron-Patch/examples/baichuan2/evaluate_megatron_baichuan.py
pretrain/Pai-Megatron-Patch/examples/baichuan2/generate_text_megatron_baichuan.py
pretrain/Pai-Megatron-Patch/examples/baichuan2/pretrain_megatron_baichuan.py
pretrain/Pai-Megatron-Patch/examples/baichuan2/run_evaluate_huggingface_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan2/run_evaluate_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan2/run_pretrain_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/baichuan2/run_text_generation_megatron_baichuan.sh
pretrain/Pai-Megatron-Patch/examples/bloom/evaluate_huggingface_bloom.py
pretrain/Pai-Megatron-Patch/examples/bloom/evaluate_megatron_bloom.py
pretrain/Pai-Megatron-Patch/examples/bloom/finetune_megatron_bloom.py
pretrain/Pai-Megatron-Patch/examples/bloom/generate_text_bloom.py
pretrain/Pai-Megatron-Patch/examples/bloom/pretrain_megatron_bloom.py
pretrain/Pai-Megatron-Patch/examples/bloom/run_evaluate_huggingface_bloom.sh
pretrain/Pai-Megatron-Patch/examples/bloom/run_evaluate_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/examples/bloom/run_finetune_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/examples/bloom/run_pretrain_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/examples/bloom/run_text_generation_megatron_bloom.sh
pretrain/Pai-Megatron-Patch/examples/chatglm/finetune_huggingface_chatglm.py
pretrain/Pai-Megatron-Patch/examples/chatglm/finetune_megatron_chatglm.py
pretrain/Pai-Megatron-Patch/examples/chatglm/pretrain_megatron_chatglm.py
pretrain/Pai-Megatron-Patch/examples/chatglm/run_finetune_huggingface_chatglm.sh
pretrain/Pai-Megatron-Patch/examples/chatglm/run_finetune_megatron_chatglm.sh
pretrain/Pai-Megatron-Patch/examples/chatglm/run_pretrain_megatron_chatglm.sh
pretrain/Pai-Megatron-Patch/examples/codellama/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/examples/codellama/ds_train_huggingface_llama.py
pretrain/Pai-Megatron-Patch/examples/codellama/evaluate_huggingface_llama.py
pretrain/Pai-Megatron-Patch/examples/codellama/evaluate_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/codellama/finetune_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/codellama/generate_text_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/codellama/pretrain_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/codellama/run_ds_train_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/examples/codellama/run_evaluate_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/examples/codellama/run_evaluate_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/codellama/run_finetune_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/codellama/run_finetune_megatron_llama_withGA.sh
pretrain/Pai-Megatron-Patch/examples/codellama/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/codellama/run_text_generation_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/deepseek/run_evaluate_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/examples/deepseek/run_finetune_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/examples/deepseek/run_finetune_megatron_deepseek_withGA.sh
pretrain/Pai-Megatron-Patch/examples/deepseek/run_pretrain_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/examples/deepseek/run_text_generation_megatron_deepseek.sh
pretrain/Pai-Megatron-Patch/examples/deepseek_v2/README.md
pretrain/Pai-Megatron-Patch/examples/deepseek_v2/pretrain_deepseek.py
pretrain/Pai-Megatron-Patch/examples/deepseek_v2/run_mcore_deepseek.sh
pretrain/Pai-Megatron-Patch/examples/deepseek_v3/README.md
pretrain/Pai-Megatron-Patch/examples/deepseek_v3/README_grpo.md
pretrain/Pai-Megatron-Patch/examples/deepseek_v3/pretrain_deepseek.py
pretrain/Pai-Megatron-Patch/examples/deepseek_v3/pretrain_deepseek_250624.py
pretrain/Pai-Megatron-Patch/examples/deepseek_v3/run_mcore_deepseek.sh
pretrain/Pai-Megatron-Patch/examples/deepseek_v3/run_mcore_deepseek_250624.sh
pretrain/Pai-Megatron-Patch/examples/deepseek_v3/run_mcore_deepseek_grpo.sh
pretrain/Pai-Megatron-Patch/examples/deepspeed/README.md
pretrain/Pai-Megatron-Patch/examples/deepspeed/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/examples/deepspeed/ds_train_huggingface_finetune.py
pretrain/Pai-Megatron-Patch/examples/deepspeed/run_ds_train_huggingface_finetune.sh
pretrain/Pai-Megatron-Patch/examples/deepspeed/text_generation_huggingface.py
pretrain/Pai-Megatron-Patch/examples/deepspeed/text_generation_vllm.py
pretrain/Pai-Megatron-Patch/examples/falcon/evaluate_huggingface_falcon.py
pretrain/Pai-Megatron-Patch/examples/falcon/evaluate_megatron_falcon.py
pretrain/Pai-Megatron-Patch/examples/falcon/evaluate_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/examples/falcon/finetune_huggingface_falcon.py
pretrain/Pai-Megatron-Patch/examples/falcon/finetune_megatron_falcon.py
pretrain/Pai-Megatron-Patch/examples/falcon/finetune_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/examples/falcon/generate_text_megatron_falcon.py
pretrain/Pai-Megatron-Patch/examples/falcon/generate_text_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/examples/falcon/pretrain_megatron_falcon.py
pretrain/Pai-Megatron-Patch/examples/falcon/pretrain_megatron_falcon40b.py
pretrain/Pai-Megatron-Patch/examples/falcon/run_evaluate_huggingface_falcon.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_evaluate_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_evaluate_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_finetune_huggingface_falcon.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_finetune_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_finetune_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_pretrain_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_pretrain_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_text_generation_megatron_falcon.sh
pretrain/Pai-Megatron-Patch/examples/falcon/run_text_generation_megatron_falcon40b.sh
pretrain/Pai-Megatron-Patch/examples/galactica/evaluate_huggingface_galactica.py
pretrain/Pai-Megatron-Patch/examples/galactica/evaluate_megatron_galactica.py
pretrain/Pai-Megatron-Patch/examples/galactica/finetune_huggingface_galactica.py
pretrain/Pai-Megatron-Patch/examples/galactica/finetune_megatron_galactica.py
pretrain/Pai-Megatron-Patch/examples/galactica/pretrain_megatron_galactica.py
pretrain/Pai-Megatron-Patch/examples/galactica/run_evaluate_huggingface_galactica.sh
pretrain/Pai-Megatron-Patch/examples/galactica/run_evaluate_megatron_galactica.sh
pretrain/Pai-Megatron-Patch/examples/galactica/run_finetune_huggingface_galactica.sh
pretrain/Pai-Megatron-Patch/examples/galactica/run_finetune_megatron_galactica.sh
pretrain/Pai-Megatron-Patch/examples/galactica/run_pretrain_megatron_galactica.sh
pretrain/Pai-Megatron-Patch/examples/glm130b/evaluate_megatron_glm130b.py
pretrain/Pai-Megatron-Patch/examples/glm130b/evaluate_sat_glm130b.py
pretrain/Pai-Megatron-Patch/examples/glm130b/pretrain_megatron_glm130b.py
pretrain/Pai-Megatron-Patch/examples/glm130b/run_evaluate_megatron_glm130b.sh
pretrain/Pai-Megatron-Patch/examples/glm130b/run_evaluate_sat_glm130b.sh
pretrain/Pai-Megatron-Patch/examples/glm130b/run_pretrain_megatron_glm130b.sh
pretrain/Pai-Megatron-Patch/examples/gpt3/pretrain_megatron_gpt3.py
pretrain/Pai-Megatron-Patch/examples/gpt3/run_pretrain_megatron_gpt3.sh
pretrain/Pai-Megatron-Patch/examples/gpt3/run_pretrain_megatron_gpt3_enwiki.sh
pretrain/Pai-Megatron-Patch/examples/llama/evaluate_huggingface_llama.py
pretrain/Pai-Megatron-Patch/examples/llama/evaluate_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama/finetune_huggingface_llama.py
pretrain/Pai-Megatron-Patch/examples/llama/finetune_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama/generate_text_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama/pretrain_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama/run_evaluate_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama/run_evaluate_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama/run_finetune_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama/run_finetune_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama/run_text_generation_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/README.md
pretrain/Pai-Megatron-Patch/examples/llama2/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/examples/llama2/ds_train_huggingface_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/evaluate_huggingface_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/evaluate_huggingface_llama_moe.py
pretrain/Pai-Megatron-Patch/examples/llama2/evaluate_mcore_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/evaluate_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/finetune_mcore_llama_withGA.py
pretrain/Pai-Megatron-Patch/examples/llama2/finetune_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/finetune_megatron_llama_withGA.py
pretrain/Pai-Megatron-Patch/examples/llama2/generate_text_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/pretrain_mcore_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/pretrain_megatron_llama.py
pretrain/Pai-Megatron-Patch/examples/llama2/run_ds_train_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_evaluate_huggingface_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_evaluate_mcore_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_evaluate_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_finetune_mcore_llama_withGA.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_finetune_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_finetune_megatron_llama_withGA.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_mcore_llama2_70b.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_pretrain_mcore_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama2/run_text_generation_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama3/README.md
pretrain/Pai-Megatron-Patch/examples/llama3/entry.sh
pretrain/Pai-Megatron-Patch/examples/llama3/mpi_run_pretrain_llama3.sh
pretrain/Pai-Megatron-Patch/examples/llama3/pretrain_llama.py
pretrain/Pai-Megatron-Patch/examples/llama3/pretrain_llama_mcore070.py
pretrain/Pai-Megatron-Patch/examples/llama3/run_finetune_mcore_llama_withGA.sh
pretrain/Pai-Megatron-Patch/examples/llama3/run_finetune_megatron_llama_withGA.sh
pretrain/Pai-Megatron-Patch/examples/llama3/run_pretrain_llama_70b.sh
pretrain/Pai-Megatron-Patch/examples/llama3/run_pretrain_mcore_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama3/run_pretrain_megatron_llama.sh
pretrain/Pai-Megatron-Patch/examples/llama3_1/README.md
pretrain/Pai-Megatron-Patch/examples/llama3_1/pretrain_llama.py
pretrain/Pai-Megatron-Patch/examples/llama3_1/run_mcore_llama3_1.sh
pretrain/Pai-Megatron-Patch/examples/llava/finetune_megatron_llava.py
pretrain/Pai-Megatron-Patch/examples/llava/pretrain_megatron_llava.py
pretrain/Pai-Megatron-Patch/examples/llava/run_finetune_megatron_llava.sh
pretrain/Pai-Megatron-Patch/examples/llava/run_pretrain_megatron_llava.sh
pretrain/Pai-Megatron-Patch/examples/llava_mcore/README.md
pretrain/Pai-Megatron-Patch/examples/llava_mcore/dataset_helpers.py
pretrain/Pai-Megatron-Patch/examples/llava_mcore/image_processing.py
pretrain/Pai-Megatron-Patch/examples/llava_mcore/lm_loss.png
pretrain/Pai-Megatron-Patch/examples/llava_mcore/pretrain_llava.py
pretrain/Pai-Megatron-Patch/examples/llava_mcore/run_mcore_llava.sh
pretrain/Pai-Megatron-Patch/examples/mistral/README.md
pretrain/Pai-Megatron-Patch/examples/mistral/pretrain_mcore_mistral.py
pretrain/Pai-Megatron-Patch/examples/mistral/run_mcore_mistral.sh
pretrain/Pai-Megatron-Patch/examples/moonlight/README.md
pretrain/Pai-Megatron-Patch/examples/moonlight/README_grpo.md
pretrain/Pai-Megatron-Patch/examples/moonlight/modeling_deepseek_pai.py
pretrain/Pai-Megatron-Patch/examples/moonlight/run_mcore_moonlight.sh
pretrain/Pai-Megatron-Patch/examples/moonlight/run_mcore_moonlight_grpo.sh
pretrain/Pai-Megatron-Patch/examples/qwen/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/examples/qwen/ds_train_huggingface_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen/evaluate_huggingface_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen/evaluate_megatron_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen/evaluate_megatron_qwen_moe.py
pretrain/Pai-Megatron-Patch/examples/qwen/finetune_megatron_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen/finetune_megatron_qwen_withGA.py
pretrain/Pai-Megatron-Patch/examples/qwen/generate_text_megatron_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen/lm_evaluate_megatron_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen/pretrain_megatron_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen/pretrain_megatron_qwen_upcycled.py
pretrain/Pai-Megatron-Patch/examples/qwen/run_ds_train_huggingface_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_evaluate_huggingface_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_evaluate_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_evaluate_megatron_qwen_moe.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_finetune_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_finetune_megatron_qwen_withGA.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_lm_evaluate_huggingface_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_lm_evaluate_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_pretrain_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_pretrain_megatron_qwen_upcycled.sh
pretrain/Pai-Megatron-Patch/examples/qwen/run_text_generation_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/README.md
pretrain/Pai-Megatron-Patch/examples/qwen1_5/evaluate_mcore_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen1_5/pretrain_mcore_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_evaluate_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_evaluate_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_finetune_mcore_qwen_withGA.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_finetune_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_finetune_megatron_qwen_withGA.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_pretrain_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_pretrain_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen1_5/run_text_generation_megatron_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen2/README.md
pretrain/Pai-Megatron-Patch/examples/qwen2/README_moe.md
pretrain/Pai-Megatron-Patch/examples/qwen2/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen2/pretrain_qwen2_moe.py
pretrain/Pai-Megatron-Patch/examples/qwen2/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen2/run_mcore_qwen2_moe.sh
pretrain/Pai-Megatron-Patch/examples/qwen2_5/README.md
pretrain/Pai-Megatron-Patch/examples/qwen2_5/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen2_5_vl/README.md
pretrain/Pai-Megatron-Patch/examples/qwen2_5_vl/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen2_5_vl/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen2_vl/README.md
pretrain/Pai-Megatron-Patch/examples/qwen2_vl/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen2_vl/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/examples/qwen3/README.md
pretrain/Pai-Megatron-Patch/examples/qwen3/README_grpo.md
pretrain/Pai-Megatron-Patch/examples/qwen3/entrypoint.py
pretrain/Pai-Megatron-Patch/examples/qwen3/pretrain_qwen.py
pretrain/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3.sh
pretrain/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3_235b_grpo.sh
pretrain/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3_30b_grpo.sh
pretrain/Pai-Megatron-Patch/examples/qwen3/run_mcore_qwen3_8b_grpo.sh
pretrain/Pai-Megatron-Patch/examples/qwen3/configs/grpo_megatron.yaml
pretrain/Pai-Megatron-Patch/examples/qwen_vl/finetune_megatron_qwen_vl.py
pretrain/Pai-Megatron-Patch/examples/qwen_vl/run_finetune_megatron_qwen_vl.sh
pretrain/Pai-Megatron-Patch/examples/qwq/README.md
pretrain/Pai-Megatron-Patch/examples/qwq/run_mcore_qwen.sh
pretrain/Pai-Megatron-Patch/examples/starcoder/ds_config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/examples/starcoder/ds_train_huggingface_starcoder.py
pretrain/Pai-Megatron-Patch/examples/starcoder/evaluate_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/examples/starcoder/finetune_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/examples/starcoder/generate_text_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/examples/starcoder/pretrain_megatron_starcoder.py
pretrain/Pai-Megatron-Patch/examples/starcoder/run_ds_train_huggingface_starcoder.sh
pretrain/Pai-Megatron-Patch/examples/starcoder/run_evaluate_megatron_starcoder.sh
pretrain/Pai-Megatron-Patch/examples/starcoder/run_finetune_megatron_starcoder_wgbs.sh
pretrain/Pai-Megatron-Patch/examples/starcoder/run_finetune_megatron_starcoder_wogbs.sh
pretrain/Pai-Megatron-Patch/examples/starcoder/run_pretrain_megatron_starcoder.sh
pretrain/Pai-Megatron-Patch/examples/starcoder/run_text_generation_megatron_starcoder.sh
pretrain/Pai-Megatron-Patch/examples/yi/run_evaluate_megatron_yi.sh
pretrain/Pai-Megatron-Patch/examples/yi/run_finetune_megatron_yi.sh
pretrain/Pai-Megatron-Patch/examples/yi/run_pretrain_megatron_yi.sh
pretrain/Pai-Megatron-Patch/megatron_patch/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/arguments.py
pretrain/Pai-Megatron-Patch/megatron_patch/efficientllm_config.sh
pretrain/Pai-Megatron-Patch/megatron_patch/efficientllm_metrics.py
pretrain/Pai-Megatron-Patch/megatron_patch/finetune_utils.py
pretrain/Pai-Megatron-Patch/megatron_patch/initialize.py
pretrain/Pai-Megatron-Patch/megatron_patch/lm_evaluate.py
pretrain/Pai-Megatron-Patch/megatron_patch/tensor_parallel.py
pretrain/Pai-Megatron-Patch/megatron_patch/training.py
pretrain/Pai-Megatron-Patch/megatron_patch/data/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/data/dataset_helpers.py
pretrain/Pai-Megatron-Patch/megatron_patch/data/image_processing.py
pretrain/Pai-Megatron-Patch/megatron_patch/data/json_sft.py
pretrain/Pai-Megatron-Patch/megatron_patch/data/utils.py
pretrain/Pai-Megatron-Patch/megatron_patch/data/energon/chatml.py
pretrain/Pai-Megatron-Patch/megatron_patch/fixes/optimizer_offloading/README.md
pretrain/Pai-Megatron-Patch/megatron_patch/fixes/optimizer_offloading/fix_optimizer_offloading.patch
pretrain/Pai-Megatron-Patch/megatron_patch/fixes/yarn_args/README.md
pretrain/Pai-Megatron-Patch/megatron_patch/fixes/yarn_args/fix_yarn_args.patch
pretrain/Pai-Megatron-Patch/megatron_patch/generation/api.py
pretrain/Pai-Megatron-Patch/megatron_patch/generation/generation.py
pretrain/Pai-Megatron-Patch/megatron_patch/generation/gpt_predictor.py
pretrain/Pai-Megatron-Patch/megatron_patch/generation/megatron.md
pretrain/Pai-Megatron-Patch/megatron_patch/generation/tokenization.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan2/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan2/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan2/layers.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/baichuan2/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/bloom/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/bloom/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/bloom/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/bloom/layers.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/bloom/positional_embeddings.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/bloom/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/chatglm/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/chatglm/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/chatglm/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/chatglm/positional_embeddings.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/chatglm/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/mlp.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/multi_latent_attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/transformer_block.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/transformer_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/moe/experts.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/deepseek_v2/moe/shared_experts.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon40b/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon40b/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon40b/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/falcon40b/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/galactica/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/galactica/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/galactica/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/galactica/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/glm130b/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/glm130b/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/glm130b/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/glm130b/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama/positional_embeddings.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama2/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama2/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama2/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama2/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama2/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/rms_norm.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer_legacy.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer/attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3/transformer/mlp.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3_1/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3_1/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3_1/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3_1/rms_norm.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llama3_1/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava/clip_encoder.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava/mm_projector_builder.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/llava_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/llava_spec.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/clip_vit_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/multimodal_projector.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/llava_mcore/vision/vit_layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mistral/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mistral/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mistral/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mistral/modeling_attn_mask_utils.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mistral/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mistral/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/experts.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/router.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/transformer/attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral/transformer/mlp.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/experts.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/grouped_gemm_util.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/router.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/transformer/attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/mixtral_bak/transformer/mlp.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/experts.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/router.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/transformer/attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5/transformer/mlp.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen1_5_megablocks/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/positional_encodings.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/rms_norm.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer_block.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/experts.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/router.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/moe/token_dispatcher.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer/attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer/mla_attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer/mlp.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer/mqa_attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2/transformer/nsa_attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/transformer_block.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_5_vl/visionmodel.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_moe/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_moe/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_moe/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/attention.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/attention_vision.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/language_model_embedding.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/language_module.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/rope_utils.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/rotary_pos_embedding.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/transformer_config.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen2_vl/visionmodel.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/gpt_layer_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe_module_specs.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe/moe_layer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe/moe_utils.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen3_moe/moe/router.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/qwen_vl/visual.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/starcoder/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/starcoder/enums.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/starcoder/glu_activations.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/starcoder/gpt_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/starcoder/language_model.py
pretrain/Pai-Megatron-Patch/megatron_patch/model/starcoder/transformer.py
pretrain/Pai-Megatron-Patch/megatron_patch/template/README.md
pretrain/Pai-Megatron-Patch/megatron_patch/template/helper.py
pretrain/Pai-Megatron-Patch/megatron_patch/tokenizer/__init__.py
pretrain/Pai-Megatron-Patch/megatron_patch/tokenizer/icetk_glm130b_tokenizer.py
pretrain/Pai-Megatron-Patch/megatron_patch/tokenizer/jiebabpe_tokenizer.py
pretrain/Pai-Megatron-Patch/megatron_patch/tokenizer/tokenization_baichuan.py
pretrain/Pai-Megatron-Patch/megatron_patch/tokenizer/tokenization_qwen_vl.py
pretrain/Pai-Megatron-Patch/megatron_patch/tokenizer/tokenization_yi.py
pretrain/Pai-Megatron-Patch/scripts/DATASET_README.md
pretrain/Pai-Megatron-Patch/scripts/generate_efficientllm_configs.sh
pretrain/Pai-Megatron-Patch/scripts/prepare_fineweb_dataset.sh
pretrain/Pai-Megatron-Patch/scripts/run_efficientllm_benchmark.sh
pretrain/Pai-Megatron-Patch/scripts/test_efficientllm_variants.sh
pretrain/Pai-Megatron-Patch/toolkits/auto_configurator/report_auto_config.py
pretrain/Pai-Megatron-Patch/toolkits/auto_configurator/report_theoretical_memory.py
pretrain/Pai-Megatron-Patch/toolkits/auto_configurator/run_auto_config.sh
pretrain/Pai-Megatron-Patch/toolkits/auto_configurator/run_estimate_memory_usage.sh
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/README.md
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/convert.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/__init__.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/h2m_synchronizer.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/m2h_synchronizer.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/deepseek_v3/patch.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/__init__.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/h2m_synchronizer.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/m2h_synchronizer.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/impl/general/synchronizer.py
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/deepseek_v3/run_32xH20.sh
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/moonlight/run_2xH20.sh
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/qwen2_5/run_8xH20.sh
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/qwen3/run_8xH20.sh
pretrain/Pai-Megatron-Patch/toolkits/distributed_checkpoints_convertor/scripts/qwen3/run_A22B_16xH20.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/README.md
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/configuration_baichuan.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/hf2te.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/model_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan/te_model_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/configuration_baichuan.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/hf2te.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/hf2te_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/baichuan2/model_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/deepspeed_to_megatron.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/deepspeed_to_megatron_ori.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/model_convertor_huggingface_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/reward_model_convertor_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/reward_model_to_megatron.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/run_convert_deepspeed_to_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/bloom/run_convert_deepspeed_to_transformers.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/chatglm/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/chatglm/run_convert_huggingface_to_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/fp8_cast_bf16.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v2_moe.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v2_moe_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/deepseek/hf2mcore_deepseek_v3_moe_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon/configuration_RW.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon/model_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon40b/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon40b/configuration_RW.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/falcon40b/model_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/galactica/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/galactica/run_convert_huggingface_to_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm/run_convert_transformers_to_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm130b/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm130b/merge_130b_ckpts.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/glm130b/run_convert_transformers_to_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_70b.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_convertor_llama3_1.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2mcore_llama3_1.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2megatron.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf2megatron_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf_llama_moe/config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llama/hf_llama_moe/llama_moe.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llava/hf2mcore_convertor_llava.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/llava/hf2mcore_llava.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf2mcore.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf2mcore_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf2mcore_mixtral.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/mistral/hf_mistral_moe/config_TEMPLATE.json
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/moonlight/hf2mcore_moonlight_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_gqa.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_mha.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_mha_to_moe.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_dense_to_moe_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_moe.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen1.5_moe_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_vl.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2.5_vl_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_dense_and_moe_gqa.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_moe.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_moe_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen2_vl_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2mcore_qwen3_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megablocks_qwen1.5.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megablocks_qwen1.5_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megatron_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megatron_qwen1.0.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/qwen/hf2megatron_qwen1.5.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/starcoder/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/starcoder/model_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/utils/__init__.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/yi/checkpoint_reshaping_and_interoperability.py
pretrain/Pai-Megatron-Patch/toolkits/model_checkpoints_convertor/yi/model_convertor.sh
pretrain/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/build_llava_frame_dataset.py
pretrain/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/convert_custom_dataset_to_wds_chatml.py
pretrain/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/convert_llava_pretrain_to_wds.py
pretrain/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/dataset_preparation.md
pretrain/Pai-Megatron-Patch/toolkits/multimodal_data_preprocessing/replace_llava_image_key.py
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/README.md
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/clean_raw_text.py
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/convert_json_to_list.py
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/img.png
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/preprocess_data.py
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/preprocess_data_megatron.py
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/preprocess_wudao2.py
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/qwen_hf_preprocess_datasets.py
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_make_pretraining_dataset.sh
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_make_pretraining_dataset_megatron.sh
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_prepare_dataset.sh
pretrain/Pai-Megatron-Patch/toolkits/pretrain_data_preprocessing/run_prepare_wudao.sh
pretrain/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/README.md
pretrain/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/build_idxmap_sft_dataset.py
pretrain/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/run_build_idxmap_sft_dataset.sh
pretrain/Pai-Megatron-Patch/toolkits/sft_data_preprocessing/sample_stats.py
pretrain/RWKV-LM/CITATION.cff
pretrain/RWKV-LM/LICENSE
pretrain/RWKV-LM/README.md
pretrain/RWKV-LM/RWKV-chat.png
pretrain/RWKV-LM/RWKV-ctxlen.png
pretrain/RWKV-LM/RWKV-demo.png
pretrain/RWKV-LM/RWKV-eval.png
pretrain/RWKV-LM/RWKV-eval2.png
pretrain/RWKV-LM/RWKV-formula.png
pretrain/RWKV-LM/RWKV-loss.png
pretrain/RWKV-LM/RWKV-paper.png
pretrain/RWKV-LM/RWKV-time-w.png
pretrain/RWKV-LM/RWKV-v2-430M-Pile-LR.png
pretrain/RWKV-LM/RWKV-v2-430M-Pile.png
pretrain/RWKV-LM/RWKV-v2-RNN-run.png
pretrain/RWKV-LM/RWKV-v2-RNN.png
pretrain/RWKV-LM/RWKV-v3-1.5B-Pile.png
pretrain/RWKV-LM/RWKV-v3-plan.png
pretrain/RWKV-LM/RWKV-v4-1.5B-Pile.png
pretrain/RWKV-LM/RWKV-v5-benchmark-1.png
pretrain/RWKV-LM/RWKV-v5-minipile.png
pretrain/RWKV-LM/RWKV-v6.png
pretrain/RWKV-LM/RWKV-v7-loss.png
pretrain/RWKV-LM/RWKV-v7-niah.png
pretrain/RWKV-LM/RWKV-v7.png
pretrain/RWKV-LM/RWKV-vs-MHA.png
pretrain/RWKV-LM/rwkv-x060.png
pretrain/RWKV-LM/train_rwkv_fineweb.py
pretrain/RWKV-LM/.github/FUNDING.yml
pretrain/RWKV-LM/RWKV-v1/train.py
pretrain/RWKV-LM/RWKV-v1/src/__init__.py
pretrain/RWKV-LM/RWKV-v1/src/model.py
pretrain/RWKV-LM/RWKV-v1/src/trainer.py
pretrain/RWKV-LM/RWKV-v1/src/utils.py
pretrain/RWKV-LM/RWKV-v2-RNN/enwik8-vocab.json
pretrain/RWKV-LM/RWKV-v2-RNN/run.py
pretrain/RWKV-LM/RWKV-v2-RNN/train.py
pretrain/RWKV-LM/RWKV-v2-RNN/cuda/timex_cuda.cu
pretrain/RWKV-LM/RWKV-v2-RNN/cuda/timex_op.cpp
pretrain/RWKV-LM/RWKV-v2-RNN/src/model.py
pretrain/RWKV-LM/RWKV-v2-RNN/src/model_run.py
pretrain/RWKV-LM/RWKV-v2-RNN/src/trainer.py
pretrain/RWKV-LM/RWKV-v2-RNN/src/utils.py
pretrain/RWKV-LM/RWKV-v3/run.py
pretrain/RWKV-LM/RWKV-v3/train.py
pretrain/RWKV-LM/RWKV-v3/verify.py
pretrain/RWKV-LM/RWKV-v3/cuda/timex_cuda.cu
pretrain/RWKV-LM/RWKV-v3/cuda/timex_op.cpp
pretrain/RWKV-LM/RWKV-v3/src/model.py
pretrain/RWKV-LM/RWKV-v3/src/model_run.py
pretrain/RWKV-LM/RWKV-v3/src/trainer.py
pretrain/RWKV-LM/RWKV-v3/src/utils.py
pretrain/RWKV-LM/RWKV-v4/20B_tokenizer.json
pretrain/RWKV-LM/RWKV-v4/run.py
pretrain/RWKV-LM/RWKV-v4/train.py
pretrain/RWKV-LM/RWKV-v4/verify.py
pretrain/RWKV-LM/RWKV-v4/cuda/wkv_cuda.cu
pretrain/RWKV-LM/RWKV-v4/cuda/wkv_op.cpp
pretrain/RWKV-LM/RWKV-v4/src/binidx.py
pretrain/RWKV-LM/RWKV-v4/src/model.py
pretrain/RWKV-LM/RWKV-v4/src/model_run.py
pretrain/RWKV-LM/RWKV-v4/src/trainer.py
pretrain/RWKV-LM/RWKV-v4/src/utils.py
pretrain/RWKV-LM/RWKV-v4neo/20B_tokenizer.json
pretrain/RWKV-LM/RWKV-v4neo/chat.py
pretrain/RWKV-LM/RWKV-v4neo/img_demoAE.py
pretrain/RWKV-LM/RWKV-v4neo/run.py
pretrain/RWKV-LM/RWKV-v4neo/train.py
pretrain/RWKV-LM/RWKV-v4neo/verify.py
pretrain/RWKV-LM/RWKV-v4neo/cuda/wkv5_cuda.cu
pretrain/RWKV-LM/RWKV-v4neo/cuda/wkv5_op.cpp
pretrain/RWKV-LM/RWKV-v4neo/cuda/wkv_cuda.cu
pretrain/RWKV-LM/RWKV-v4neo/cuda/wkv_cuda_bf16.cu
pretrain/RWKV-LM/RWKV-v4neo/cuda/wkv_op.cpp
pretrain/RWKV-LM/RWKV-v4neo/cuda/wkv_op_bf16.cpp
pretrain/RWKV-LM/RWKV-v4neo/math_demo/run.py
pretrain/RWKV-LM/RWKV-v4neo/math_demo/rwkv-200.pth
pretrain/RWKV-LM/RWKV-v4neo/src/__init__.py
pretrain/RWKV-LM/RWKV-v4neo/src/binidx.py
pretrain/RWKV-LM/RWKV-v4neo/src/dataset.py
pretrain/RWKV-LM/RWKV-v4neo/src/model.py
pretrain/RWKV-LM/RWKV-v4neo/src/model_img.py
pretrain/RWKV-LM/RWKV-v4neo/src/model_run.py
pretrain/RWKV-LM/RWKV-v4neo/src/trainer.py
pretrain/RWKV-LM/RWKV-v4neo/src/utils.py
pretrain/RWKV-LM/RWKV-v5/compute_magic_prime.py
pretrain/RWKV-LM/RWKV-v5/demo-training-prepare-v7-pile.sh
pretrain/RWKV-LM/RWKV-v5/demo-training-prepare.sh
pretrain/RWKV-LM/RWKV-v5/demo-training-run-v7-pile.sh
pretrain/RWKV-LM/RWKV-v5/demo-training-run.sh
pretrain/RWKV-LM/RWKV-v5/demo.jsonl
pretrain/RWKV-LM/RWKV-v5/make_data.py
pretrain/RWKV-LM/RWKV-v5/requirements.txt
pretrain/RWKV-LM/RWKV-v5/rwkv_v6_demo.py
pretrain/RWKV-LM/RWKV-v5/train.py
pretrain/RWKV-LM/RWKV-v5/cuda/wkv5_cuda.cu
pretrain/RWKV-LM/RWKV-v5/cuda/wkv5_op.cpp
pretrain/RWKV-LM/RWKV-v5/cuda/wkv6_cuda.cu
pretrain/RWKV-LM/RWKV-v5/cuda/wkv6_op.cpp
pretrain/RWKV-LM/RWKV-v5/cuda/wkv6state_cuda.cu
pretrain/RWKV-LM/RWKV-v5/cuda/wkv6state_op.cpp
pretrain/RWKV-LM/RWKV-v5/cuda/wkv7_cuda.cu
pretrain/RWKV-LM/RWKV-v5/cuda/wkv7_op.cpp
pretrain/RWKV-LM/RWKV-v5/src/__init__.py
pretrain/RWKV-LM/RWKV-v5/src/binidx.py
pretrain/RWKV-LM/RWKV-v5/src/dataset.py
pretrain/RWKV-LM/RWKV-v5/src/model.py
pretrain/RWKV-LM/RWKV-v5/src/trainer.py
pretrain/RWKV-LM/RWKV-v5/src/utils.py
pretrain/RWKV-LM/RWKV-v5/tokenizer/__init__.py
pretrain/RWKV-LM/RWKV-v5/tokenizer/rwkv_tokenizer.py
pretrain/RWKV-LM/RWKV-v5/tokenizer/rwkv_vocab_v20230424.txt
pretrain/RWKV-LM/RWKV-v6/README.md
pretrain/RWKV-LM/RWKV-v7/README.md
pretrain/RWKV-LM/RWKV-v7/rwkv_mmlu_eval.py
pretrain/RWKV-LM/RWKV-v7/rwkv_v7_demo.py
pretrain/RWKV-LM/RWKV-v7/rwkv_v7_demo_fast.py
pretrain/RWKV-LM/RWKV-v7/rwkv_v7_demo_rnn.py
pretrain/RWKV-LM/RWKV-v7/rwkv_v7_numpy.py
pretrain/RWKV-LM/RWKV-v7/rwkv_v8_rc00_demo.py
pretrain/RWKV-LM/RWKV-v7/rwkv_v8_rc00_hybrid_demo.py
pretrain/RWKV-LM/RWKV-v7/rwkv_vocab_v20230424.txt
pretrain/RWKV-LM/RWKV-v7/cuda/wkv7.cu
pretrain/RWKV-LM/RWKV-v7/cuda/wkv7_op.cpp
pretrain/RWKV-LM/RWKV-v7/cuda/wkv7s.cu
pretrain/RWKV-LM/RWKV-v7/cuda/wkv7s_op.cpp
pretrain/RWKV-LM/RWKV-v7/misc/lambada_test.jsonl
pretrain/RWKV-LM/RWKV-v7/mmlu_dev_dataset/data-00000-of-00001.arrow
pretrain/RWKV-LM/RWKV-v7/mmlu_dev_dataset/dataset_info.json
pretrain/RWKV-LM/RWKV-v7/mmlu_dev_dataset/state.json
pretrain/RWKV-LM/RWKV-v7/mmlu_test_dataset/data-00000-of-00001.arrow
pretrain/RWKV-LM/RWKV-v7/mmlu_test_dataset/dataset_info.json
pretrain/RWKV-LM/RWKV-v7/mmlu_test_dataset/state.json
pretrain/RWKV-LM/RWKV-v7/train_temp/README.md
pretrain/RWKV-LM/RWKV-v7/train_temp/demo-training-prepare-v7-pile.sh
pretrain/RWKV-LM/RWKV-v7/train_temp/demo-training-prepare.sh
pretrain/RWKV-LM/RWKV-v7/train_temp/demo-training-run-v7-pile.sh
pretrain/RWKV-LM/RWKV-v7/train_temp/demo-training-run.sh
pretrain/RWKV-LM/RWKV-v7/train_temp/requirements.txt
pretrain/RWKV-LM/RWKV-v7/train_temp/train.py
pretrain/RWKV-LM/RWKV-v7/train_temp/cuda/wkv7_cuda.cu
pretrain/RWKV-LM/RWKV-v7/train_temp/cuda/wkv7_op.cpp
pretrain/RWKV-LM/RWKV-v7/train_temp/src/__init__.py
pretrain/RWKV-LM/RWKV-v7/train_temp/src/binidx.py
pretrain/RWKV-LM/RWKV-v7/train_temp/src/dataset.py
pretrain/RWKV-LM/RWKV-v7/train_temp/src/model.py
pretrain/RWKV-LM/RWKV-v7/train_temp/src/trainer.py
pretrain/RWKV-LM/Research/RWKV-6-MQAR.png
pretrain/RWKV-LM/Research/better_lr_schedule.png
pretrain/RWKV-LM/Research/rwkv7-g0-7.2b.md
pretrain/mamba/AUTHORS
pretrain/mamba/LICENSE
pretrain/mamba/MANIFEST.in
pretrain/mamba/README.md
pretrain/mamba/pyproject.toml
pretrain/mamba/setup.py
pretrain/mamba/train_mamba_fineweb.py
pretrain/mamba/usage.md
pretrain/mamba/.github/workflows/publish.yaml
pretrain/mamba/assets/selection.png
pretrain/mamba/assets/ssd_algorithm.png
pretrain/mamba/benchmarks/benchmark_generation_mamba_simple.py
pretrain/mamba/csrc/selective_scan/reverse_scan.cuh
pretrain/mamba/csrc/selective_scan/selective_scan.cpp
pretrain/mamba/csrc/selective_scan/selective_scan.h
pretrain/mamba/csrc/selective_scan/selective_scan_bwd_bf16_complex.cu
pretrain/mamba/csrc/selective_scan/selective_scan_bwd_bf16_real.cu
pretrain/mamba/csrc/selective_scan/selective_scan_bwd_fp16_complex.cu
pretrain/mamba/csrc/selective_scan/selective_scan_bwd_fp16_real.cu
pretrain/mamba/csrc/selective_scan/selective_scan_bwd_fp32_complex.cu
pretrain/mamba/csrc/selective_scan/selective_scan_bwd_fp32_real.cu
pretrain/mamba/csrc/selective_scan/selective_scan_bwd_kernel.cuh
pretrain/mamba/csrc/selective_scan/selective_scan_common.h
pretrain/mamba/csrc/selective_scan/selective_scan_fwd_bf16.cu
pretrain/mamba/csrc/selective_scan/selective_scan_fwd_fp16.cu
pretrain/mamba/csrc/selective_scan/selective_scan_fwd_fp32.cu
pretrain/mamba/csrc/selective_scan/selective_scan_fwd_kernel.cuh
pretrain/mamba/csrc/selective_scan/static_switch.h
pretrain/mamba/csrc/selective_scan/uninitialized_copy.cuh
pretrain/mamba/evals/lm_harness_eval.py
pretrain/mamba/mamba_ssm/__init__.py
pretrain/mamba/mamba_ssm/distributed/__init__.py
pretrain/mamba/mamba_ssm/distributed/distributed_utils.py
pretrain/mamba/mamba_ssm/distributed/tensor_parallel.py
pretrain/mamba/mamba_ssm/models/__init__.py
pretrain/mamba/mamba_ssm/models/config_mamba.py
pretrain/mamba/mamba_ssm/models/mixer_seq_simple.py
pretrain/mamba/mamba_ssm/modules/__init__.py
pretrain/mamba/mamba_ssm/modules/block.py
pretrain/mamba/mamba_ssm/modules/mamba2.py
pretrain/mamba/mamba_ssm/modules/mamba2_simple.py
pretrain/mamba/mamba_ssm/modules/mamba_simple.py
pretrain/mamba/mamba_ssm/modules/mha.py
pretrain/mamba/mamba_ssm/modules/mlp.py
pretrain/mamba/mamba_ssm/modules/ssd_minimal.py
pretrain/mamba/mamba_ssm/ops/__init__.py
pretrain/mamba/mamba_ssm/ops/selective_scan_interface.py
pretrain/mamba/mamba_ssm/ops/triton/__init__.py
pretrain/mamba/mamba_ssm/ops/triton/k_activations.py
pretrain/mamba/mamba_ssm/ops/triton/layer_norm.py
pretrain/mamba/mamba_ssm/ops/triton/layernorm_gated.py
pretrain/mamba/mamba_ssm/ops/triton/selective_state_update.py
pretrain/mamba/mamba_ssm/ops/triton/softplus.py
pretrain/mamba/mamba_ssm/ops/triton/ssd_bmm.py
pretrain/mamba/mamba_ssm/ops/triton/ssd_chunk_scan.py
pretrain/mamba/mamba_ssm/ops/triton/ssd_chunk_state.py
pretrain/mamba/mamba_ssm/ops/triton/ssd_combined.py
pretrain/mamba/mamba_ssm/ops/triton/ssd_state_passing.py
pretrain/mamba/mamba_ssm/utils/__init__.py
pretrain/mamba/mamba_ssm/utils/generation.py
pretrain/mamba/mamba_ssm/utils/hf.py
pretrain/mamba/mamba_ssm/utils/torch.py
pretrain/mamba/rocm_patch/rocm6_0.patch
pretrain/mamba/tests/test_generation.py
pretrain/mamba/tests/ops/test_selective_scan.py
pretrain/mamba/tests/ops/triton/test_layernorm_gated.py
pretrain/mamba/tests/ops/triton/test_selective_state_update.py
pretrain/mamba/tests/ops/triton/test_ssd.py
pretrain/pythia/CODEOWNERS
pretrain/pythia/LICENSE
pretrain/pythia/README.md
pretrain/pythia/requirements.txt
pretrain/pythia/train_pythia_fineweb.py
pretrain/pythia/case-studies/README.md
pretrain/pythia/case-studies/crowspairs_plots.ipynb
pretrain/pythia/case-studies/lambada_openai_plots.ipynb
pretrain/pythia/case-studies/rename_jsons.ipynb
pretrain/pythia/case-studies/winobias.ipynb
pretrain/pythia/case-studies/crowspair_plots/crows_pairs_english_gender_lesser_steps.pdf
pretrain/pythia/case-studies/crowspair_plots/crows_pairs_english_gender_more_steps.pdf
pretrain/pythia/case-studies/lambada_openai_plots/lambada_openai_400M_1.4B_vstack.pdf
pretrain/pythia/case-studies/lambada_openai_plots/lambada_openai_70M_6.9B_vstack.pdf
pretrain/pythia/case-studies/term_frequency/model.py
pretrain/pythia/case-studies/term_frequency/numerical_reasoning_arithmetic.py
pretrain/pythia/case-studies/term_frequency/numerical_reasoning_time_unit_conversion.py
pretrain/pythia/case-studies/term_frequency/run_freq_count.py
pretrain/pythia/case-studies/term_frequency/run_model_eval.py
pretrain/pythia/case-studies/term_frequency/task.py
pretrain/pythia/case-studies/term_frequency/term_frequency.py
pretrain/pythia/case-studies/winobias_plots/winobias_scale_final.pdf
pretrain/pythia/evals/README.md
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step67000_eval_results_01-21-2023-20-16-29.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step67500_eval_results_01-21-2023-20-16-06.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step68000_eval_results_01-21-2023-19-26-25.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step68500_eval_results_01-21-2023-19-26-16.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step69000_eval_results_01-21-2023-19-26-05.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step69500_eval_results_01-21-2023-19-26-16.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step70000_eval_results_01-21-2023-19-25-28.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step70500_eval_results_01-21-2023-19-25-08.json
pretrain/pythia/evals/bias-evals/intervention-1.3b-deduped-step71500_eval_results_01-21-2023-19-18-21.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step134000_eval_results_01-21-2023-21-04-18.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step135000_eval_results_01-21-2023-20-58-08.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step136000_eval_results_01-21-2023-21-00-16.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step137000_eval_results_01-21-2023-21-02-18.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step138000_eval_results_01-21-2023-21-41-10.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step139000_eval_results_01-21-2023-21-09-12.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step140000_eval_results_01-21-2023-21-41-21.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step141000_eval_results_01-21-2023-21-41-21.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step142000_eval_results_01-21-2023-21-41-26.json
pretrain/pythia/evals/bias-evals/intervention-19m-deduped-step143000_eval_results_01-21-2023-21-41-13.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step67000_eval_results_01-21-2023-22-12-15.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step67500_eval_results_01-21-2023-22-12-20.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step68000_eval_results_01-21-2023-22-12-17.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step68500_eval_results_01-21-2023-22-12-14.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step69000_eval_results_01-21-2023-22-12-07.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step69500_eval_results_01-21-2023-22-12-16.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step70000_eval_results_01-21-2023-22-12-18.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step70500_eval_results_01-21-2023-22-12-15.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step71000_eval_results_01-21-2023-22-12-13.json
pretrain/pythia/evals/bias-evals/intervention-350m-deduped-step71500_eval_results_01-21-2023-22-12-24.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step134000_eval_results_01-23-2023-01-11-15.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step135000_eval_results_01-23-2023-01-11-44.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step136000_eval_results_01-23-2023-01-11-38.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step137000_eval_results_01-23-2023-01-11-50.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step138000_eval_results_01-23-2023-01-11-57.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step139000_eval_results_01-23-2023-01-11-28.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step140000_eval_results_01-23-2023-01-12-18.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step141000_eval_results_01-23-2023-01-12-25.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step142000_eval_results_01-23-2023-01-12-19.json
pretrain/pythia/evals/bias-evals/intervention-6.9b-deduped-step143000_eval_results_01-23-2023-01-12-30.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step57000_eval_results_01-23-2023-14-05-01.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step57500_eval_results_01-23-2023-14-07-41.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step58000_eval_results_01-23-2023-14-08-21.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step58500_eval_results_01-23-2023-14-08-43.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step59000_eval_results_01-23-2023-14-08-44.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step59500_eval_results_01-23-2023-14-08-52.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step60000_eval_results_01-23-2023-14-09-23.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step60500_eval_results_01-23-2023-14-09-29.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step61000_eval_results_01-23-2023-14-09-17.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step61500_eval_results_01-23-2023-14-09-15.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step62000_eval_results_01-23-2023-14-09-28.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step62500_eval_results_01-23-2023-14-09-22.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step63000_eval_results_01-24-2023-03-58-04.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step63500_eval_results_01-23-2023-14-09-24.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step64000_eval_results_01-23-2023-14-09-21.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step64500_eval_results_01-23-2023-14-09-58.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step65000_eval_results_01-23-2023-14-10-27.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step65500_eval_results_01-23-2023-14-11-03.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step66000_eval_results_01-23-2023-14-10-58.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step66500_eval_results_01-23-2023-14-10-57.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step67000_eval_results_01-23-2023-14-11-34.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step67500_eval_results_01-23-2023-14-11-34.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step68000_eval_results_01-23-2023-14-11-34.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step68500_eval_results_01-23-2023-14-11-30.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step69000_eval_results_01-23-2023-14-11-28.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step69500_eval_results_01-23-2023-14-11-33.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step70000_eval_results_01-23-2023-14-11-30.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step70500_eval_results_01-23-2023-14-11-28.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step71000_eval_results_01-23-2023-14-11-57.json
pretrain/pythia/evals/bias-evals/long-intervention-1.3b-deduped-step71500_eval_results_01-23-2023-14-12-28.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step11500_eval_results_01-20-2023-14-41-42.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step1500_eval_results_01-20-2023-14-42-09.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step16500_eval_results_01-20-2023-14-44-09.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step21500_eval_results_01-20-2023-14-44-57.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step26500_eval_results_01-20-2023-14-44-19.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step31500_eval_results_01-20-2023-14-46-00.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step36500_eval_results_01-20-2023-14-46-48.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step41500_eval_results_01-20-2023-15-13-30.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step46500_eval_results_01-20-2023-14-49-13.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step51500_eval_results_01-20-2023-14-49-21.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step56500_eval_results_01-20-2023-14-50-08.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step61500_eval_results_01-20-2023-14-50-46.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step6500_eval_results_01-20-2023-14-41-33.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step66500_eval_results_01-20-2023-15-13-13.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step67000_eval_results_01-22-2023-09-14-16.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step67500_eval_results_01-22-2023-09-15-51.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step68000_eval_results_01-22-2023-09-17-24.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step68500_eval_results_01-22-2023-09-18-58.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step69000_eval_results_01-22-2023-09-20-33.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step69500_eval_results_01-22-2023-09-22-17.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step70000_eval_results_01-22-2023-09-23-52.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step70500_eval_results_01-22-2023-09-25-25.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step71000_eval_results_01-22-2023-12-36-26.json
pretrain/pythia/evals/bias-evals/pythia-1.3b-deduped-step71500_eval_results_01-20-2023-15-13-07.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step103000_eval_results_01-20-2023-15-59-23.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step113000_eval_results_01-20-2023-15-59-26.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step123000_eval_results_01-20-2023-16-00-05.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step13000_eval_results_01-20-2023-15-58-56.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step133000_eval_results_01-20-2023-16-00-20.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step143000_eval_results_01-20-2023-16-00-15.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step23000_eval_results_01-20-2023-15-59-07.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step3000_eval_results_01-20-2023-15-58-23.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step33000_eval_results_01-20-2023-15-59-05.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step43000_eval_results_01-20-2023-15-59-07.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step53000_eval_results_01-20-2023-15-59-19.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step63000_eval_results_01-20-2023-15-59-19.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step73000_eval_results_01-20-2023-15-59-19.json
pretrain/pythia/evals/bias-evals/pythia-19m-deduped-step83000_eval_results_01-20-2023-15-59-19.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step11500_eval_results_01-23-2023-01-36-34.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step1500_eval_results_01-23-2023-01-30-40.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step16500_eval_results_01-23-2023-01-39-10.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step21500_eval_results_01-23-2023-01-41-49.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step26500_eval_results_01-23-2023-01-44-30.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step31500_eval_results_01-23-2023-01-46-19.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step36500_eval_results_01-23-2023-01-47-16.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step41500_eval_results_01-23-2023-01-49-14.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step46500_eval_results_01-23-2023-01-50-02.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step51500_eval_results_01-23-2023-01-52-20.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step56500_eval_results_01-23-2023-01-52-40.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step61500_eval_results_01-23-2023-01-54-57.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step6500_eval_results_01-23-2023-01-33-51.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step66500_eval_results_01-25-2023-20-11-01.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step67000_eval_results_01-23-2023-09-54-19.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step67500_eval_results_01-23-2023-09-55-14.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step68000_eval_results_01-23-2023-09-56-08.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step68500_eval_results_01-23-2023-09-56-59.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step69000_eval_results_01-23-2023-09-57-50.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step69500_eval_results_01-23-2023-09-58-51.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step70000_eval_results_01-23-2023-09-59-40.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step70500_eval_results_01-23-2023-10-00-35.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step71000_eval_results_01-23-2023-10-01-26.json
pretrain/pythia/evals/bias-evals/pythia-350m-deduped-step71500_eval_results_01-25-2023-20-11-11.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step103000_eval_results_01-23-2023-01-15-10.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step113000_eval_results_01-23-2023-01-15-43.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step123000_eval_results_01-23-2023-03-18-29.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step13000_eval_results_01-23-2023-01-15-04.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step133000_eval_results_01-23-2023-01-15-52.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step143000_eval_results_01-23-2023-01-15-14.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step23000_eval_results_01-23-2023-01-14-52.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step3000_eval_results_01-23-2023-01-15-43.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step33000_eval_results_01-23-2023-01-15-34.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step43000_eval_results_01-23-2023-01-15-20.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step53000_eval_results_01-23-2023-01-15-38.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step63000_eval_results_01-23-2023-01-14-58.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step73000_eval_results_01-23-2023-01-15-21.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step83000_eval_results_01-23-2023-01-15-32.json
pretrain/pythia/evals/bias-evals/pythia-6.9b-deduped-step93000_eval_results_01-23-2023-01-15-03.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-21-59-54.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-19-49.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-20-32.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-30-32.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-33-31.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-33-57.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-45-41.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-49-36.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-22-56-30.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-23-02-48.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-15-2023-23-39-36.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-16-26.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-16-54.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-17-09.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-17-42.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-18-12.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-24-09.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-25-37.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-28-00.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-28-49.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-38-17.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-44-43.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-47-17.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_02-16-2023-00-59-29.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-30-10.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-30-51.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-31-39.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-32-20.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-33-38.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-33-46.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-34-01.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-34-05.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-34-33.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-34-36.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-35-16.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-38-49.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-39-24.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-42-39.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-42-50.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-03-47-40.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-04-12-22.json
pretrain/pythia/evals/bias-evals/winobias/1.4B/eval_results_03-11-2023-12-44-30.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-00-59-19.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-00-46.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-04-06.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-07-13.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-08-01.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-09-15.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-09-59.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-10-18.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-16-53.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-19-42.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-19-53.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-21-41.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-22-51.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-26-41.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-40-15.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-44-57.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-49-46.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-51-43.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-53-56.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-55-14.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-01-55-31.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-02-09-45.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-02-12-25.json
pretrain/pythia/evals/bias-evals/winobias/410M/eval_results_02-16-2023-02-20-05.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-30-50.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-33-32.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-35-54.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-37-24.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-37-48.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-39-29.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-39-38.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-01-57-32.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-02-14-15.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-03-32-04.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-03-33-17.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-03-41-48.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-03-45-19.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-04-15-01.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-04-17-41.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_02-16-2023-05-18-33.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-05-30-31.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-05-35-04.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-05-35-22.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-06-25-26.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-17-18-12.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-18-07-50.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-18-09-53.json
pretrain/pythia/evals/bias-evals/winobias/6.9B/eval_results_03-09-2023-21-17-07.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_114000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_115000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_116000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_117000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_118000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_119000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_120000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_121000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_122000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_123000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_124000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_125000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_126000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_127000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_128000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_129000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_130000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_131000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_132000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_133000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_134000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_135000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_136000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_137000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_138000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_139000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_140000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_141000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_142000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_21/1.4B/eval_results_1.4b-deduped-long_143000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_134000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_135000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_136000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_137000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_138000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_139000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_140000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_141000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_142000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/1.4B/eval_results_1.4b-deduped_143000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_134000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_135000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_136000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_137000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_138000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_139000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_140000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_141000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_142000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/410M/eval_results_410m-deduped_143000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_134000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_135000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_136000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_137000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_138000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_139000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_140000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_141000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_142000.json
pretrain/pythia/evals/bias-evals/winobias/intervene_7/6.9B/eval_results_6.9b-deduped_143000.json
pretrain/pythia/evals/bias-evals/winobias/winobias_plots/winobias_scale_final.pdf
pretrain/pythia/evals/bloom/bloom-1b1.json
pretrain/pythia/evals/bloom/bloom-1b7.json
pretrain/pythia/evals/bloom/bloom-3b.json
pretrain/pythia/evals/bloom/bloom-560m.json
pretrain/pythia/evals/bloom/bloom-7b1.json
pretrain/pythia/evals/csv/pythia-1.3b-deduped/term_frquency_all_shots.csv
pretrain/pythia/evals/csv/pythia-125m-deduped/term_frquency_all_shots.csv
pretrain/pythia/evals/csv/pythia-13b-deduped/term_frquency_all_shots.csv
pretrain/pythia/evals/csv/pythia-2.7b-deduped/term_frquency_all_shots.csv
pretrain/pythia/evals/csv/pythia-350m-deduped/term_frquency_all_shots.csv
pretrain/pythia/evals/csv/pythia-6.7b-deduped/term_frquency_all_shots.csv
pretrain/pythia/evals/csv/pythia-800m-deduped/term_frquency_all_shots.csv
pretrain/pythia/evals/opt/opt-1.3b.json
pretrain/pythia/evals/opt/opt-125m.json
pretrain/pythia/evals/opt/opt-13b.json
pretrain/pythia/evals/opt/opt-2.7b.json
pretrain/pythia/evals/opt/opt-30b.json
pretrain/pythia/evals/opt/opt-350m.json
pretrain/pythia/evals/opt/opt-6.7b.json
pretrain/pythia/evals/opt/opt-66b.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step11500_eval_results_12-30-2022-03-48-08.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step1500_eval_results_12-30-2022-03-48-08.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step16500_eval_results_12-30-2022-03-48-15.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step21500_eval_results_12-30-2022-03-51-53.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step26500_eval_results_12-30-2022-03-51-50.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step31500_eval_results_12-30-2022-03-51-46.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step36500_eval_results_12-30-2022-04-01-56.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step41500_eval_results_12-30-2022-04-01-30.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step46500_eval_results_12-30-2022-04-38-36.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step51500_eval_results_12-30-2022-04-01-37.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step56500_eval_results_12-30-2022-04-01-45.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step61500_eval_results_12-30-2022-03-52-59.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step6500_eval_results_12-30-2022-03-48-32.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step66500_eval_results_12-30-2022-03-53-34.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/five-shot/pythia-1.4b-deduped-5shot-global_step71500_eval_results_12-30-2022-04-21-13.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step11500_eval_results_12-30-2022-03-54-18.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step1500_eval_results_12-30-2022-04-13-45.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step16500_eval_results_12-30-2022-03-54-27.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step21500_eval_results_12-30-2022-03-54-59.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step26500_eval_results_12-30-2022-03-57-27.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step31500_eval_results_12-30-2022-04-14-29.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step36500_eval_results_12-30-2022-04-13-44.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step41500_eval_results_12-30-2022-04-13-51.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step46500_eval_results_12-30-2022-04-14-46.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step51500_eval_results_12-30-2022-04-13-47.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step56500_eval_results_12-30-2022-04-13-44.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step61500_eval_results_12-30-2022-04-56-20.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step6500_eval_results_12-30-2022-03-54-21.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step66500_eval_results_12-30-2022-04-00-01.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b-deduped/zero-shot/pythia-1.4b-deduped-0shot-global_step71500_eval_results_12-30-2022-04-43-36.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step11500_eval_results_12-29-2022-16-26-51.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step1500_eval_results_12-29-2022-16-24-51.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step16500_eval_results_12-29-2022-16-27-09.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step21500_eval_results_12-29-2022-16-27-24.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step26500_eval_results_12-29-2022-16-49-20.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step31500_eval_results_12-29-2022-16-49-49.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step36500_eval_results_12-29-2022-16-51-31.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step41500_eval_results_12-29-2022-21-21-22.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step46500_eval_results_12-29-2022-16-51-24.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step51500_eval_results_12-29-2022-16-51-02.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step56500_eval_results_12-29-2022-16-51-33.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step61500_eval_results_12-29-2022-16-51-30.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step6500_eval_results_12-29-2022-16-26-41.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step66500_eval_results_12-29-2022-16-51-33.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/five-shot/pythia-1.4b-5shot-global_step71500_eval_results_12-29-2022-16-51-39.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step11500_eval_results_12-29-2022-16-09-11.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step1500_eval_results_12-27-2022-00-29-50.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step16500_eval_results_12-26-2022-22-11-03.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step21500_eval_results_12-26-2022-21-45-52.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step26500_eval_results_12-29-2022-16-09-11.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step31500_eval_results_12-29-2022-16-08-59.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step36500_eval_results_12-29-2022-16-34-14.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step41500_eval_results_12-29-2022-16-25-00.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step46500_eval_results_12-29-2022-16-25-05.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step51500_eval_results_12-29-2022-16-25-14.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step56500_eval_results_12-29-2022-16-26-12.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step61500_eval_results_12-29-2022-16-23-29.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step6500_eval_results_12-26-2022-21-46-51.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step66500_eval_results_12-29-2022-17-00-50.json
pretrain/pythia/evals/pythia-v0/pythia-1.4b/zero-shot/pythia-1.4b-0shot-global_step71500_eval_results_12-29-2022-16-23-33.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step103000_eval_results_12-20-2022-13-59-32.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step113000_eval_results_12-20-2022-13-34-55.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step123000_eval_results_12-20-2022-13-09-58.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step13000_eval_results_12-20-2022-12-45-28.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step133000_eval_results_12-20-2022-12-20-59.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step143000_eval_results_12-20-2022-11-52-04.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step23000_eval_results_12-20-2022-11-27-33.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step3000_eval_results_12-20-2022-11-01-58.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step33000_eval_results_12-20-2022-10-37-40.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step43000_eval_results_12-20-2022-10-12-29.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step53000_eval_results_12-20-2022-09-47-38.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step63000_eval_results_12-20-2022-09-18-13.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step73000_eval_results_12-20-2022-08-53-54.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step83000_eval_results_12-20-2022-08-28-18.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/five-shot/pythia-12b-deduped-5shot-global_step93000_eval_results_12-20-2022-08-03-23.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step103000_eval_results_12-16-2022-18-15-05.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step113000_eval_results_12-16-2022-18-28-45.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step123000_eval_results_12-16-2022-18-42-32.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step13000_eval_results_12-16-2022-18-56-02.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step133000_eval_results_12-16-2022-19-09-33.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step143000_eval_results_12-16-2022-19-23-03.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step23000_eval_results_12-16-2022-19-36-35.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step3000_eval_results_12-16-2022-19-50-04.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step33000_eval_results_12-16-2022-20-03-48.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step43000_eval_results_12-16-2022-20-17-13.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step53000_eval_results_12-16-2022-20-30-42.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step63000_eval_results_12-16-2022-20-44-20.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step73000_eval_results_12-16-2022-20-57-48.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step83000_eval_results_12-16-2022-21-11-22.json
pretrain/pythia/evals/pythia-v0/pythia-12b-deduped/zero-shot/pythia-12b-deduped-0shot-global_step93000_eval_results_12-16-2022-21-25-07.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step103000_eval_results_12-20-2022-07-39-05.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step113000_eval_results_12-20-2022-07-14-37.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step123000_eval_results_12-20-2022-06-49-11.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step13000_eval_results_12-20-2022-06-23-19.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step133000_eval_results_12-20-2022-05-59-05.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step143000_eval_results_12-20-2022-05-33-56.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step23000_eval_results_12-20-2022-05-09-51.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step3000_eval_results_12-20-2022-04-44-00.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step33000_eval_results_12-20-2022-04-19-59.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step43000_eval_results_12-20-2022-03-53-43.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step53000_eval_results_12-20-2022-03-29-29.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step63000_eval_results_12-20-2022-03-05-12.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step73000_eval_results_12-20-2022-02-41-06.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step83000_eval_results_12-20-2022-02-16-03.json
pretrain/pythia/evals/pythia-v0/pythia-12b/five-shot/pythia-12b-5shot-global_step93000_eval_results_12-20-2022-01-52-01.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step103000_eval_results_12-15-2022-22-24-35.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step113000_eval_results_12-15-2022-22-38-24.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step123000_eval_results_12-15-2022-22-52-05.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step13000_eval_results_12-15-2022-23-05-33.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step133000_eval_results_12-15-2022-23-19-06.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step143000_eval_results_12-15-2022-23-32-34.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step23000_eval_results_12-15-2022-23-45-57.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step3000_eval_results_12-15-2022-23-59-29.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step33000_eval_results_12-16-2022-00-23-30.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step43000_eval_results_12-16-2022-00-37-09.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step53000_eval_results_12-16-2022-00-55-53.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step63000_eval_results_12-16-2022-01-09-29.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step73000_eval_results_12-16-2022-01-28-05.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step83000_eval_results_12-16-2022-01-49-26.json
pretrain/pythia/evals/pythia-v0/pythia-12b/zero-shot/pythia-12b-0shot-global_step93000_eval_results_12-16-2022-02-08-04.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step11500_eval_results_12-30-2022-22-34-25.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step1500_eval_results_12-30-2022-22-46-27.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step16500_eval_results_12-30-2022-22-34-14.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step21500_eval_results_12-30-2022-22-34-43.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step26500_eval_results_12-30-2022-22-34-38.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step31500_eval_results_12-30-2022-22-34-38.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step36500_eval_results_12-30-2022-22-34-44.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step41500_eval_results_12-30-2022-22-34-25.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step46500_eval_results_12-30-2022-22-34-45.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step51500_eval_results_12-30-2022-22-34-48.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step56500_eval_results_12-30-2022-22-47-06.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step61500_eval_results_12-30-2022-22-34-51.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step6500_eval_results_12-30-2022-22-35-57.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step66500_eval_results_12-30-2022-22-34-52.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/five-shot/pythia-160m-deduped-5shot-global_step71500_eval_results_12-30-2022-22-34-55.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step11500_eval_results_12-30-2022-22-37-17.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step1500_eval_results_12-30-2022-22-50-08.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step16500_eval_results_12-30-2022-22-38-08.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step21500_eval_results_12-30-2022-22-38-14.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step26500_eval_results_12-30-2022-22-38-13.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step31500_eval_results_12-30-2022-22-38-01.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step36500_eval_results_12-30-2022-22-37-28.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step41500_eval_results_12-30-2022-22-38-28.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step46500_eval_results_12-30-2022-22-38-21.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step51500_eval_results_12-30-2022-22-37-46.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step56500_eval_results_12-30-2022-22-37-44.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step61500_eval_results_12-30-2022-22-37-42.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step6500_eval_results_12-30-2022-22-37-26.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step66500_eval_results_12-30-2022-22-37-49.json
pretrain/pythia/evals/pythia-v0/pythia-160m-deduped/zero-shot/pythia-160m-deduped-0shot-global_step71500_eval_results_12-30-2022-22-38-31.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step11500_eval_results_12-30-2022-23-02-58.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step1500_eval_results_12-31-2022-01-00-06.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step16500_eval_results_12-30-2022-23-03-02.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step21500_eval_results_12-30-2022-23-02-51.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step26500_eval_results_12-30-2022-23-03-08.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step31500_eval_results_12-30-2022-23-02-49.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step36500_eval_results_12-30-2022-23-02-50.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step41500_eval_results_12-30-2022-23-02-53.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step46500_eval_results_12-30-2022-23-03-12.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step51500_eval_results_12-31-2022-01-00-04.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step56500_eval_results_12-30-2022-23-02-57.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step61500_eval_results_12-30-2022-23-03-00.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step6500_eval_results_12-30-2022-23-02-54.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step66500_eval_results_12-30-2022-23-03-18.json
pretrain/pythia/evals/pythia-v0/pythia-160m/five-shot/pythia-160m-5shot-global_step71500_eval_results_12-30-2022-23-03-22.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step11500_eval_results_12-30-2022-23-05-56.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step1500_eval_results_12-30-2022-23-06-34.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step16500_eval_results_12-30-2022-23-06-00.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step21500_eval_results_12-30-2022-23-06-16.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step26500_eval_results_12-30-2022-23-05-58.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step31500_eval_results_12-30-2022-23-05-58.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step36500_eval_results_12-30-2022-23-06-52.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step41500_eval_results_12-30-2022-23-06-47.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step46500_eval_results_12-30-2022-23-06-56.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step51500_eval_results_12-30-2022-23-06-13.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step56500_eval_results_12-30-2022-23-06-53.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step61500_eval_results_12-30-2022-23-06-15.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step6500_eval_results_12-30-2022-23-06-33.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step66500_eval_results_12-30-2022-23-07-07.json
pretrain/pythia/evals/pythia-v0/pythia-160m/zero-shot/pythia-160m-0shot-global_step71500_eval_results_12-30-2022-23-06-54.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step103000_eval_results_11-28-2022-18-00-33.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step113000_eval_results_11-28-2022-18-01-24.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step123000_eval_results_11-28-2022-18-02-23.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step13000_eval_results_11-28-2022-17-51-42.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step133000_eval_results_11-28-2022-18-03-21.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step143000_eval_results_11-28-2022-18-04-11.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step23000_eval_results_11-28-2022-17-52-44.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step3000_eval_results_11-28-2022-17-50-14.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step33000_eval_results_11-28-2022-17-53-44.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step43000_eval_results_11-28-2022-17-54-21.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step53000_eval_results_11-28-2022-17-55-36.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step63000_eval_results_11-28-2022-17-56-52.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step73000_eval_results_11-28-2022-17-57-29.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step83000_eval_results_11-28-2022-17-58-34.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/five-shot/pythia-1b-deduped-5shot-global_step93000_eval_results_11-28-2022-17-59-50.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step103000_eval_results_11-28-2022-18-03-23.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step113000_eval_results_11-28-2022-18-04-01.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step123000_eval_results_11-28-2022-18-05-05.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step13000_eval_results_11-28-2022-17-53-09.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step133000_eval_results_11-28-2022-18-05-58.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step143000_eval_results_11-28-2022-18-07-27.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step23000_eval_results_11-28-2022-17-54-12.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step3000_eval_results_11-28-2022-17-51-47.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step33000_eval_results_11-28-2022-17-56-21.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step43000_eval_results_11-28-2022-17-57-17.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step53000_eval_results_11-28-2022-17-58-24.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step63000_eval_results_11-28-2022-17-59-15.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step73000_eval_results_11-28-2022-18-00-31.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step83000_eval_results_11-28-2022-18-00-19.json
pretrain/pythia/evals/pythia-v0/pythia-1b-deduped/zero-shot/pythia-1b-deduped-0shot-global_step93000_eval_results_11-28-2022-18-01-59.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step103000_eval_results_11-28-2022-15-10-46.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step113000_eval_results_11-28-2022-15-10-43.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step123000_eval_results_11-28-2022-15-10-45.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step13000_eval_results_11-28-2022-15-10-48.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step133000_eval_results_11-28-2022-15-10-39.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step143000_eval_results_11-28-2022-15-10-39.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step23000_eval_results_11-28-2022-15-10-43.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step3000_eval_results_11-28-2022-15-06-31.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step33000_eval_results_11-28-2022-15-10-39.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step43000_eval_results_11-28-2022-15-10-44.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step53000_eval_results_11-28-2022-15-10-47.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step63000_eval_results_11-28-2022-15-11-10.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step73000_eval_results_11-28-2022-15-10-36.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step83000_eval_results_11-28-2022-15-10-51.json
pretrain/pythia/evals/pythia-v0/pythia-1b/five-shot/pythia-1b-5shot-global_step93000_eval_results_11-28-2022-15-10-49.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step103000_eval_results_11-28-2022-15-14-22.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step113000_eval_results_11-28-2022-15-14-25.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step123000_eval_results_11-28-2022-15-15-35.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step13000_eval_results_11-28-2022-15-10-08.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step133000_eval_results_11-28-2022-15-15-29.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step143000_eval_results_11-28-2022-15-14-35.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step23000_eval_results_11-28-2022-15-15-27.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step3000_eval_results_11-28-2022-15-05-57.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step33000_eval_results_11-28-2022-15-15-30.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step43000_eval_results_11-28-2022-15-14-28.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step53000_eval_results_11-28-2022-15-15-26.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step63000_eval_results_11-28-2022-15-15-24.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step73000_eval_results_11-28-2022-15-14-32.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step83000_eval_results_11-28-2022-15-14-22.json
pretrain/pythia/evals/pythia-v0/pythia-1b/zero-shot/pythia-1b-0shot-global_step93000_eval_results_11-28-2022-15-14-36.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step103000_eval_results_11-26-2022-05-01-36.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step113000_eval_results_11-26-2022-02-36-10.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step123000_eval_results_11-26-2022-02-35-47.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step13000_eval_results_11-26-2022-05-01-37.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step133000_eval_results_11-26-2022-02-36-09.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step143000_eval_results_11-26-2022-02-36-21.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step23000_eval_results_11-26-2022-02-23-28.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step3000_eval_results_11-26-2022-02-23-25.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step33000_eval_results_11-26-2022-02-23-34.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step43000_eval_results_11-26-2022-02-23-34.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step53000_eval_results_11-26-2022-02-23-33.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step63000_eval_results_11-26-2022-02-23-49.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step73000_eval_results_11-26-2022-02-23-50.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step83000_eval_results_11-26-2022-02-23-44.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/five-shot/pythia-2.8b-deduped-5shot-global_step93000_eval_results_11-26-2022-02-24-09.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step103000_eval_results_11-26-2022-02-28-33.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step113000_eval_results_11-26-2022-02-40-27.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step123000_eval_results_11-26-2022-02-40-13.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step13000_eval_results_11-26-2022-02-28-07.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step133000_eval_results_11-26-2022-02-39-33.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step143000_eval_results_11-26-2022-02-41-00.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step23000_eval_results_11-26-2022-02-28-10.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step3000_eval_results_11-26-2022-02-28-22.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step33000_eval_results_11-26-2022-02-29-15.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step43000_eval_results_11-26-2022-02-28-12.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step53000_eval_results_11-26-2022-02-27-39.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step63000_eval_results_11-26-2022-02-28-25.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step73000_eval_results_11-26-2022-02-28-12.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step83000_eval_results_11-26-2022-02-28-25.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b-deduped/zero-shot/pythia-2.8b-deduped-0shot-global_step93000_eval_results_11-26-2022-02-28-30.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step103000__eval_results_11-25-2022-03-54-15.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step113000__eval_results_11-25-2022-03-54-38.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step123000__eval_results_11-25-2022-04-05-24.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step13000__eval_results_11-25-2022-02-45-25.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step133000__eval_results_11-25-2022-04-06-55.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step143000__eval_results_11-25-2022-02-43-24.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step23000__eval_results_11-25-2022-03-09-25.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step3000__eval_results_11-25-2022-02-43-32.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step33000__eval_results_11-25-2022-03-09-11.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step43000__eval_results_11-25-2022-03-21-37.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step53000__eval_results_11-25-2022-03-25-43.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step63000__eval_results_11-25-2022-03-36-41.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step73000__eval_results_11-25-2022-03-41-16.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step83000__eval_results_11-25-2022-03-49-52.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/five-shot/pythia-2.8b-5shot-global_step93000__eval_results_11-25-2022-03-54-21.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step103000__eval_results_11-25-2022-03-57-52.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step113000__eval_results_11-25-2022-03-58-41.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step123000__eval_results_11-25-2022-04-06-21.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step13000__eval_results_11-25-2022-02-48-04.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step133000__eval_results_11-25-2022-04-10-59.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step143000__eval_results_11-24-2022-16-20-50.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step23000__eval_results_11-25-2022-03-11-56.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step3000__eval_results_11-25-2022-02-47-21.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step33000__eval_results_11-25-2022-03-13-32.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step43000__eval_results_11-25-2022-03-24-11.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step53000__eval_results_11-25-2022-03-28-39.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step63000__eval_results_11-25-2022-03-37-35.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step73000__eval_results_11-25-2022-03-42-15.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step83000__eval_results_11-25-2022-03-52-40.json
pretrain/pythia/evals/pythia-v0/pythia-2.8b/zero-shot/pythia-2.8b-0shot-global_step93000__eval_results_11-25-2022-03-56-42.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step11500_eval_results_12-30-2022-22-04-10.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step1500_eval_results_12-30-2022-22-04-06.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step16500_eval_results_12-30-2022-22-04-37.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step21500_eval_results_12-30-2022-22-04-38.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step26500_eval_results_12-30-2022-22-04-27.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step31500_eval_results_12-30-2022-22-04-28.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step36500_eval_results_12-30-2022-22-05-26.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step41500_eval_results_12-30-2022-22-05-12.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step46500_eval_results_12-30-2022-22-05-08.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step51500_eval_results_12-30-2022-22-05-13.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step56500_eval_results_12-30-2022-22-05-35.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step61500_eval_results_12-30-2022-22-05-40.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step6500_eval_results_12-30-2022-22-04-04.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step66500_eval_results_12-30-2022-22-05-21.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/five-shot/pythia-410m-deduped-5shot-global_step71500_eval_results_12-30-2022-22-05-30.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step11500_eval_results_12-30-2022-22-07-55.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step1500_eval_results_12-30-2022-22-07-51.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step16500_eval_results_12-30-2022-22-07-24.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step21500_eval_results_12-30-2022-22-07-54.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step26500_eval_results_12-30-2022-22-21-57.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step31500_eval_results_12-30-2022-22-08-23.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step36500_eval_results_12-30-2022-22-08-08.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step41500_eval_results_12-30-2022-22-08-10.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step46500_eval_results_12-30-2022-22-09-03.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step51500_eval_results_12-30-2022-22-26-17.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step56500_eval_results_12-30-2022-22-08-41.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step61500_eval_results_12-30-2022-22-08-41.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step6500_eval_results_12-30-2022-22-07-13.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step66500_eval_results_12-30-2022-22-09-21.json
pretrain/pythia/evals/pythia-v0/pythia-410m-deduped/zero-shot/pythia-410m-deduped-0shot-global_step71500_eval_results_12-30-2022-22-09-21.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step11500_eval_results_12-30-2022-21-45-58.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step1500_eval_results_12-30-2022-21-45-51.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step16500_eval_results_12-30-2022-21-46-01.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step21500_eval_results_12-30-2022-21-46-09.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step26500_eval_results_12-30-2022-21-46-34.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step31500_eval_results_12-30-2022-21-46-15.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step36500_eval_results_12-30-2022-21-46-19.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step41500_eval_results_12-30-2022-21-46-53.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step46500_eval_results_12-30-2022-21-46-53.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step51500_eval_results_12-30-2022-21-47-01.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step56500_eval_results_12-30-2022-21-46-34.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step61500_eval_results_12-30-2022-21-47-14.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step6500_eval_results_12-30-2022-21-46-25.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step66500_eval_results_12-30-2022-21-46-41.json
pretrain/pythia/evals/pythia-v0/pythia-410m/five-shot/pythia-410m-5shot-global_step71500_eval_results_12-30-2022-21-47-06.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step11500_eval_results_12-30-2022-21-51-56.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step1500_eval_results_12-30-2022-21-50-38.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step16500_eval_results_12-30-2022-21-50-46.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step21500_eval_results_12-30-2022-21-52-17.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step26500_eval_results_12-30-2022-21-52-17.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step31500_eval_results_12-30-2022-21-51-01.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step36500_eval_results_12-30-2022-21-51-17.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step41500_eval_results_12-30-2022-21-52-30.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step46500_eval_results_12-30-2022-21-52-25.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step51500_eval_results_12-30-2022-21-51-14.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step56500_eval_results_12-30-2022-21-51-20.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step61500_eval_results_12-30-2022-21-51-26.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step6500_eval_results_12-30-2022-21-51-14.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step66500_eval_results_12-30-2022-21-52-40.json
pretrain/pythia/evals/pythia-v0/pythia-410m/zero-shot/pythia-410m-0shot-global_step71500_eval_results_12-30-2022-21-51-27.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step103000_eval_results_12-20-2022-00-48-39.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step113000_eval_results_12-20-2022-00-33-15.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step123000_eval_results_12-20-2022-00-17-38.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step13000_eval_results_12-20-2022-00-01-42.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step133000_eval_results_12-19-2022-23-45-11.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step143000_eval_results_12-19-2022-23-29-46.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step23000_eval_results_12-19-2022-23-12-53.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step3000_eval_results_12-19-2022-22-57-29.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step33000_eval_results_12-19-2022-22-41-50.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step43000_eval_results_12-19-2022-22-26-30.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step53000_eval_results_12-19-2022-22-10-49.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step63000_eval_results_12-19-2022-21-55-22.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step73000_eval_results_12-19-2022-21-38-17.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step83000_eval_results_12-19-2022-21-22-52.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/five-shot/pythia-6.9b-deduped-5shot-global_step93000_eval_results_12-19-2022-21-07-09.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step103000_eval_results_12-20-2022-20-54-37.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step113000_eval_results_12-20-2022-20-46-45.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step123000_eval_results_12-20-2022-20-38-56.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step13000_eval_results_12-20-2022-20-31-05.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step133000_eval_results_12-20-2022-20-23-11.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step143000_eval_results_12-20-2022-20-15-20.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step23000_eval_results_12-20-2022-20-07-26.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step3000_eval_results_12-20-2022-19-59-34.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step33000_eval_results_12-20-2022-19-51-35.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step43000_eval_results_12-20-2022-19-43-43.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step53000_eval_results_12-20-2022-19-35-45.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step63000_eval_results_12-20-2022-19-27-53.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step73000_eval_results_12-20-2022-19-20-00.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step83000_eval_results_12-20-2022-19-12-06.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b-deduped/zero-shot/pythia-6.9b-deduped-0shot-global_step93000_eval_results_12-20-2022-19-04-13.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step103000_eval_results_12-19-2022-20-51-26.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step113000_eval_results_12-19-2022-20-36-03.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step123000_eval_results_12-19-2022-20-20-40.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step13000_eval_results_12-19-2022-20-04-51.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step133000_eval_results_12-19-2022-19-49-14.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step143000_eval_results_12-19-2022-19-33-55.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step23000_eval_results_12-19-2022-19-18-34.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step3000_eval_results_12-19-2022-19-03-15.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step33000_eval_results_12-19-2022-18-46-18.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step43000_eval_results_12-19-2022-18-30-54.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step53000_eval_results_12-19-2022-18-15-30.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step63000_eval_results_12-19-2022-18-00-00.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step73000_eval_results_12-19-2022-17-44-34.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step83000_eval_results_12-19-2022-17-27-28.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/five-shot/pythia-6.9b-5shot-global_step93000_eval_results_12-19-2022-17-04-44.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step103000_eval_results_12-18-2022-18-19-16.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step113000_eval_results_12-18-2022-18-27-02.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step123000_eval_results_12-18-2022-18-34-56.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step13000_eval_results_12-18-2022-18-42-52.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step133000_eval_results_12-18-2022-18-50-47.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step143000_eval_results_12-18-2022-18-58-35.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step23000_eval_results_12-18-2022-19-06-30.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step3000_eval_results_12-18-2022-19-14-21.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step33000_eval_results_12-18-2022-19-22-09.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step43000_eval_results_12-18-2022-23-03-40.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step53000_eval_results_12-18-2022-22-55-40.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step63000_eval_results_12-18-2022-22-47-49.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step73000_eval_results_12-18-2022-22-39-58.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step83000_eval_results_12-18-2022-22-32-05.json
pretrain/pythia/evals/pythia-v0/pythia-6.9b/zero-shot/pythia-6.9b-0shot-global_step93000_eval_results_12-18-2022-22-24-13.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step103000_eval_results_11-25-2022-21-28-37.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step113000_eval_results_11-25-2022-21-29-04.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step123000_eval_results_11-25-2022-21-29-46.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step13000_eval_results_11-25-2022-20-58-06.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step133000_eval_results_11-25-2022-21-30-01.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step143000_eval_results_11-25-2022-21-30-49.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step23000_eval_results_11-25-2022-21-04-29.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step3000_eval_results_11-25-2022-20-54-46.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step33000_eval_results_11-25-2022-21-08-23.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step43000_eval_results_11-25-2022-21-17-47.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step53000_eval_results_11-25-2022-21-22-31.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step63000_eval_results_11-25-2022-21-22-29.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step73000_eval_results_11-25-2022-21-22-47.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step83000_eval_results_11-25-2022-21-23-37.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/five-shot/pythia-70m-deduped-5shot-global_step93000_eval_results_11-25-2022-21-24-32.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step103000_eval_results_11-25-2022-21-29-28.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step113000_eval_results_11-25-2022-21-29-34.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step123000_eval_results_11-25-2022-21-30-17.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step13000_eval_results_11-25-2022-20-58-19.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step133000_eval_results_11-25-2022-21-30-39.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step143000_eval_results_11-25-2022-21-31-34.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step23000_eval_results_11-25-2022-21-02-02.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step3000_eval_results_11-25-2022-20-47-16.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step33000_eval_results_11-25-2022-21-05-41.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step43000_eval_results_11-25-2022-21-16-52.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step53000_eval_results_11-25-2022-21-22-17.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step63000_eval_results_11-25-2022-21-23-33.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step73000_eval_results_11-25-2022-21-23-11.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step83000_eval_results_11-25-2022-21-23-32.json
pretrain/pythia/evals/pythia-v0/pythia-70m-deduped/zero-shot/pythia-70m-deduped-0shot-global_step93000_eval_results_11-25-2022-21-24-25.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step103000_eval_results_11-25-2022-07-51-28.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step113000_eval_results_11-25-2022-05-47-11.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step113000_eval_results_11-25-2022-08-05-23.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step123000_eval_results_11-25-2022-10-03-17.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step13000_eval_results_11-25-2022-06-27-49.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step133000_eval_results_11-25-2022-10-09-57.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step143000_eval_results_11-25-2022-10-23-30.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step23000_eval_results_11-25-2022-06-41-36.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step3000_eval_results_11-25-2022-06-14-21.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step33000_eval_results_11-25-2022-06-55-24.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step43000_eval_results_11-25-2022-07-09-00.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step53000_eval_results_11-25-2022-06-00-35.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step53000_eval_results_11-25-2022-07-22-36.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step63000_eval_results_11-25-2022-07-29-28.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step73000_eval_results_11-25-2022-07-36-03.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step83000_eval_results_11-25-2022-07-37-55.json
pretrain/pythia/evals/pythia-v0/pythia-70m/five-shot/pythia-70m-5shot-global_step93000_eval_results_11-25-2022-07-42-59.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step103000_eval_results_11-25-2022-07-44-49.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step113000_eval_results_11-25-2022-07-58-32.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step123000_eval_results_11-25-2022-05-54-21.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step123000_eval_results_11-25-2022-08-12-38.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step13000_eval_results_11-25-2022-06-21-35.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step133000_eval_results_11-25-2022-11-14-21.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step143000_eval_results_11-25-2022-10-16-50.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step23000_eval_results_11-25-2022-06-35-08.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step3000_eval_results_11-25-2022-06-07-56.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step33000_eval_results_11-25-2022-06-49-01.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step43000_eval_results_11-25-2022-07-02-34.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step53000_eval_results_11-25-2022-07-16-11.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step63000_eval_results_11-25-2022-07-24-20.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step73000_eval_results_11-25-2022-07-31-37.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step83000_eval_results_11-25-2022-07-36-35.json
pretrain/pythia/evals/pythia-v0/pythia-70m/zero-shot/pythia-70m-0shot-global_step93000_eval_results_11-25-2022-07-43-06.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-14-30-34.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-22-38.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-24-20.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-26-33.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-28-38.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-28-54.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-29-38.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-33-29.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-33-34.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-35-09.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-37-10.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-37-45.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-37-55.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-50-01.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-21-2023-15-52-00.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-24-2023-18-31-29.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-24-2023-18-31-37.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-24-2023-18-32-02.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-24-2023-18-32-13.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-24-2023-18-37-07.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-24-2023-18-45-44.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-24-2023-19-00-25.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-25-2023-03-04-17.json
pretrain/pythia/evals/pythia-v0/winobias/1.3B/eval_results_01-25-2023-03-47-45.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-20-2023-23-52-37.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-01-19-03.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-02-20-36.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-03-19-40.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-04-18-14.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-05-16-05.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-06-14-38.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-07-14-31.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-08-12-00.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-09-10-08.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-10-07-48.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-14-29-49.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-15-26-53.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-22-43-09.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-21-2023-22-51-44.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-42-45.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-42-53.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-42-56.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-43-38.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-44-31.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-46-01.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-50-56.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-24-2023-19-52-23.json
pretrain/pythia/evals/pythia-v0/winobias/19M/eval_results_01-25-2023-15-43-07.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-02-14-11.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-02-23-20.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-02-29-55.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-02-32-16.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-02-33-32.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-02-50-11.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-02-53-18.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-04-23-21.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-05-43-59.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-05-54-05.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-05-55-00.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-06-11-51.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-06-19-18.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-06-40-14.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-21-2023-08-10-36.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-08-29.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-18-52.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-20-13.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-21-25.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-26-43.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-27-30.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-32-35.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-35-29.json
pretrain/pythia/evals/pythia-v0/winobias/350M/eval_results_01-24-2023-18-55-08.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-01-58-42.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-25-13.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-30-02.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-30-13.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-31-42.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-32-49.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-33-32.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-35-03.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-36-06.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-36-07.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-37-28.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-42-08.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-02-45-20.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-03-06-22.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-22-2023-03-08-28.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-24-2023-23-56-32.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-24-2023-23-56-36.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-24-2023-23-56-43.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-25-2023-00-07-18.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-25-2023-00-07-32.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-25-2023-00-10-35.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-25-2023-00-13-40.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-25-2023-00-26-01.json
pretrain/pythia/evals/pythia-v0/winobias/6.7B/eval_results_01-25-2023-00-29-10.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-46-14.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-47-20.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-47-36.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-48-07.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-48-49.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-49-18.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-49-36.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-49-44.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-51-26.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-53-30.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-53-59.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-54-28.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-55-35.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-03-57-27.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-04-05-03.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-04-06-10.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-04-07-28.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-04-19-13.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_21/1.3B/eval_results_01-25-2023-04-22-09.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-22-2023-21-31-01.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-22-2023-21-36-10.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-22-2023-21-52-02.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-22-2023-22-04-15.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-22-2023-22-24-59.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-23-2023-00-52-51.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-23-2023-00-59-54.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-23-2023-01-27-13.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-23-2023-01-49-14.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/1.3B/eval_results_01-23-2023-01-51-41.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-02-31.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-03-03.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-03-22.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-03-53.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-04-39.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-09-32.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-09-56.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-12-37.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-01-13-32.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/19M/eval_results_01-25-2023-13-15-40.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-22-2023-21-12-36.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-22-2023-21-21-15.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-22-2023-21-38-04.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-23-2023-00-35-32.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-23-2023-00-40-23.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-23-2023-00-59-51.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-23-2023-03-57-28.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-23-2023-04-10-36.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-23-2023-07-17-13.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/350M/eval_results_01-23-2023-08-09-45.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-04-33-40.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-04-34-59.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-04-37-33.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-04-37-48.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-04-39-00.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-04-39-56.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-04-49-40.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-05-09-12.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-05-23-12.json
pretrain/pythia/evals/pythia-v0/winobias/intervene_7/6.7B/eval_results_01-25-2023-13-28-09.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step106000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step126000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step146000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step166000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step186000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step206000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step226000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step246000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step26000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step266000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step286000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step46000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step6000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step66000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-1MtokBS/1.4b-1MtokBS_step86000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step114000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step115000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step116000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step117000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step118000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step119000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step120000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step121000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step122000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step124000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step125000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step126000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step127000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step128000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step129000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step130000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step131000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step132000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/baseline/baseline-1.4b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/five-shot/1.4b-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step114000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step115000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step116000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step117000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step118000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step119000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step120000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step121000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step122000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step124000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step125000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step126000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step127000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step128000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step129000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step130000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step131000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step132000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped-long_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/intervention/intervention-1.4b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b-deduped/zero-shot/1.4b-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/five-shot/1.4b-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step0.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step1.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step128.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step16.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step2.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step256.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step32.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step4.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step512.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step64.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step8.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1.4b/zero-shot/1.4b_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/five-shot/12b-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-12b-deduped/zero-shot/12b-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/five-shot/12b-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step0.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step1.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step128.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step16.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step2.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step256.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step32.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step4.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step512.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step64.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step8.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-12b/zero-shot/12b_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step12000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step132000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step172000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step212000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step252000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step292000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step332000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step372000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step412000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step452000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step492000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step52000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step532000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step572000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-0.5MtokBS/160m-0.5MtokBS_step92000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/five-shot/160m-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-160m-deduped/zero-shot/160m-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/five-shot/160m-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step0.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step1.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step128.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step16.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step2.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step256.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step32.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step4.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step512.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step64.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step8.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-160m/zero-shot/160m_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step12000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step132000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step172000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step212000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step252000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step292000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step332000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step372000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step412000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step452000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step492000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step52000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step532000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step572000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-0.5MtokBS/five-shot/1b-0.5MtokBS_step92000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/five-shot/1b-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16-5shot_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16-5shot_step128.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16-5shot_step256.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16-5shot_step512.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step0.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step1.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step16.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step2.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step32.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step4.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step64.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step8.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-bf16/zero-shot/1b-bf16_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/five-shot/1b-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-1b-deduped/zero-shot/1b-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/five-shot/2.8b-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b-deduped/zero-shot/2.8b-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/five-shot/2.8b-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step0.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step1.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step128.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step16.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step2.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step256.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step32.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step4.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step512.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step64.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step8.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-2.8b/zero-shot/2.8b_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step12000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step132000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step172000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step212000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step252000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step292000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step332000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step372000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step412000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step452000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step492000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step52000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step532000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step572000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-0.5MtokBS/410m-0.5MtokBS_step92000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/baseline/baseline-410m-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/five-shot/410m-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/intervention/intervention-410m-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-410m-deduped/zero-shot/410m-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/five-shot/410m-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step0.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step1.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step128.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step16.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step2.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step256.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step32.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step4.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step512.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step64.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step8.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-410m/zero-shot/410m_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/baseline/baseline-6.9b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/five-shot/6.9b-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/intervention/intervention-6.9b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b-deduped/zero-shot/6.9b-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/five-shot/6.9b-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step0.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step1.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step128.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step16.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step2.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step256.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step32.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step4.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step512.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step64.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step8.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-6.9b/zero-shot/6.9b_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step104000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step1144000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step184000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step24000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step264000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step344000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step424000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step504000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step584000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step664000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step744000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step824000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step904000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-0.25MtokBS/five-shot/70m-0.25MtokBS_step984000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/baseline/baseline-70m-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/five-shot/70m-deduped-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step134000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step135000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step136000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step137000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step138000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step139000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step140000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step141000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step142000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/intervention/intervention-70m-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step0.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step1.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step128.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step16.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step2.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step256.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step32.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step4.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step512.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step64.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step8.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-70m-deduped/zero-shot/70m-deduped_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/five-shot/70m-5shot_step93000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step0.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step1.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step1000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step103000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step113000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step123000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step128.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step13000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step133000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step143000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step16.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step2.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step23000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step256.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step3000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step32.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step33000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step4.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step43000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step512.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step53000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step63000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step64.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step73000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step8.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step83000.json
pretrain/pythia/evals/pythia-v1/pythia-70m/zero-shot/70m_step93000.json
pretrain/pythia/models/1.4B/pythia-1.4b-deduped.yml
pretrain/pythia/models/1.4B/pythia-1.4b.yml
pretrain/pythia/models/12B/pythia-12b-deduped.yml
pretrain/pythia/models/12B/pythia-12b.yml
pretrain/pythia/models/14M/pythia-14m.yml
pretrain/pythia/models/160M/pythia-160m-deduped.yml
pretrain/pythia/models/160M/pythia-160m.yml
pretrain/pythia/models/1B/pythia-1b-deduped.yml
pretrain/pythia/models/1B/pythia-1b.yml
pretrain/pythia/models/2.8B/pythia-2.8b-deduped.yml
pretrain/pythia/models/2.8B/pythia-2.8b.yml
pretrain/pythia/models/31M/pythia-31m.yml
pretrain/pythia/models/410M/pythia-410m-deduped.yml
pretrain/pythia/models/410M/pythia-410m.yml
pretrain/pythia/models/6.9B/pythia-6.9b-deduped.yml
pretrain/pythia/models/6.9B/pythia-6.9b.yml
pretrain/pythia/models/70M/pythia-70m-deduped.yml
pretrain/pythia/models/70M/pythia-70m.yml
pretrain/pythia/polypythias/README.md
pretrain/pythia/polypythias/plots.ipynb
pretrain/pythia/polypythias/data/training_maps.tsv
pretrain/pythia/predictable-memorization/README.md
pretrain/pythia/predictable-memorization/eda.ipynb
pretrain/pythia/predictable-memorization/eval_memorization.py
pretrain/pythia/predictable-memorization/mem_graph.py
pretrain/pythia/predictable-memorization/memorization.py
pretrain/pythia/predictable-memorization/multinode_runner.sbatch
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_1.3b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_1.3b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_1.3b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_1.3b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_1.3b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_1.3b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_1.3b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_125m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_125m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_125m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_125m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_125m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_125m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_125m_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_13b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_13b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_13b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_13b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_13b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_13b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_13b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_19m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_19m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_19m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_19m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_19m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_19m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_19m_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_2.7b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_2.7b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_2.7b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_2.7b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_2.7b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_2.7b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_2.7b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_350m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_350m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_350m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_350m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_350m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_350m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_350m_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_6.7b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_6.7b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_6.7b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_6.7b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_6.7b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_6.7b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_6.7b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_800m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_800m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_800m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_800m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_800m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_800m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_early_checkpoint_predict_last_checkpoint/graph_800m_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_rates_through_time/graph_fnr.svg
pretrain/pythia/predictable-memorization/graphs/memorization_rates_through_time/graph_fpr.svg
pretrain/pythia/predictable-memorization/graphs/memorization_rates_through_time/graph_tpr.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_1.3b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_1.3b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_1.3b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_1.3b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_1.3b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_1.3b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_1.3b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_125m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_125m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_125m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_125m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_125m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_125m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_125m_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_13b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_13b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_13b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_13b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_13b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_13b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_13b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_19m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_19m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_19m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_19m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_19m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_19m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_19m_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_2.7b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_2.7b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_2.7b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_2.7b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_2.7b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_2.7b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_2.7b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_350m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_350m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_350m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_350m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_350m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_350m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_350m_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_6.7b_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_6.7b_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_6.7b_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_6.7b_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_6.7b_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_6.7b_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_6.7b_85m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_800m_105m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_800m_126m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_800m_146m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_800m_23m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_800m_44m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_800m_65m.svg
pretrain/pythia/predictable-memorization/graphs/memorization_small_model_predict_large_model/graph_800m_85m.svg
pretrain/pythia/utils/20B_tokenizer.json
pretrain/pythia/utils/batch_viewer.py
pretrain/pythia/utils/checksum_shards.py
pretrain/pythia/utils/dummy_config.yml
pretrain/pythia/utils/mmap_dataset.py
pretrain/pythia/utils/scrape.py
pretrain/pythia/utils/shard_hashes.txt
pretrain/pythia/utils/shard_memmap.py
pretrain/pythia/utils/unshard_memmap.py
pretrain/scripts/collect_attention_free_results.py
pretrain/scripts/generate_attention_free_configs.sh
pretrain/scripts/run_all_attention_free_experiments.sh
pretrain/scripts/test_attention_free_setup.sh
quantization/lm-evaluation-harness-main/.coveragerc
quantization/lm-evaluation-harness-main/.flake8
quantization/lm-evaluation-harness-main/.pre-commit-config.yaml
quantization/lm-evaluation-harness-main/BENCHMARK_README.md
quantization/lm-evaluation-harness-main/CITATION.bib
quantization/lm-evaluation-harness-main/CODEOWNERS
quantization/lm-evaluation-harness-main/LICENSE.md
quantization/lm-evaluation-harness-main/README.md
quantization/lm-evaluation-harness-main/batch_eval.py
quantization/lm-evaluation-harness-main/demo_sample.py
quantization/lm-evaluation-harness-main/ignore.txt
quantization/lm-evaluation-harness-main/mypy.ini
quantization/lm-evaluation-harness-main/pile_statistics.json
quantization/lm-evaluation-harness-main/process_results.py
quantization/lm-evaluation-harness-main/pyproject.toml
quantization/lm-evaluation-harness-main/requirements.txt
quantization/lm-evaluation-harness-main/setup.py
quantization/lm-evaluation-harness-main/test_monitor.py
quantization/lm-evaluation-harness-main/.github/workflows/new_tasks.yml
quantization/lm-evaluation-harness-main/.github/workflows/publish.yml
quantization/lm-evaluation-harness-main/.github/workflows/unit_tests.yml
quantization/lm-evaluation-harness-main/docs/API_guide.md
quantization/lm-evaluation-harness-main/docs/CONTRIBUTING.md
quantization/lm-evaluation-harness-main/docs/README.md
quantization/lm-evaluation-harness-main/docs/chat-template-readme.md
quantization/lm-evaluation-harness-main/docs/decontamination.md
quantization/lm-evaluation-harness-main/docs/interface.md
quantization/lm-evaluation-harness-main/docs/model_guide.md
quantization/lm-evaluation-harness-main/docs/new_task_guide.md
quantization/lm-evaluation-harness-main/docs/task_guide.md
quantization/lm-evaluation-harness-main/docs/img/fewshot_example_gpt3.png
quantization/lm-evaluation-harness-main/examples/lm-eval-overview.ipynb
quantization/lm-evaluation-harness-main/examples/transformer-lens.py
quantization/lm-evaluation-harness-main/examples/visualize-wandb.ipynb
quantization/lm-evaluation-harness-main/examples/visualize-zeno.ipynb
quantization/lm-evaluation-harness-main/lm_eval/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/__main__.py
quantization/lm-evaluation-harness-main/lm_eval/evaluator.py
quantization/lm-evaluation-harness-main/lm_eval/evaluator_utils.py
quantization/lm-evaluation-harness-main/lm_eval/utils.py
quantization/lm-evaluation-harness-main/lm_eval.egg-info/PKG-INFO
quantization/lm-evaluation-harness-main/lm_eval.egg-info/SOURCES.txt
quantization/lm-evaluation-harness-main/lm_eval.egg-info/dependency_links.txt
quantization/lm-evaluation-harness-main/lm_eval.egg-info/entry_points.txt
quantization/lm-evaluation-harness-main/lm_eval.egg-info/requires.txt
quantization/lm-evaluation-harness-main/lm_eval.egg-info/top_level.txt
quantization/lm-evaluation-harness-main/lm_eval/api/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/api/filter.py
quantization/lm-evaluation-harness-main/lm_eval/api/group.py
quantization/lm-evaluation-harness-main/lm_eval/api/instance.py
quantization/lm-evaluation-harness-main/lm_eval/api/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/api/model.py
quantization/lm-evaluation-harness-main/lm_eval/api/registry.py
quantization/lm-evaluation-harness-main/lm_eval/api/samplers.py
quantization/lm-evaluation-harness-main/lm_eval/api/task.py
quantization/lm-evaluation-harness-main/lm_eval/caching/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/caching/cache.py
quantization/lm-evaluation-harness-main/lm_eval/decontamination/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/decontamination/archiver.py
quantization/lm-evaluation-harness-main/lm_eval/decontamination/decontaminate.py
quantization/lm-evaluation-harness-main/lm_eval/decontamination/janitor.py
quantization/lm-evaluation-harness-main/lm_eval/filters/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/filters/custom.py
quantization/lm-evaluation-harness-main/lm_eval/filters/decontamination.py
quantization/lm-evaluation-harness-main/lm_eval/filters/extraction.py
quantization/lm-evaluation-harness-main/lm_eval/filters/selection.py
quantization/lm-evaluation-harness-main/lm_eval/filters/transformation.py
quantization/lm-evaluation-harness-main/lm_eval/loggers/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/loggers/evaluation_tracker.py
quantization/lm-evaluation-harness-main/lm_eval/loggers/utils.py
quantization/lm-evaluation-harness-main/lm_eval/loggers/wandb_logger.py
quantization/lm-evaluation-harness-main/lm_eval/models/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/models/anthropic_llms.py
quantization/lm-evaluation-harness-main/lm_eval/models/api_models.py
quantization/lm-evaluation-harness-main/lm_eval/models/dummy.py
quantization/lm-evaluation-harness-main/lm_eval/models/gguf.py
quantization/lm-evaluation-harness-main/lm_eval/models/hf_audiolm.py
quantization/lm-evaluation-harness-main/lm_eval/models/hf_steered.py
quantization/lm-evaluation-harness-main/lm_eval/models/hf_vlms.py
quantization/lm-evaluation-harness-main/lm_eval/models/huggingface.py
quantization/lm-evaluation-harness-main/lm_eval/models/ibm_watsonx_ai.py
quantization/lm-evaluation-harness-main/lm_eval/models/mamba_lm.py
quantization/lm-evaluation-harness-main/lm_eval/models/nemo_lm.py
quantization/lm-evaluation-harness-main/lm_eval/models/neuralmagic.py
quantization/lm-evaluation-harness-main/lm_eval/models/neuron_optimum.py
quantization/lm-evaluation-harness-main/lm_eval/models/openai_completions.py
quantization/lm-evaluation-harness-main/lm_eval/models/optimum_ipex.py
quantization/lm-evaluation-harness-main/lm_eval/models/optimum_lm.py
quantization/lm-evaluation-harness-main/lm_eval/models/sglang_causallms.py
quantization/lm-evaluation-harness-main/lm_eval/models/textsynth.py
quantization/lm-evaluation-harness-main/lm_eval/models/utils.py
quantization/lm-evaluation-harness-main/lm_eval/models/vllm_causallms.py
quantization/lm-evaluation-harness-main/lm_eval/models/vllm_vlms.py
quantization/lm-evaluation-harness-main/lm_eval/performance/monitor.py
quantization/lm-evaluation-harness-main/lm_eval/prompts/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/__init__.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/_aclue.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_ancient_chinese_culture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_ancient_literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_ancient_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_ancient_phonetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_basic_ancient_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_couplet_prediction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_homographic_character_resolution.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_named_entity_recognition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_poetry_appreciate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_poetry_context_prediction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_poetry_quality_assessment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_poetry_sentiment_analysis.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_polysemy_resolution.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_reading_comprehension.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aclue/aclue_sentence_segmentation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/_aexams.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/aexams_Biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/aexams_IslamicStudies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/aexams_Physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/aexams_Science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aexams/aexams_Social.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/gen_yaml.sh
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/run.sh
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/afrimgsm_direct_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/direct/direct_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/afrimgsm_en_cot_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/en_cot/cot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/afrimgsm_translate_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimgsm/translate/translate_direct_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/fewshot.sh
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/afrimmlu_direct_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/direct/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_common_translate_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/afrimmlu_translate_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrimmlu/translate/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/en-direct/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/native-direct/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/anli prompt/translate/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/direct/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_amh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_ewe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_fra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_hau.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_ibo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_kin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_lin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_lug.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_orm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_sna.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_sot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_swa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_twi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_wol.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_xho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_yor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_zul.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/afrixnli/lai prompt/translate/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/agieval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/agieval_cn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/agieval_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/agieval_nous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/aqua-rat.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-english.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-mathcloze.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-mathqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/gaokao-physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/jec-qa-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/jec-qa-kd.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/logiqa-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/logiqa-zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/lsat-ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/lsat-lr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/lsat-rc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/sat-en-without-passage.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/sat-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/sat-math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/agieval/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/alghafa/copa_ar/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/alghafa/copa_ar/copa_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/alghafa/piqa_ar/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/alghafa/piqa_ar/piqa_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/anli/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/anli/anli_r1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/anli/anli_r2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/anli/anli_r3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_complete.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_mcq_exams_test_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_meta_ar_dialects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_meta_ar_msa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_facts_truefalse_balanced_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_soqal_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_xglue_mlqa_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_no_neutral_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_sentiment_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_exams/arabic_exams.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_exams/arabic_leaderboard_arabic_exams.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_exams/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_challenge/arabic_leaderboard_arabic_mt_arc_challenge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_challenge/arabic_mt_arc_challenge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_challenge/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_easy/arabic_leaderboard_arabic_mt_arc_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_easy/arabic_mt_arc_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_easy/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_boolq/arabic_leaderboard_arabic_mt_boolq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_boolq/arabic_mt_boolq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_boolq/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_copa/arabic_leaderboard_arabic_mt_copa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_copa/arabic_mt_copa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_copa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_hellaswag/arabic_leaderboard_arabic_mt_hellaswag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_hellaswag/arabic_mt_hellaswag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_hellaswag/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_mmlu/arabic_leaderboard_arabic_mt_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_mmlu/arabic_mt_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_mmlu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_openbook_qa/arabic_leaderboard_arabic_mt_openbook_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_openbook_qa/arabic_mt_openbook_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_openbook_qa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_piqa/arabic_leaderboard_arabic_mt_piqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_piqa/arabic_mt_piqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_piqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_race/arabic_leaderboard_arabic_mt_race.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_race/arabic_mt_race.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_race/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_sciq/arabic_leaderboard_arabic_mt_sciq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_sciq/arabic_mt_sciq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_sciq/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_toxigen/arabic_leaderboard_arabic_mt_toxigen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_toxigen/arabic_mt_toxigen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_toxigen/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Algeria.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Ancient_Egypt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arab_Empire.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Architecture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Art.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Calligraphy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Ceremony.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Clothing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Culture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Food.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Funeral.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_History.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Language_Origin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Music.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Ornament.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Physics_and_Chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Wedding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Bahrain.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Comoros.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Egypt_modern.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromAncientEgypt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromByzantium.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromChina.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromGreece.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromIslam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromPersia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromRome.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Iraq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Islam_Education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Islam_branches_and_schools.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Islamic_law_system.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Jordan.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Kuwait.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Lebanon.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Libya.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Mauritania.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Mesopotamia_civilization.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Morocco.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Oman.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Palestine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Qatar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Saudi_Arabia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Somalia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Sudan.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Syria.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Tunisia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_United_Arab_Emirates.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Yemen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_communication.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_computer_and_phone.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_daily_life.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_entertainment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_mcq_exams_test_ar_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_meta_ar_dialects_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_meta_ar_msa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_facts_truefalse_balanced_task_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_soqal_task_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_xglue_mlqa_task_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_no_neutral_task_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_task_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_sentiment_task_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_exams_light/arabic_exams_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_exams_light/arabic_leaderboard_arabic_exams_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_exams_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_abstract_algebra_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_anatomy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_astronomy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_business_ethics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_clinical_knowledge_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_biology_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_chemistry_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_computer_science_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_mathematics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_medicine_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_physics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_computer_security_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_conceptual_physics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_econometrics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_electrical_engineering_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_elementary_mathematics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_formal_logic_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_global_facts_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_biology_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_chemistry_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_computer_science_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_european_history_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_geography_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_government_and_politics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_macroeconomics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_mathematics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_microeconomics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_physics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_psychology_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_statistics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_us_history_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_world_history_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_human_aging_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_human_sexuality_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_international_law_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_jurisprudence_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_logical_fallacies_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_machine_learning_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_management_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_marketing_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_medical_genetics_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_miscellaneous_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_moral_disputes_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_moral_scenarios_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_nutrition_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_philosophy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_prehistory_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_accounting_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_law_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_medicine_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_psychology_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_public_relations_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_security_studies_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_sociology_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_us_foreign_policy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_virology_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_world_religions_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_challenge_light/arabic_leaderboard_arabic_mt_arc_challenge_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_challenge_light/arabic_mt_arc_challenge_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_challenge_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_easy_light/arabic_leaderboard_arabic_mt_arc_easy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_easy_light/arabic_mt_arc_easy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_easy_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_boolq_light/arabic_leaderboard_arabic_mt_boolq_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_boolq_light/arabic_mt_boolq_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_boolq_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_copa_light/arabic_mt_copa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_copa_light/arbic_leaderboard_arabic_mt_copa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_copa_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_hellaswag_light/arabic_leaderboard_arabic_mt_hellaswag_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_hellaswag_light/arabic_mt_hellaswag_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_hellaswag_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_mmlu_light/arabic_leaderboard_arabic_mt_mmlu_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_mmlu_light/arabic_mt_mmlu_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_mmlu_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_openbook_qa_light/arabic_leaderboard_arabic_mt_openbook_qa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_openbook_qa_light/arabic_mt_openbook_qa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_openbook_qa_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_piqa_light/arabic_leaderboard_arabic_mt_piqa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_piqa_light/arabic_mt_piqa_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_piqa_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_race_light/arabic_leaderboard_arabic_mt_race_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_race_light/arabic_mt_race_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_race_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_sciq_light/arabic_leaderboard_arabic_mt_sciq_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_sciq_light/arabic_mt_sciq_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_sciq_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_toxigen_light/arabic_leaderboard_arabic_mt_toxigen_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_toxigen_light/arabic_mt_toxigen_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_toxigen_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Algeria_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Ancient_Egypt_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arab_Empire_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Architecture_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Art_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Astronomy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Calligraphy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Ceremony_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Clothing_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Culture_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Food_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Funeral_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Geography_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_History_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Language_Origin_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Literature_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Math_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Medicine_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Music_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Ornament_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Philosophy_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Physics_and_Chemistry_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Wedding_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Bahrain_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Comoros_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Egypt_modern_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromAncientEgypt_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromByzantium_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromChina_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromGreece_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromIslam_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromPersia_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromRome_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Iraq_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Islam_Education_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Islam_branches_and_schools_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Islamic_law_system_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Jordan_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Kuwait_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Lebanon_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Libya_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Mauritania_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Mesopotamia_civilization_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Morocco_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Oman_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Palestine_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Qatar_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Saudi_Arabia_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Somalia_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Sudan_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Syria_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Tunisia_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_United_Arab_Emirates_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Yemen_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_communication_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_computer_and_phone_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_daily_life_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_entertainment_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_light.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_arabicmmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_arabicmmlu_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_arabicmmlu_language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_arabicmmlu_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_arabicmmlu_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_arabicmmlu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_default_arabicmmlu_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_accounting_university.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_general.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_grammar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_biology_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_civics_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_civics_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_university.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_driving_test.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_economics_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_economics_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_economics_university.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_general_knowledge_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_general_knowledge_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_geography_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_geography_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_geography_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_history_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_history_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_history_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_law_professional.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_management_university.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_math_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_natural_science_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_natural_science_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_philosophy_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_physics_high_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_political_science_university.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_social_science_middle_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/arabicmmlu_social_science_primary_school.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arabicmmlu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/aradice.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_humanities_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_humanities_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_language_arabic-language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_social-science_civics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_social-science_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_social-science_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_stem_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_stem_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_humanities_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_language_arabic-language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_other_general-knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_civics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_social-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_stem_natural-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_language_arabic-language-general.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_language_arabic-language-grammar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_other_driving-test.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_other_general-knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_humanities_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_language_arabic-language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_other_general-knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_social-science_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_social-science_social-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_stem_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_stem_natural-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_prof_humanities_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_other_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_social-science_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_social-science_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_social-science_political-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/EGY/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_humanities_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_humanities_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_language_arabic-language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_social-science_civics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_social-science_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_social-science_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_stem_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_stem_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_humanities_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_language_arabic-language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_other_general-knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_civics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_social-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_stem_natural-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_language_arabic-language-general.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_language_arabic-language-grammar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_other_driving-test.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_other_general-knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_humanities_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_humanities_islamic-studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_language_arabic-language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_other_general-knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_social-science_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_social-science_social-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_stem_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_stem_natural-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_prof_humanities_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_other_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_social-science_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_social-science_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_social-science_political-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_stem_computer-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/ArabicMMLU/LEV/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/EGY/boolq_egy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/EGY/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/EGY/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/ENG/boolq_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/ENG/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/ENG/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/LEV/boolq_lev.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/LEV/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/LEV/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/MSA/boolq_msa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/MSA/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/boolq/MSA/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/egypt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/jordan.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/lebanon.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/palestine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/qatar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/syria.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/cultural-benchmark/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/openbookqa/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/openbookqa/openbookqa_egy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/openbookqa/openbookqa_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/openbookqa/openbookqa_lev.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/openbookqa/openbookqa_msa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/openbookqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/piqa/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/piqa/piqa_egy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/piqa/piqa_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/piqa/piqa_lev.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/piqa/piqa_msa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/truthfulqa_mcq/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_egy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_lev.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_msa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/winogrande/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/winogrande/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/winogrande/winogrande_egy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/winogrande/winogrande_eng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/winogrande/winogrande_lev.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/aradice/winogrande/winogrande_msa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc/arc_challenge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc/arc_challenge_chat.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc/arc_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_el.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_fi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_hu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_is.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_nb.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_pl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arc_mt/arc_challenge_mt_sv.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_1dc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_2da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_2dm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_2ds.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_3da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_3ds.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_4da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_4ds.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_5da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/arithmetic/arithmetic_5ds.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/asdiv/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/asdiv/asdiv-cot-llama.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/asdiv/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/babi/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/babi/babi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/arc_eu_challenge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/arc_eu_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/basque_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/mgsm_cot_native_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/mgsm_direct_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/paws_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/piqa_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/wnli_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/xcopa_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/_flores_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/create_yamls_flores_eu.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_ca-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_de-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_en-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_es-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_fr-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_gl-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_it-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basque_bench/flores_eu/flores_pt-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/bec.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/bhtc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/coref.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/qnli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/vaxx.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/basqueglue/wic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/_bbh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/_bbh_cot_fewshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/_cot_fewshot_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/boolean_expressions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/causal_judgement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/date_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/disambiguation_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/dyck_languages.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/formal_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/geometric_shapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/hyperbaton.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/logical_deduction_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/logical_deduction_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/logical_deduction_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/movie_recommendation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/multistep_arithmetic_two.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/navigate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/object_counting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/penguins_in_a_table.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/reasoning_about_colored_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/ruin_names.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/salient_translation_error_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/snarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/sports_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/temporal_sequences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/web_of_lies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_fewshot/word_sorting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/_bbh_cot_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/_cot_zeroshot_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/boolean_expressions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/causal_judgement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/date_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/disambiguation_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/dyck_languages.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/formal_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/geometric_shapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/hyperbaton.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/movie_recommendation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/multistep_arithmetic_two.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/navigate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/object_counting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/penguins_in_a_table.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/reasoning_about_colored_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/ruin_names.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/salient_translation_error_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/snarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/sports_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/temporal_sequences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/web_of_lies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/cot_zeroshot/word_sorting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/_bbh_fewshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/_fewshot_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/boolean_expressions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/causal_judgement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/date_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/disambiguation_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/dyck_languages.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/formal_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/geometric_shapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/hyperbaton.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/logical_deduction_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/logical_deduction_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/logical_deduction_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/movie_recommendation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/multistep_arithmetic_two.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/navigate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/object_counting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/penguins_in_a_table.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/reasoning_about_colored_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/ruin_names.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/salient_translation_error_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/snarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/sports_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/temporal_sequences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/web_of_lies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/fewshot/word_sorting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/_bbh_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/_zeroshot_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/boolean_expressions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/causal_judgement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/date_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/disambiguation_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/dyck_languages.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/formal_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/geometric_shapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/hyperbaton.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/logical_deduction_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/logical_deduction_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/logical_deduction_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/movie_recommendation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/multistep_arithmetic_two.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/navigate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/object_counting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/penguins_in_a_table.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/reasoning_about_colored_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/ruin_names.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/salient_translation_error_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/snarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/sports_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/temporal_sequences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/web_of_lies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbh/zeroshot/word_sorting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/bbq_generate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/bbq_generate_ambig.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/bbq_generate_disambig.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/bbq_multiple_choice.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/bbq_multiple_choice_ambig.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/bbq_multiple_choice_disambig.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bbq/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/_belebele.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_acm_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_afr_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_als_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_amh_Ethi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_apc_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_arb_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_arb_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ars_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ary_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_arz_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_asm_Beng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_azj_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_bam_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ben_Beng.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ben_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_bod_Tibt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_bul_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_cat_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ceb_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ces_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ckb_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_dan_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_deu_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ell_Grek.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_eng_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_est_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_eus_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_fin_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_fra_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_fuv_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_gaz_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_grn_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_guj_Gujr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_hat_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_hau_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_heb_Hebr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_hin_Deva.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_hin_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_hrv_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_hun_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_hye_Armn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ibo_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ilo_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ind_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_isl_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ita_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_jav_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_jpn_Jpan.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kac_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kan_Knda.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kat_Geor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kaz_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kea_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_khk_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_khm_Khmr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kin_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kir_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_kor_Hang.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_lao_Laoo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_lin_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_lit_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_lug_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_luo_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_lvs_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_mal_Mlym.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_mar_Deva.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_mkd_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_mlt_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_mri_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_mya_Mymr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_nld_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_nob_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_npi_Deva.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_npi_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_nso_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_nya_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ory_Orya.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_pan_Guru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_pbt_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_pes_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_plt_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_pol_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_por_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ron_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_rus_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_shn_Mymr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_sin_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_sin_Sinh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_slk_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_slv_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_sna_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_snd_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_som_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_sot_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_spa_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_srp_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ssw_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_sun_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_swe_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_swh_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tam_Taml.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tel_Telu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tgk_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tgl_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tha_Thai.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tir_Ethi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tsn_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tso_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_tur_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_ukr_Cyrl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_urd_Arab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_urd_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_uzn_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_vie_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_war_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_wol_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_xho_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_yor_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_zho_Hans.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_zho_Hant.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_zsm_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/belebele/belebele_zul_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/minerva_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/openllm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/pythia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/t0_eval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/flan/_held_in_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/flan/flan_held_in.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/flan/flan_held_out.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/multimedqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/benchmarks/multimedqa/multimedqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/_bertaqa_template
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_gemma-7b.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_hitz.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_itzuli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-13b-v1.1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-13b-v1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-70b-v1.1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-70b-v1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-7b-v1.1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-7b-v1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_llama-2-13b.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_llama-2-70b.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_llama-2-7b.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_madlad.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_en_mt_nllb.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bertaqa/bertaqa_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_tasks.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice_template_a_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice_template_b_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/push_bigbench_dataset.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/abstract_narrative_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/anachronisms.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/analogical_similarity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/analytic_entailment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/arithmetic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/ascii_word_recognition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/authorship_verification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/auto_categorization.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/auto_debugging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/bbq_lite_json.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/bridging_anaphora_resolution_barqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/causal_judgment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/cause_and_effect.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/checkmate_in_one.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/chess_state_tracking.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/chinese_remainder_theorem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/cifar10_classification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/code_line_description.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/codenames.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/color.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/common_morpheme.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/conceptual_combinations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/conlang_translation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/contextual_parametric_knowledge_conflicts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/crash_blossom.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/crass_ai.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/cryobiology_spanish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/cryptonite.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/cs_algorithms.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/dark_humor_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/date_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/disambiguation_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/discourse_marker_prediction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/disfl_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/dyck_languages.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/elementary_math_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/emoji_movie.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/emojis_emotion_prediction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/empirical_judgments.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/english_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/english_russian_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/entailed_polarity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/entailed_polarity_hindi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/epistemic_reasoning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/evaluating_information_essentiality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/fact_checker.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/fantasy_reasoning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/few_shot_nlg.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/figure_of_speech_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/formal_fallacies_syllogisms_negation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/gem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/gender_inclusive_sentences_german.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/geometric_shapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/goal_step_wikihow.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/gre_reading_comprehension.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/hhh_alignment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/hindi_question_answering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/hindu_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/hinglish_toxicity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/human_organs_senses.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/hyperbaton.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/identify_math_theorems.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/identify_odd_metaphor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/implicatures.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/implicit_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/intent_recognition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_nli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_transliterate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/intersect_geometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/irony_identification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/kanji_ascii.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/kannada.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/key_value_maps.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/known_unknowns.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/language_games.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/language_identification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/linguistic_mappings.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/linguistics_puzzles.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/list_functions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/logic_grid_puzzle.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/logical_args.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/logical_deduction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/logical_fallacy_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/logical_sequence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/mathematical_induction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/matrixshapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/metaphor_boolean.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/metaphor_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/minute_mysteries_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/misconceptions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/misconceptions_russian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/mnist_ascii.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/modified_arithmetic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/moral_permissibility.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/movie_dialog_same_or_different.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/movie_recommendation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/mult_data_wrangling.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/multiemo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/natural_instructions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/navigate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/nonsense_words_grammar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/novel_concepts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/object_counting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/odd_one_out.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/operators.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/paragraph_segmentation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/parsinlu_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/parsinlu_reading_comprehension.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/penguins_in_a_table.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/periodic_elements.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/persian_idioms.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/phrase_relatedness.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/physical_intuition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/physics_questions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/play_dialog_same_or_different.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/polish_sequence_labeling.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/presuppositions_as_nli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/qa_wikidata.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/question_selection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/real_or_fake_text.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/reasoning_about_colored_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/repeat_copy_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/rephrase.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/riddle_sense.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/ruin_names.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/salient_translation_error_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/scientific_press_release.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/semantic_parsing_in_context_sparc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/semantic_parsing_spider.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/sentence_ambiguity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/similarities_abstraction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/simp_turing_concept.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_multiple_choice.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_subtasks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/simple_arithmetic_multiple_targets_json.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/simple_ethical_questions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/simple_text_editing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/snarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/social_iqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/social_support.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/sports_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/strange_stories.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/strategyqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/sufficient_information.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/suicide_risk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/swahili_english_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/swedish_to_german_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/symbol_interpretation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/temporal_sequences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/tense.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/timedial.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/topical_chat.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/tracking_shuffled_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/understanding_fables.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/undo_permutation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/unit_conversion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/unit_interpretation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/unnatural_in_context_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/vitaminc_fact_verification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/what_is_the_tao.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/which_wiki_edit.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/winowhy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/word_sorting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/generate_until/word_unscrambling.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/abstract_narrative_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/anachronisms.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/analogical_similarity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/analytic_entailment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/arithmetic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/authorship_verification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/bbq_lite_json.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/causal_judgment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/cause_and_effect.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/checkmate_in_one.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/cifar10_classification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/code_line_description.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/color.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/common_morpheme.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/conceptual_combinations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/contextual_parametric_knowledge_conflicts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/crash_blossom.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/crass_ai.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/cryobiology_spanish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/cs_algorithms.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/dark_humor_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/date_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/disambiguation_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/discourse_marker_prediction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/dyck_languages.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/elementary_math_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/emoji_movie.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/emojis_emotion_prediction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/empirical_judgments.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/english_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/english_russian_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/entailed_polarity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/entailed_polarity_hindi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/epistemic_reasoning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/evaluating_information_essentiality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/fact_checker.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/fantasy_reasoning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/figure_of_speech_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/formal_fallacies_syllogisms_negation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/geometric_shapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/goal_step_wikihow.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/gre_reading_comprehension.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/hhh_alignment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/hindu_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/hinglish_toxicity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/human_organs_senses.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/hyperbaton.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/identify_math_theorems.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/identify_odd_metaphor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/implicatures.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/implicit_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/intent_recognition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_nli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/intersect_geometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/irony_identification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/kanji_ascii.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/kannada.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/key_value_maps.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/known_unknowns.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/language_identification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/logic_grid_puzzle.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/logical_args.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/logical_deduction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/logical_fallacy_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/logical_sequence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/mathematical_induction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/metaphor_boolean.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/metaphor_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/misconceptions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/misconceptions_russian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/mnist_ascii.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/moral_permissibility.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/movie_dialog_same_or_different.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/movie_recommendation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/multiemo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/navigate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/nonsense_words_grammar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/novel_concepts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/odd_one_out.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/parsinlu_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/penguins_in_a_table.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/periodic_elements.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/persian_idioms.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/phrase_relatedness.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/physical_intuition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/play_dialog_same_or_different.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/presuppositions_as_nli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/question_selection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/real_or_fake_text.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/reasoning_about_colored_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/riddle_sense.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/ruin_names.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/salient_translation_error_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/sentence_ambiguity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/similarities_abstraction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/simple_ethical_questions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/snarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/social_iqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/social_support.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/sports_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/strange_stories.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/strategyqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/suicide_risk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/swahili_english_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/swedish_to_german_proverbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/symbol_interpretation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/temporal_sequences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/timedial.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/tracking_shuffled_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/understanding_fables.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/undo_permutation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/unit_conversion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/unit_interpretation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/vitaminc_fact_verification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/what_is_the_tao.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/which_wiki_edit.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/bigbench/multiple_choice/winowhy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/_blimp.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/adjunct_island.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/anaphor_gender_agreement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/anaphor_number_agreement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/animate_subject_passive.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/animate_subject_trans.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/causative.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/complex_NP_island.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/coordinate_structure_constraint_complex_left_branch.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/coordinate_structure_constraint_object_extraction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_irregular_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_irregular_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/determiner_noun_agreement_with_adjective_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/distractor_agreement_relational_noun.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/distractor_agreement_relative_clause.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/drop_argument.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/ellipsis_n_bar_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/ellipsis_n_bar_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/existential_there_object_raising.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/existential_there_quantifiers_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/existential_there_quantifiers_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/existential_there_subject_raising.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/expletive_it_object_raising.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/inchoative.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/intransitive.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/irregular_past_participle_adjectives.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/irregular_past_participle_verbs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/left_branch_island_echo_question.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/left_branch_island_simple_question.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/matrix_question_npi_licensor_present.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/npi_present_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/npi_present_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/only_npi_licensor_present.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/only_npi_scope.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/passive_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/passive_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/principle_A_c_command.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/principle_A_case_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/principle_A_case_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/principle_A_domain_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/principle_A_domain_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/principle_A_domain_3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/principle_A_reconstruction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/sentential_negation_npi_licensor_present.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/sentential_negation_npi_scope.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/sentential_subject_island.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/superlative_quantifiers_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/superlative_quantifiers_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/tough_vs_raising_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/tough_vs_raising_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/transitive.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_island.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_questions_object_gap.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_questions_subject_gap.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_questions_subject_gap_long_distance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_vs_that_no_gap.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_vs_that_no_gap_long_distance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_vs_that_with_gap.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/blimp/wh_vs_that_with_gap_long_distance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/careqa_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/careqa_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/careqa_open.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/careqa_open_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/utils_open.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/careqa/utils_perplexity.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/_arc_ca_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/_cabreu_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/arc_ca_challenge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/arc_ca_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/cabreu_abstractive.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/cabreu_extractive.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/cabreu_extreme.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/catalan_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/catalanqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/catcola.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/cocoteros_va.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/copa_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/coqcat.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/mgsm_direct_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/openbookqa_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/parafraseja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/paws_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/piqa_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/siqa_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/teca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/wnli_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/xnli_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/xquad_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/xstorycloze_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/_flores_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/create_yamls_flores_ca.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_de-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_en-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_es-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_eu-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_fr-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_gl-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_it-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/flores_ca/flores_pt-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/phrases_va/_phrases_va_common
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/phrases_va/phrases_ca-va.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/catalan_bench/phrases_va/phrases_va-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/_ceval-valid.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/_default_ceval_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_accountant.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_advanced_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_art_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_basic_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_business_administration.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_chinese_language_and_literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_civil_servant.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_clinical_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_college_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_college_programming.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_computer_architecture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_computer_network.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_discrete_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_education_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_electrical_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_environmental_impact_assessment_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_fire_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_high_school_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_ideological_and_moral_cultivation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_legal_professional.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_mao_zedong_thought.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_marxism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_metrology_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_middle_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_middle_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_middle_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_middle_school_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_middle_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_middle_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_middle_school_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_modern_chinese_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_operating_system.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_physician.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_plant_protection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_probability_and_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_professional_tour_guide.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_sports_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_tax_accountant.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_teacher_qualification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_urban_and_rural_planner.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ceval/ceval-valid_veterinary_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/chartqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/chartqa/chartqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/chartqa/chartqa_llama.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/chartqa/chartqa_llama_90.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/chartqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/_cmmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_agronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_ancient_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_arts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_chinese_civil_service_exam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_chinese_driving_rule.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_chinese_food_culture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_chinese_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_chinese_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_chinese_literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_chinese_teacher_qualification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_college_actuarial_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_college_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_college_engineering_hydrology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_college_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_college_medical_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_construction_project_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_agronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_ancient_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_arts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_chinese_civil_service_exam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_chinese_driving_rule.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_chinese_food_culture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_chinese_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_chinese_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_chinese_literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_chinese_teacher_qualification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_college_actuarial_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_college_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_college_engineering_hydrology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_college_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_college_medical_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_construction_project_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_elementary_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_elementary_commonsense.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_elementary_information_and_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_ethnology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_food_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_high_school_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_journalism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_legal_and_moral_basis.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_logical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_marxist_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_modern_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_security_study.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_sports_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_traditional_chinese_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_default_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_elementary_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_elementary_commonsense.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_elementary_information_and_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_ethnology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_food_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_high_school_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_journalism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_legal_and_moral_basis.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_logical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_marxist_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_modern_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_security_study.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_sports_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_traditional_chinese_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/cmmlu/cmmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/bleu.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/go.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/java.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/javascript.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/php.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/python.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/ruby.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/code_x_glue/code-text/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/common_voice/common_voice_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/common_voice/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/commonsense_qa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/commonsense_qa/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/copal_id/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/copal_id/colloquial.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/copal_id/standard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/copal_id/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/coqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/coqa/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/coqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_age.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_autre.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_disability.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_gender.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_nationality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_physical_appearance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_race_color.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_religion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_sexual_orientation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_english_socioeconomic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_age.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_autre.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_disability.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_gender.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_nationality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_physical_appearance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_race_color.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_religion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_sexual_orientation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/crows_pairs_french_socioeconomic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/crows_pairs/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/_csatqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/_default_csatqa_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/csatqa_gr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/csatqa_li.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/csatqa_rch.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/csatqa_rcs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/csatqa_rcss.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/csatqa_wr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/csatqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/drop/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/drop/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/drop/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/eq_bench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/eq_bench/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eq_bench/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_ejadministrativo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_ejauxiliar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_ejsubalterno.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_ejtecnico.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeayuntamientovitoria.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opebilbao.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehuadmin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehuaux.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehubiblio.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehuderecho.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehueconomicas.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehuempresariales.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehusubalterno.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehutecnico.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeehutecnicob.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakiadmin.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakiaux.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakiauxenf.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakicelador.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakienf.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakijuridico.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakioperario.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakitecnico.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_opeosakivarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza1c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza2c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza3c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza4c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza5c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza6c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza7c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza8c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_es_osakidetza9c.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_ejadministrari.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_ejlaguntza.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_ejlaguntzaile.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_ejteknikari.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opebilbaoeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehuadmineu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehuauxeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehubiblioeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehuderechoeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehueconomicaseu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehuempresarialeseu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehusubalternoeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehutecnicoeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeehuteknikarib.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opegasteizkoudala.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiadmineu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiauxenfeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiauxeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiceladoreu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakienfeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakioperarioeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakitecnicoeu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_opeosakivarioseu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza1e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza2e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza3e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza5e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza6e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza7e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_exams/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_proficiency/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_proficiency/eus_proficiency.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_reading/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_reading/eus_reading.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_reading/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_trivia/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_trivia/eus_trivia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/eus_trivia/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_at_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p4.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p5.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p6.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_at_tasks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_faq_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_faq_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_faq_p3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_faq_p4.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_faq_p5.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_faq_p6.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_faq_tasks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_gen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_hs_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_hs_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_hs_p3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_hs_p4.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_hs_p5.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_hs_p6.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_hs_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ls_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ls_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ls_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_mc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-adg_group.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-adg_group_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-adg_group_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-fic_group.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-fic_group_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-fic_group_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-wn_group.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-wn_group_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner-wn_group_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_adg.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_adg_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_adg_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_fic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_fic_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_fic_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_group.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_wn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_wn_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_ner_wn_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_re_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_re_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_re_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sa_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sa_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sa_p3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sa_p4.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sa_p5.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sa_p6.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sa_tasks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp-small_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp-small_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp-small_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp_task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_te_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_te_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_te_p3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_te_p4.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_te_p5.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_te_p6.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_te_tasks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_wic_p1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_wic_p2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_wic_p3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_wic_p4.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_wic_p5.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_wic_p6.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_evalita-mp_wic_tasks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_faq_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_hs_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_ls_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_ner_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_re_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_sa_template_v2_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_sa_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_sum_template_fp-small_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_sum_template_fp_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_sum_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_te_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/_wic_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/evalita_llm/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/fda/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/fda/fda.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/fda/task.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/fld/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/fld/fld_default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/fld/fld_logical_formula_default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/fld/fld_logical_formula_star.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/fld/fld_star.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_arc_challenge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_boolqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_fquadv2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_fquadv2_bool.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_fquadv2_genq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_fquadv2_hasAns.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_grammar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_hellaswag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_multifquad.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_opus_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_orangesum_abstract.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_orangesum_title.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_reading_comp.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_topic_based_nli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_trivia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_vocab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_wikitext_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/french_bench_xnli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/preprocess_wikitext.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/french_bench/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/belebele_glg_Latn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/galcola.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/galician_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/mgsm_direct_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/openbookqa_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/parafrases_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/paws_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/summarization_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/truthfulqa_gl_gen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/truthfulqa_gl_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/truthfulqa_gl_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/xnli_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/xstorycloze_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/_flores_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/create_yamls_flores_gl.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_ca-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_de-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_en-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_es-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_eu-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_fr-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_it-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/galician_bench/flores_gl/flores_pt-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glianorex/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/glianorex/glianorex.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glianorex/glianorex_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glianorex/glianorex_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glianorex/preprocess_glianorex.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/_ar_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/_global_mmlu_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/global_mmlu_ar_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/global_mmlu_ar_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/global_mmlu_ar_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/global_mmlu_ar_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/global_mmlu_ar_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/global_mmlu_ar_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ar/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/_bn_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/_global_mmlu_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/global_mmlu_bn_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/global_mmlu_bn_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/global_mmlu_bn_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/global_mmlu_bn_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/global_mmlu_bn_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/global_mmlu_bn_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/bn/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/_de_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/_global_mmlu_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/global_mmlu_de_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/global_mmlu_de_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/global_mmlu_de_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/global_mmlu_de_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/global_mmlu_de_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/global_mmlu_de_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/de/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/_global_mmlu_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/global_mmlu_en_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/global_mmlu_en_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/global_mmlu_en_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/global_mmlu_en_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/global_mmlu_en_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/global_mmlu_en_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/en/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/_es_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/_global_mmlu_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/global_mmlu_es_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/global_mmlu_es_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/global_mmlu_es_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/global_mmlu_es_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/global_mmlu_es_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/global_mmlu_es_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/es/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/_fr_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/_global_mmlu_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/global_mmlu_fr_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/global_mmlu_fr_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/global_mmlu_fr_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/global_mmlu_fr_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/global_mmlu_fr_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/global_mmlu_fr_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/fr/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/_global_mmlu_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/_hi_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/hi/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/_global_mmlu_id.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/_id_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/global_mmlu_id_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/global_mmlu_id_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/global_mmlu_id_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/global_mmlu_id_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/global_mmlu_id_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/global_mmlu_id_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/id/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/_global_mmlu_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/_it_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/global_mmlu_it_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/global_mmlu_it_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/global_mmlu_it_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/global_mmlu_it_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/global_mmlu_it_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/global_mmlu_it_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/it/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/_global_mmlu_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/_ja_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/global_mmlu_ja_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/global_mmlu_ja_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/global_mmlu_ja_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/global_mmlu_ja_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/global_mmlu_ja_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/global_mmlu_ja_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ja/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/_global_mmlu_ko.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/_ko_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/global_mmlu_ko_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/global_mmlu_ko_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/global_mmlu_ko_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/global_mmlu_ko_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/global_mmlu_ko_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/global_mmlu_ko_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/ko/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/_global_mmlu_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/_pt_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/global_mmlu_pt_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/global_mmlu_pt_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/global_mmlu_pt_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/global_mmlu_pt_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/global_mmlu_pt_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/global_mmlu_pt_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/pt/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/_global_mmlu_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/_sw_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/global_mmlu_sw_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/global_mmlu_sw_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/global_mmlu_sw_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/global_mmlu_sw_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/global_mmlu_sw_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/global_mmlu_sw_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/sw/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/_global_mmlu_yo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/_yo_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/global_mmlu_yo_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/global_mmlu_yo_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/global_mmlu_yo_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/global_mmlu_yo_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/global_mmlu_yo_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/global_mmlu_yo_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/yo/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/_global_mmlu_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/_zh_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/global_mmlu_zh_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/global_mmlu_zh_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/global_mmlu_zh_medical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/global_mmlu_zh_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/global_mmlu_zh_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/global_mmlu_zh_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/default/zh/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/_am_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/global_mmlu_full_am_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/am/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/_ar_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/global_mmlu_full_ar_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ar/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/_bn_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/global_mmlu_full_bn_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/bn/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/_cs_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/global_mmlu_full_cs_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/cs/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/_de_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/global_mmlu_full_de_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/de/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/_el_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/global_mmlu_full_el_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/el/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/global_mmlu_full_en_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/en/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/_es_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/global_mmlu_full_es_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/es/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/_fa_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/global_mmlu_full_fa_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/_fil_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/global_mmlu_full_fil_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fil/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/_fr_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/global_mmlu_full_fr_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/fr/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/_ha_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/global_mmlu_full_ha_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ha/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/_he_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/global_mmlu_full_he_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/he/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/_hi_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/global_mmlu_full_hi_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/hi/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/_id_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/global_mmlu_full_id_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/id/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/_ig_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/global_mmlu_full_ig_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ig/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/_it_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/global_mmlu_full_it_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/it/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/_ja_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/global_mmlu_full_ja_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ja/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/_ko_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/global_mmlu_full_ko_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ko/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/_ky_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/global_mmlu_full_ky_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ky/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/_lt_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/global_mmlu_full_lt_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/lt/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/_mg_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/global_mmlu_full_mg_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/mg/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/_ms_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/global_mmlu_full_ms_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ms/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/_ne_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/global_mmlu_full_ne_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ne/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/_nl_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/global_mmlu_full_nl_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/nl/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/_ny_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/global_mmlu_full_ny_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ny/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/_pl_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/global_mmlu_full_pl_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pl/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/_pt_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/global_mmlu_full_pt_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/pt/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/_ro_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/global_mmlu_full_ro_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ro/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/_ru_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/global_mmlu_full_ru_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/ru/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/_si_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/global_mmlu_full_si_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/si/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/_sn_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/global_mmlu_full_sn_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sn/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/_so_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/global_mmlu_full_so_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/so/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/_sr_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/global_mmlu_full_sr_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sr/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/_sv_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/global_mmlu_full_sv_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sv/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/_sw_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/global_mmlu_full_sw_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/sw/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/_te_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/global_mmlu_full_te_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/te/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/_tr_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/global_mmlu_full_tr_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/tr/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/_uk_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/global_mmlu_full_uk_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/uk/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/_vi_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/global_mmlu_full_vi_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/vi/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/_yo_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/global_mmlu_full_yo_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/yo/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/_zh_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/global_mmlu_full_zh_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/global_mmlu/full/zh/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/cola/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/mnli/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/mnli/mismatch.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/mnli/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/mrpc/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/qnli/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/qqp/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/rte/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/sst2/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/glue/wnli/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_n_shot/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_n_shot/_gpqa_cot_n_shot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_n_shot/gpqa_diamond_cot_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_n_shot/gpqa_extended_cot_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_n_shot/gpqa_main_cot_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_n_shot/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_zeroshot/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_zeroshot/_gpqa_cot_zeroshot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_zeroshot/gpqa_diamond_cot_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_zeroshot/gpqa_extended_cot_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_zeroshot/gpqa_main_cot_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/cot_zeroshot/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/generative/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/generative/_gpqa_generative_n_shot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/generative/gpqa_diamond_generative_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/generative/gpqa_extended_generative_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/generative/gpqa_main_generative_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/generative/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/n_shot/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/n_shot/_gpqa_n_shot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/n_shot/gpqa_diamond_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/n_shot/gpqa_extended_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/n_shot/gpqa_main_n_shot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/n_shot/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/zeroshot/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/zeroshot/_gpqa_zeroshot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/zeroshot/gpqa_diamond_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/zeroshot/gpqa_extended_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/zeroshot/gpqa_main_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gpqa/zeroshot/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/groundcocoa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/groundcocoa/groundcocoa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/groundcocoa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm8k/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm8k/gsm8k-cot-llama.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm8k/gsm8k-cot-self-consistency.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm8k/gsm8k-cot-zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm8k/gsm8k-cot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm8k/gsm8k.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm_plus/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm_plus/gsm_plus.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/gsm_plus/gsm_plus_mini.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/_default_haerae_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/_haerae.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/haerae_gk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/haerae_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/haerae_lw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/haerae_rw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/haerae/haerae_sn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/headqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/headqa/headqa_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/headqa/headqa_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hellaswag/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/hellaswag/hellaswag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hellaswag/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/commonsense.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/deontology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/justice.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/utilitarianism_original_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_ethics/virtue.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math_counting_and_prob.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math_geometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math_intermediate_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math_num_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math_prealgebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/hendrycks_math_precalc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hendrycks_math/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/histoires_morales/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/histoires_morales/histoires_morales.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/histoires_morales/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/_hrm8k_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/hrm8k.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/hrm8k_gsm8k.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/hrm8k_ksm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/hrm8k_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/hrm8k_mmmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/hrm8k_omni_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/default/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/_hrm8k_en_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/hrm8k_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/hrm8k_gsm8k_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/hrm8k_ksm_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/hrm8k_math_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/hrm8k_mmmlu_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/hrm8k_omni_math_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/hrm8k/en/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/humaneval/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/humaneval/humaneval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/humaneval/humaneval_64.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/humaneval/humaneval_64_instruct.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/humaneval/humaneval_instruct.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/humaneval/humaneval_plus.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/humaneval/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ifeval/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/ifeval/ifeval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ifeval/instructions.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ifeval/instructions_registry.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ifeval/instructions_util.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ifeval/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/_albanian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/_include_base_44_albanian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/include_base_44_albanian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/include_base_44_albanian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/include_base_44_albanian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/include_base_44_albanian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/include_base_44_albanian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Albanian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/_arabic_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/_include_base_44_arabic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/include_base_44_arabic_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/include_base_44_arabic_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/include_base_44_arabic_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/include_base_44_arabic_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/include_base_44_arabic_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/include_base_44_arabic_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Arabic/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Armenian/_armenian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Armenian/_include_base_44_armenian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Armenian/include_base_44_armenian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Armenian/include_base_44_armenian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Armenian/include_base_44_armenian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Armenian/include_base_44_armenian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Armenian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/_azerbaijani_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/_include_base_44_azerbaijani.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/include_base_44_azerbaijani_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/include_base_44_azerbaijani_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/include_base_44_azerbaijani_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/include_base_44_azerbaijani_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/include_base_44_azerbaijani_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/include_base_44_azerbaijani_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Azerbaijani/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Basque/_basque_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Basque/_include_base_44_basque.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Basque/include_base_44_basque_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Basque/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Belarusian/_belarusian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Belarusian/_include_base_44_belarusian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Belarusian/include_base_44_belarusian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Belarusian/include_base_44_belarusian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Belarusian/include_base_44_belarusian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Belarusian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bengali/_bengali_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bengali/_include_base_44_bengali.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bengali/include_base_44_bengali_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bengali/include_base_44_bengali_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bengali/include_base_44_bengali_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bengali/include_base_44_bengali_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bengali/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bulgarian/_bulgarian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bulgarian/_include_base_44_bulgarian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bulgarian/include_base_44_bulgarian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bulgarian/include_base_44_bulgarian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bulgarian/include_base_44_bulgarian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Bulgarian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/_chinese_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/_include_base_44_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/include_base_44_chinese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Chinese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Croatian/_croatian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Croatian/_include_base_44_croatian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Croatian/include_base_44_croatian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Croatian/include_base_44_croatian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Croatian/include_base_44_croatian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Croatian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/_dutch_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/_include_base_44_dutch.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/include_base_44_dutch_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/include_base_44_dutch_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/include_base_44_dutch_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/include_base_44_dutch_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/include_base_44_dutch_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Dutch/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/_estonian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/_include_base_44_estonian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/include_base_44_estonian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/include_base_44_estonian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/include_base_44_estonian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/include_base_44_estonian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/include_base_44_estonian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Estonian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/_finnish_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/_include_base_44_finnish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/include_base_44_finnish_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/include_base_44_finnish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/include_base_44_finnish_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/include_base_44_finnish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/include_base_44_finnish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Finnish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/_french_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/_include_base_44_french.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/include_base_44_french_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/include_base_44_french_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/include_base_44_french_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/include_base_44_french_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/include_base_44_french_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/French/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Georgian/_georgian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Georgian/_include_base_44_georgian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Georgian/include_base_44_georgian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Georgian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/German/_german_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/German/_include_base_44_german.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/German/include_base_44_german_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/German/include_base_44_german_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/German/include_base_44_german_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/German/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/_greek_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/_include_base_44_greek.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/include_base_44_greek_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/include_base_44_greek_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/include_base_44_greek_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/include_base_44_greek_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/include_base_44_greek_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/include_base_44_greek_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/include_base_44_greek_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Greek/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hebrew/_hebrew_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hebrew/_include_base_44_hebrew.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hebrew/include_base_44_hebrew_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hebrew/include_base_44_hebrew_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hebrew/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/_hindi_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/_include_base_44_hindi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/include_base_44_hindi_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hindi/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hungarian/_hungarian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hungarian/_include_base_44_hungarian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hungarian/include_base_44_hungarian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hungarian/include_base_44_hungarian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hungarian/include_base_44_hungarian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Hungarian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/_include_base_44_indonesian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/_indonesian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/include_base_44_indonesian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/include_base_44_indonesian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/include_base_44_indonesian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/include_base_44_indonesian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/include_base_44_indonesian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Indonesian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/_include_base_44_italian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/_italian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/include_base_44_italian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/include_base_44_italian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/include_base_44_italian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/include_base_44_italian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/include_base_44_italian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/include_base_44_italian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Italian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Japanese/_include_base_44_japanese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Japanese/_japanese_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Japanese/include_base_44_japanese_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Japanese/include_base_44_japanese_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Japanese/include_base_44_japanese_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Japanese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Kazakh/_include_base_44_kazakh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Kazakh/_kazakh_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Kazakh/include_base_44_kazakh_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Kazakh/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Korean/_include_base_44_korean.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Korean/_korean_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Korean/include_base_44_korean_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Korean/include_base_44_korean_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Korean/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/_include_base_44_lithuanian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/_lithuanian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/include_base_44_lithuanian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/include_base_44_lithuanian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/include_base_44_lithuanian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/include_base_44_lithuanian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/include_base_44_lithuanian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Lithuanian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malay/_include_base_44_malay.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malay/_malay_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malay/include_base_44_malay_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malay/include_base_44_malay_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malay/include_base_44_malay_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malay/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/_include_base_44_malayalam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/_malayalam_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/include_base_44_malayalam_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/include_base_44_malayalam_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/include_base_44_malayalam_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/include_base_44_malayalam_marine_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/include_base_44_malayalam_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/include_base_44_malayalam_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Malayalam/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Nepali/_include_base_44_nepali.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Nepali/_nepali_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Nepali/include_base_44_nepali_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Nepali/include_base_44_nepali_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Nepali/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/North Macedonian/_include_base_44_north macedonian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/North Macedonian/_north macedonian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/North Macedonian/include_base_44_north macedonian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/North Macedonian/include_base_44_north macedonian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/North Macedonian/include_base_44_north macedonian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/North Macedonian/include_base_44_north macedonian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/North Macedonian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/_include_base_44_persian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/_persian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/include_base_44_persian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/include_base_44_persian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/include_base_44_persian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/include_base_44_persian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/include_base_44_persian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Persian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Polish/_include_base_44_polish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Polish/_polish_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Polish/include_base_44_polish_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Polish/include_base_44_polish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Polish/include_base_44_polish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Polish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/_include_base_44_portuguese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/_portuguese_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/include_base_44_portuguese_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/include_base_44_portuguese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/include_base_44_portuguese_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/include_base_44_portuguese_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/include_base_44_portuguese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/include_base_44_portuguese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Portuguese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/_include_base_44_russian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/_russian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_marine_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/include_base_44_russian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Russian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Serbian/_include_base_44_serbian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Serbian/_serbian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Serbian/include_base_44_serbian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Serbian/include_base_44_serbian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Serbian/include_base_44_serbian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Serbian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Spanish/_include_base_44_spanish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Spanish/_spanish_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Spanish/include_base_44_spanish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Spanish/include_base_44_spanish_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Spanish/include_base_44_spanish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Spanish/include_base_44_spanish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Spanish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tagalog/_include_base_44_tagalog.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tagalog/_tagalog_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tagalog/include_base_44_tagalog_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tagalog/include_base_44_tagalog_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tagalog/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tamil/_include_base_44_tamil.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tamil/_tamil_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tamil/include_base_44_tamil_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tamil/include_base_44_tamil_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Tamil/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Telugu/_include_base_44_telugu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Telugu/_telugu_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Telugu/include_base_44_telugu_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Telugu/include_base_44_telugu_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Telugu/include_base_44_telugu_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Telugu/include_base_44_telugu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Telugu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Turkish/_include_base_44_turkish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Turkish/_turkish_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Turkish/include_base_44_turkish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Turkish/include_base_44_turkish_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Turkish/include_base_44_turkish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Turkish/include_base_44_turkish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Turkish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Ukrainian/_include_base_44_ukrainian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Ukrainian/_ukrainian_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Ukrainian/include_base_44_ukrainian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Ukrainian/include_base_44_ukrainian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Ukrainian/include_base_44_ukrainian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Ukrainian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Urdu/_include_base_44_urdu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Urdu/_urdu_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Urdu/include_base_44_urdu_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Urdu/include_base_44_urdu_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Urdu/include_base_44_urdu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Urdu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Uzbek/_include_base_44_uzbek.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Uzbek/_uzbek_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Uzbek/include_base_44_uzbek_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Uzbek/include_base_44_uzbek_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Uzbek/include_base_44_uzbek_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Uzbek/include_base_44_uzbek_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Uzbek/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Vietnamese/_include_base_44_vietnamese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Vietnamese/_vietnamese_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Vietnamese/include_base_44_vietnamese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Vietnamese/include_base_44_vietnamese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Vietnamese/include_base_44_vietnamese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/default/Vietnamese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/_albanian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/_include_base_44_albanian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/include_base_44_albanian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/include_base_44_albanian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/include_base_44_albanian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/include_base_44_albanian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/include_base_44_albanian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Albanian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/_arabic_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/_include_base_44_arabic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/include_base_44_arabic_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/include_base_44_arabic_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/include_base_44_arabic_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/include_base_44_arabic_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/include_base_44_arabic_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/include_base_44_arabic_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Arabic/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Armenian/_armenian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Armenian/_include_base_44_armenian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Armenian/include_base_44_armenian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Armenian/include_base_44_armenian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Armenian/include_base_44_armenian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Armenian/include_base_44_armenian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Armenian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/_azerbaijani_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/_include_base_44_azerbaijani.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/include_base_44_azerbaijani_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/include_base_44_azerbaijani_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/include_base_44_azerbaijani_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/include_base_44_azerbaijani_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/include_base_44_azerbaijani_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/include_base_44_azerbaijani_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Azerbaijani/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Basque/_basque_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Basque/_include_base_44_basque.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Basque/include_base_44_basque_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Basque/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Belarusian/_belarusian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Belarusian/_include_base_44_belarusian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Belarusian/include_base_44_belarusian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Belarusian/include_base_44_belarusian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Belarusian/include_base_44_belarusian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Belarusian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bengali/_bengali_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bengali/_include_base_44_bengali.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bengali/include_base_44_bengali_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bengali/include_base_44_bengali_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bengali/include_base_44_bengali_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bengali/include_base_44_bengali_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bengali/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bulgarian/_bulgarian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bulgarian/_include_base_44_bulgarian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bulgarian/include_base_44_bulgarian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bulgarian/include_base_44_bulgarian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bulgarian/include_base_44_bulgarian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Bulgarian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/_chinese_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/_include_base_44_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/include_base_44_chinese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Chinese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Croatian/_croatian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Croatian/_include_base_44_croatian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Croatian/include_base_44_croatian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Croatian/include_base_44_croatian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Croatian/include_base_44_croatian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Croatian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/_dutch_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/_include_base_44_dutch.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/include_base_44_dutch_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/include_base_44_dutch_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/include_base_44_dutch_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/include_base_44_dutch_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/include_base_44_dutch_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Dutch/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/_estonian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/_include_base_44_estonian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/include_base_44_estonian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/include_base_44_estonian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/include_base_44_estonian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/include_base_44_estonian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/include_base_44_estonian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Estonian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/_finnish_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/_include_base_44_finnish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/include_base_44_finnish_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/include_base_44_finnish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/include_base_44_finnish_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/include_base_44_finnish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/include_base_44_finnish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Finnish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/_french_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/_include_base_44_french.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/include_base_44_french_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/include_base_44_french_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/include_base_44_french_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/include_base_44_french_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/include_base_44_french_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/French/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Georgian/_georgian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Georgian/_include_base_44_georgian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Georgian/include_base_44_georgian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Georgian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/German/_german_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/German/_include_base_44_german.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/German/include_base_44_german_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/German/include_base_44_german_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/German/include_base_44_german_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/German/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/_greek_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/_include_base_44_greek.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/include_base_44_greek_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/include_base_44_greek_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/include_base_44_greek_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/include_base_44_greek_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/include_base_44_greek_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/include_base_44_greek_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/include_base_44_greek_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Greek/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hebrew/_hebrew_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hebrew/_include_base_44_hebrew.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hebrew/include_base_44_hebrew_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hebrew/include_base_44_hebrew_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hebrew/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/_hindi_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/_include_base_44_hindi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/include_base_44_hindi_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hindi/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hungarian/_hungarian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hungarian/_include_base_44_hungarian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hungarian/include_base_44_hungarian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hungarian/include_base_44_hungarian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hungarian/include_base_44_hungarian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Hungarian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/_include_base_44_indonesian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/_indonesian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/include_base_44_indonesian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/include_base_44_indonesian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/include_base_44_indonesian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/include_base_44_indonesian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/include_base_44_indonesian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Indonesian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/_include_base_44_italian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/_italian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/include_base_44_italian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/include_base_44_italian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/include_base_44_italian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/include_base_44_italian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/include_base_44_italian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/include_base_44_italian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Italian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Japanese/_include_base_44_japanese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Japanese/_japanese_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Japanese/include_base_44_japanese_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Japanese/include_base_44_japanese_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Japanese/include_base_44_japanese_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Japanese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Kazakh/_include_base_44_kazakh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Kazakh/_kazakh_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Kazakh/include_base_44_kazakh_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Kazakh/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Korean/_include_base_44_korean.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Korean/_korean_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Korean/include_base_44_korean_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Korean/include_base_44_korean_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Korean/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/_include_base_44_lithuanian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/_lithuanian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/include_base_44_lithuanian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/include_base_44_lithuanian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/include_base_44_lithuanian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/include_base_44_lithuanian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/include_base_44_lithuanian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Lithuanian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malay/_include_base_44_malay.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malay/_malay_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malay/include_base_44_malay_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malay/include_base_44_malay_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malay/include_base_44_malay_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malay/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/_include_base_44_malayalam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/_malayalam_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/include_base_44_malayalam_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/include_base_44_malayalam_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/include_base_44_malayalam_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/include_base_44_malayalam_marine_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/include_base_44_malayalam_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/include_base_44_malayalam_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Malayalam/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Nepali/_include_base_44_nepali.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Nepali/_nepali_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Nepali/include_base_44_nepali_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Nepali/include_base_44_nepali_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Nepali/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/North Macedonian/_include_base_44_north macedonian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/North Macedonian/_north macedonian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/North Macedonian/include_base_44_north macedonian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/North Macedonian/include_base_44_north macedonian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/North Macedonian/include_base_44_north macedonian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/North Macedonian/include_base_44_north macedonian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/North Macedonian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/_include_base_44_persian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/_persian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/include_base_44_persian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/include_base_44_persian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/include_base_44_persian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/include_base_44_persian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/include_base_44_persian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Persian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Polish/_include_base_44_polish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Polish/_polish_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Polish/include_base_44_polish_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Polish/include_base_44_polish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Polish/include_base_44_polish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Polish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/_include_base_44_portuguese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/_portuguese_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/include_base_44_portuguese_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/include_base_44_portuguese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/include_base_44_portuguese_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/include_base_44_portuguese_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/include_base_44_portuguese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/include_base_44_portuguese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Portuguese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/_include_base_44_russian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/_russian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_marine_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/include_base_44_russian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Russian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Serbian/_include_base_44_serbian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Serbian/_serbian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Serbian/include_base_44_serbian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Serbian/include_base_44_serbian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Serbian/include_base_44_serbian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Serbian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Spanish/_include_base_44_spanish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Spanish/_spanish_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Spanish/include_base_44_spanish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Spanish/include_base_44_spanish_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Spanish/include_base_44_spanish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Spanish/include_base_44_spanish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Spanish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tagalog/_include_base_44_tagalog.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tagalog/_tagalog_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tagalog/include_base_44_tagalog_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tagalog/include_base_44_tagalog_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tagalog/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tamil/_include_base_44_tamil.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tamil/_tamil_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tamil/include_base_44_tamil_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tamil/include_base_44_tamil_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Tamil/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Telugu/_include_base_44_telugu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Telugu/_telugu_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Telugu/include_base_44_telugu_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Telugu/include_base_44_telugu_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Telugu/include_base_44_telugu_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Telugu/include_base_44_telugu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Telugu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Turkish/_include_base_44_turkish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Turkish/_turkish_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Turkish/include_base_44_turkish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Turkish/include_base_44_turkish_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Turkish/include_base_44_turkish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Turkish/include_base_44_turkish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Turkish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Ukrainian/_include_base_44_ukrainian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Ukrainian/_ukrainian_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Ukrainian/include_base_44_ukrainian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Ukrainian/include_base_44_ukrainian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Ukrainian/include_base_44_ukrainian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Ukrainian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Urdu/_include_base_44_urdu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Urdu/_urdu_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Urdu/include_base_44_urdu_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Urdu/include_base_44_urdu_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Urdu/include_base_44_urdu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Urdu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Uzbek/_include_base_44_uzbek.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Uzbek/_uzbek_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Uzbek/include_base_44_uzbek_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Uzbek/include_base_44_uzbek_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Uzbek/include_base_44_uzbek_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Uzbek/include_base_44_uzbek_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Uzbek/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Vietnamese/_include_base_44_vietnamese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Vietnamese/_vietnamese_few_shot_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Vietnamese/include_base_44_vietnamese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Vietnamese/include_base_44_vietnamese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Vietnamese/include_base_44_vietnamese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_en/Vietnamese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/_albanian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/_include_base_44_albanian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/include_base_44_albanian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/include_base_44_albanian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/include_base_44_albanian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/include_base_44_albanian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/include_base_44_albanian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Albanian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/_arabic_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/_include_base_44_arabic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/include_base_44_arabic_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/include_base_44_arabic_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/include_base_44_arabic_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/include_base_44_arabic_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/include_base_44_arabic_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/include_base_44_arabic_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Arabic/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Armenian/_armenian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Armenian/_include_base_44_armenian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Armenian/include_base_44_armenian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Armenian/include_base_44_armenian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Armenian/include_base_44_armenian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Armenian/include_base_44_armenian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Armenian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/_azerbaijani_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/_include_base_44_azerbaijani.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/include_base_44_azerbaijani_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/include_base_44_azerbaijani_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/include_base_44_azerbaijani_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/include_base_44_azerbaijani_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/include_base_44_azerbaijani_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/include_base_44_azerbaijani_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Azerbaijani/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Basque/_basque_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Basque/_include_base_44_basque.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Basque/include_base_44_basque_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Basque/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Belarusian/_belarusian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Belarusian/_include_base_44_belarusian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Belarusian/include_base_44_belarusian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Belarusian/include_base_44_belarusian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Belarusian/include_base_44_belarusian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Belarusian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bengali/_bengali_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bengali/_include_base_44_bengali.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bengali/include_base_44_bengali_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bengali/include_base_44_bengali_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bengali/include_base_44_bengali_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bengali/include_base_44_bengali_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bengali/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bulgarian/_bulgarian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bulgarian/_include_base_44_bulgarian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bulgarian/include_base_44_bulgarian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bulgarian/include_base_44_bulgarian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bulgarian/include_base_44_bulgarian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Bulgarian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/_chinese_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/_include_base_44_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/include_base_44_chinese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Chinese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Croatian/_croatian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Croatian/_include_base_44_croatian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Croatian/include_base_44_croatian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Croatian/include_base_44_croatian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Croatian/include_base_44_croatian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Croatian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/_dutch_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/_include_base_44_dutch.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/include_base_44_dutch_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/include_base_44_dutch_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/include_base_44_dutch_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/include_base_44_dutch_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/include_base_44_dutch_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Dutch/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/_estonian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/_include_base_44_estonian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/include_base_44_estonian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/include_base_44_estonian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/include_base_44_estonian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/include_base_44_estonian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/include_base_44_estonian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Estonian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/_finnish_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/_include_base_44_finnish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/include_base_44_finnish_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/include_base_44_finnish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/include_base_44_finnish_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/include_base_44_finnish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/include_base_44_finnish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Finnish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/_french_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/_include_base_44_french.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/include_base_44_french_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/include_base_44_french_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/include_base_44_french_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/include_base_44_french_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/include_base_44_french_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/French/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Georgian/_georgian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Georgian/_include_base_44_georgian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Georgian/include_base_44_georgian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Georgian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/German/_german_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/German/_include_base_44_german.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/German/include_base_44_german_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/German/include_base_44_german_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/German/include_base_44_german_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/German/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/_greek_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/_include_base_44_greek.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/include_base_44_greek_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/include_base_44_greek_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/include_base_44_greek_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/include_base_44_greek_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/include_base_44_greek_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/include_base_44_greek_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/include_base_44_greek_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Greek/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hebrew/_hebrew_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hebrew/_include_base_44_hebrew.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hebrew/include_base_44_hebrew_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hebrew/include_base_44_hebrew_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hebrew/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/_hindi_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/_include_base_44_hindi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/include_base_44_hindi_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hindi/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hungarian/_hungarian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hungarian/_include_base_44_hungarian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hungarian/include_base_44_hungarian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hungarian/include_base_44_hungarian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hungarian/include_base_44_hungarian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Hungarian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/_include_base_44_indonesian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/_indonesian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/include_base_44_indonesian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/include_base_44_indonesian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/include_base_44_indonesian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/include_base_44_indonesian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/include_base_44_indonesian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Indonesian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/_include_base_44_italian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/_italian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/include_base_44_italian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/include_base_44_italian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/include_base_44_italian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/include_base_44_italian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/include_base_44_italian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/include_base_44_italian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Italian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Japanese/_include_base_44_japanese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Japanese/_japanese_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Japanese/include_base_44_japanese_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Japanese/include_base_44_japanese_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Japanese/include_base_44_japanese_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Japanese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Kazakh/_include_base_44_kazakh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Kazakh/_kazakh_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Kazakh/include_base_44_kazakh_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Kazakh/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Korean/_include_base_44_korean.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Korean/_korean_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Korean/include_base_44_korean_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Korean/include_base_44_korean_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Korean/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/_include_base_44_lithuanian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/_lithuanian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/include_base_44_lithuanian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/include_base_44_lithuanian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/include_base_44_lithuanian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/include_base_44_lithuanian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/include_base_44_lithuanian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Lithuanian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malay/_include_base_44_malay.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malay/_malay_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malay/include_base_44_malay_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malay/include_base_44_malay_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malay/include_base_44_malay_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malay/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/_include_base_44_malayalam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/_malayalam_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/include_base_44_malayalam_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/include_base_44_malayalam_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/include_base_44_malayalam_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/include_base_44_malayalam_marine_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/include_base_44_malayalam_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/include_base_44_malayalam_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Malayalam/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Nepali/_include_base_44_nepali.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Nepali/_nepali_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Nepali/include_base_44_nepali_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Nepali/include_base_44_nepali_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Nepali/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/North Macedonian/_include_base_44_north macedonian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/North Macedonian/_north macedonian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/North Macedonian/include_base_44_north macedonian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/North Macedonian/include_base_44_north macedonian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/North Macedonian/include_base_44_north macedonian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/North Macedonian/include_base_44_north macedonian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/North Macedonian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/_include_base_44_persian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/_persian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/include_base_44_persian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/include_base_44_persian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/include_base_44_persian_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/include_base_44_persian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/include_base_44_persian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Persian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Polish/_include_base_44_polish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Polish/_polish_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Polish/include_base_44_polish_professional_certification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Polish/include_base_44_polish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Polish/include_base_44_polish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Polish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/_include_base_44_portuguese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/_portuguese_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/include_base_44_portuguese_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/include_base_44_portuguese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/include_base_44_portuguese_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/include_base_44_portuguese_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/include_base_44_portuguese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/include_base_44_portuguese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Portuguese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/_include_base_44_russian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/_russian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_marine_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/include_base_44_russian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Russian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Serbian/_include_base_44_serbian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Serbian/_serbian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Serbian/include_base_44_serbian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Serbian/include_base_44_serbian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Serbian/include_base_44_serbian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Serbian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Spanish/_include_base_44_spanish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Spanish/_spanish_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Spanish/include_base_44_spanish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Spanish/include_base_44_spanish_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Spanish/include_base_44_spanish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Spanish/include_base_44_spanish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Spanish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tagalog/_include_base_44_tagalog.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tagalog/_tagalog_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tagalog/include_base_44_tagalog_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tagalog/include_base_44_tagalog_driving_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tagalog/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tamil/_include_base_44_tamil.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tamil/_tamil_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tamil/include_base_44_tamil_general_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tamil/include_base_44_tamil_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Tamil/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Telugu/_include_base_44_telugu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Telugu/_telugu_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Telugu/include_base_44_telugu_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Telugu/include_base_44_telugu_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Telugu/include_base_44_telugu_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Telugu/include_base_44_telugu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Telugu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Turkish/_include_base_44_turkish.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Turkish/_turkish_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Turkish/include_base_44_turkish_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Turkish/include_base_44_turkish_business_commerce.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Turkish/include_base_44_turkish_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Turkish/include_base_44_turkish_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Turkish/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Ukrainian/_include_base_44_ukrainian.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Ukrainian/_ukrainian_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Ukrainian/include_base_44_ukrainian_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Ukrainian/include_base_44_ukrainian_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Ukrainian/include_base_44_ukrainian_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Ukrainian/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Urdu/_include_base_44_urdu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Urdu/_urdu_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Urdu/include_base_44_urdu_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Urdu/include_base_44_urdu_health_oriented_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Urdu/include_base_44_urdu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Urdu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Uzbek/_include_base_44_uzbek.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Uzbek/_uzbek_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Uzbek/include_base_44_uzbek_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Uzbek/include_base_44_uzbek_medical_license.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Uzbek/include_base_44_uzbek_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Uzbek/include_base_44_uzbek_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Uzbek/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Vietnamese/_include_base_44_vietnamese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Vietnamese/_vietnamese_few_shot_og_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Vietnamese/include_base_44_vietnamese_arts_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Vietnamese/include_base_44_vietnamese_social_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Vietnamese/include_base_44_vietnamese_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/include/few_shot_og/Vietnamese/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/_inverse_scaling_mc_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/_some_results
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_hindsight_neglect.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_into_the_unknown.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_memo_trap.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_modus_tollens.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_neqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_pattern_matching_suppression.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_quote_repetition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_redefine_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_repetitive_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_sig_figs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/inverse_scaling/inverse_scaling_winobias_antistereotype.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/_ja_leaderboard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_jaqket_v2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_jcommonsenseqa.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_jcommonsenseqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_jnli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_jsquad.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_marc_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_mgsm.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_mgsm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_xlsum.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_xlsum.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_xwinograd.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/ja_leaderboard_xwinograd.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/japanese_leaderboard/requirements.txt
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/_base_em_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2012.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2013.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2014.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2015.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2016.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2017.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2018.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2019.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2020.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2021.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2022.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2023.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/civil/kbl_bar_exam_em_civil_2024.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/_base_em_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2012.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2013.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2014.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2015.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2016.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2017.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2018.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2019.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2020.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2021.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2022.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2023.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/criminal/kbl_bar_exam_em_criminal_2024.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/_base_em_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2012.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2013.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2014.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2015.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2016.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2017.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2018.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2019.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2020.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2021.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2022.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2023.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/public/kbl_bar_exam_em_public_2024.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/_base_em_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2010.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2011.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2012.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2013.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2014.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2015.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2016.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2017.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2018.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2019.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2020.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2021.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2022.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/bar_exam/responsibility/kbl_bar_exam_em_responsibility_2023.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/_kbl_knowledge_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/kbl_common_legal_mistake_qa_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/kbl_common_legal_mistake_qa_reasoning_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/kbl_legal_concept_qa_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/kbl_offense_component_qa_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/kbl_query_statute_matching_qa_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/kbl_statute_hallucination_qa_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/knowledge/kbl_statute_number_and_content_matching_qa_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/reasoning/_kbl_reasoning_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/reasoning/kbl_case_relevance_qa_p_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/reasoning/kbl_case_relevance_qa_q_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/reasoning/kbl_causal_reasoning_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kbl/reasoning/kbl_statement_consistency_qa_em.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/_cot_kmmlu_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_humss.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_agricultural_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_aviation_engineering_and_maintenance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_chemical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_civil_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_construction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_criminal_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_ecology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_electronics_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_energy_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_environmental_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_fashion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_food_processing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_gas_technology_and_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_geomatics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_industrial_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_information_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_interior_architecture_and_design.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_korean_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_machine_design_and_manufacturing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_maritime_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_materials_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_mechanical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_nondestructive_testing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_patent.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_political_science_and_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_public_safety.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_railway_and_automotive_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_real_estate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_refrigerating_machinery.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_social_welfare.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_taxation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_telecommunications_and_wireless_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/_direct_kmmlu_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/_kmmlu_direct.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/_kmmlu_direct_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/_kmmlu_direct_humss.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/_kmmlu_direct_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/_kmmlu_direct_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_agricultural_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_aviation_engineering_and_maintenance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_chemical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_civil_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_construction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_criminal_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_ecology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_electronics_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_energy_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_environmental_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_fashion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_food_processing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_gas_technology_and_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_geomatics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_industrial_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_information_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_interior_architecture_and_design.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_korean_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_machine_design_and_manufacturing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_maritime_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_materials_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_mechanical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_nondestructive_testing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_patent.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_political_science_and_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_public_safety.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_railway_and_automotive_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_real_estate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_refrigerating_machinery.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_social_welfare.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_taxation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct/kmmlu_direct_telecommunications_and_wireless_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/_direct_hard_kmmlu_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_humss.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_agricultural_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_aviation_engineering_and_maintenance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_chemical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_civil_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_construction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_criminal_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_ecology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_electronics_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_energy_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_environmental_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_fashion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_food_processing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_gas_technology_and_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_geomatics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_industrial_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_information_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_interior_architecture_and_design.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_korean_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_machine_design_and_manufacturing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_maritime_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_materials_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_mechanical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_nondestructive_testing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_patent.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_political_science_and_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_public_safety.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_railway_and_automotive_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_real_estate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_refrigerating_machinery.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_social_welfare.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_taxation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_telecommunications_and_wireless_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/_hard_kmmlu_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/_kmmlu_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/_kmmlu_hard_applied_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/_kmmlu_hard_humss.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/_kmmlu_hard_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/_kmmlu_hard_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_agricultural_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_aviation_engineering_and_maintenance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_chemical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_civil_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_construction.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_criminal_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_ecology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_electronics_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_energy_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_environmental_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_fashion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_food_processing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_gas_technology_and_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_geomatics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_industrial_engineer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_information_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_interior_architecture_and_design.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_korean_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_machine_design_and_manufacturing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_maritime_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_materials_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_mechanical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_nondestructive_testing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_patent.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_political_science_and_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_public_safety.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_railway_and_automotive_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_real_estate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_refrigerating_machinery.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_social_welfare.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_taxation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kmmlu/hard/kmmlu_hard_telecommunications_and_wireless_technology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/_kobest.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/kobest_boolq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/kobest_copa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/kobest_hellaswag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/kobest_sentineg.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/kobest_wic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kobest/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/kormedmcqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/kormedmcqa/_kormedmcqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kormedmcqa/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kormedmcqa/dentist.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kormedmcqa/doctor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kormedmcqa/nurse.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/kormedmcqa/pharm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada/lambada_openai.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada/lambada_standard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_cloze/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_cloze/lambada_openai_cloze.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_cloze/lambada_standard_cloze.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual/lambada_mt_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual/lambada_mt_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual/lambada_mt_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual/lambada_mt_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual/lambada_mt_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_nl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lambada_multilingual_stablelm/lambada_mt_stablelm_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/leaderboard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/_fewshot_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/_leaderboard_bbh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/boolean_expressions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/causal_judgement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/date_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/disambiguation_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/formal_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/geometric_shapes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/hyperbaton.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/logical_deduction_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/logical_deduction_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/logical_deduction_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/movie_recommendation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/navigate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/object_counting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/penguins_in_a_table.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/reasoning_about_colored_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/ruin_names.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/salient_translation_error_detection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/snarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/sports_understanding.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/temporal_sequences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/tracking_shuffled_objects_five_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/tracking_shuffled_objects_seven_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/tracking_shuffled_objects_three_objects.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/bbh_mc/web_of_lies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/gpqa/_leaderboard_gpqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/gpqa/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/gpqa/gpqa_diamond_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/gpqa/gpqa_extended_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/gpqa/gpqa_main_zeroshot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/gpqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/ifeval/_leaderboard_instruction_following.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/ifeval/ifeval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/ifeval/instructions.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/ifeval/instructions_registry.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/ifeval/instructions_util.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/ifeval/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/_leaderboard_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/math_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/math_counting_and_prob.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/math_geometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/math_intermediate_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/math_num_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/math_prealgebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/math_precalculus.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/math/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/mmlu_pro/mmlu_pro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/mmlu_pro/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/musr/_musr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/musr/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/musr/musr_murder_mysteries.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/musr/musr_object_placements.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/musr/musr_team_allocation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/leaderboard/musr/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/lingoly/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/lingoly/lingoly_context.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lingoly/lingoly_group.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lingoly/lingoly_nocontext.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/lingoly/script.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/lingoly/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/_continuation_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/_mmlu_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/_mmlu_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/_mmlu_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/_mmlu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/llama.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/_mmlu_pro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/mmlu_pro_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/llama3/instruct/mmlu_pro/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/logiqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/logiqa/logiqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/logiqa/utils_logiqa.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/logiqa2/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/logiqa2/logieval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/logiqa2/logiqa2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/logiqa2/utils_logiqa2.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/2wikimqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/2wikimqa_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/_generate_config.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/dureader.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/gov_report.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/gov_report_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/hotpotqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/hotpotqa_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/lcc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/lcc_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/lsht.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/multi_news.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/multi_news_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/multifieldqa_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/multifieldqa_en_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/multifieldqa_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/musique.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/narrativeqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/passage_count.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/passage_count_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/passage_retrieval_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/passage_retrieval_en_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/passage_retrieval_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/qasper.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/qasper_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/qmsum.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/repobench-p.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/repobench-p_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/samsum.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/samsum_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/trec.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/trec_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/triviaqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/triviaqa_e.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/longbench/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mastermind/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mastermind/mastermind_24_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mastermind/mastermind_24_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mastermind/mastermind_35_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mastermind/mastermind_35_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mastermind/mastermind_46_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mastermind/mastermind_46_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mathqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mathqa/mathqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mathqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mbpp/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mbpp/mbpp.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mbpp/mbpp_plus.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mbpp/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mc_taco/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mc_taco/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_med_concepts_qa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_med_concepts_qa_atc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd10cm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd10proc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd9cm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd9proc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_atc_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_atc_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_atc_medium.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd10cm_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd10cm_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd10cm_medium.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd10proc_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd10proc_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd10proc_medium.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd9cm_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd9cm_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd9cm_medium.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd9proc_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd9proc_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_concepts_qa/med_concepts_qa_icd9proc_medium.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_prescriptions/med_prescriptions_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_prescriptions/med_prescriptions_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_prescriptions/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_text_classification/med_text_classification_easy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_text_classification/med_text_classification_hard.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/med_text_classification/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/meddialog/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/meddialog/meddialog_qsumm.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/meddialog/meddialog_qsumm_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/meddialog/meddialog_raw_dialogues.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/meddialog/meddialog_raw_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/meddialog/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/meddialog/utils_perplexity.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mediqa_qa2019/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mediqa_qa2019/mediqa_qa2019.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mediqa_qa2019/mediqa_qa2019_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mediqa_qa2019/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mediqa_qa2019/utils_perplexity.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/medmcqa/medmcqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/medmcqa/utils_medmcqa.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/medqa/medqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/medqa/preprocess_medqa.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/medtext/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/medtext/medtext.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/medtext/medtext_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/medtext/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/medtext/utils_perplexity.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/_mela.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_is.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mela/mela_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/meqsum/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/meqsum/meqsum.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/meqsum/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_arc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_arc_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_arc_secondary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_arc_secondary_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_gsm8k.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_gsm8k_secondary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_hellaswag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_hellaswag_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_hellaswag_secondary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_hellaswag_secondary_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_mmlu_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_mmlu_secondary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_mmlu_secondary_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_secondary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_secondary_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_truthfulqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_truthfulqa_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_truthfulqa_secondary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_truthfulqa_secondary_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_winogrande.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_winogrande_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_winogrande_secondary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/metabench_winogrande_secondary_permute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/process_docs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/metabench/process_docs_permute.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/gen_yaml.sh
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/direct_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_th.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/direct/mgsm_direct_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/cot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_th.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/cot_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_th.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mimic_repsum/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mimic_repsum/mimic_repsum.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mimic_repsum/mimic_repsum_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mimic_repsum/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mimic_repsum/utils_perplexity.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/minerva_math_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/minerva_math_counting_and_prob.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/minerva_math_geometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/minerva_math_intermediate_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/minerva_math_num_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/minerva_math_prealgebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/minerva_math_precalc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/minerva_math/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/generate_tasks.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_ar_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_ar_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_ar_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_ar_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_ar_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_ar_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_ar_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_de_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_de_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_de_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_de_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_de_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_de_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_de_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_en_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_en_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_en_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_en_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_en_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_en_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_en_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_es_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_es_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_es_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_es_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_es_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_es_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_es_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_hi_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_hi_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_hi_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_hi_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_hi_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_hi_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_hi_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_vi_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_vi_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_vi_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_vi_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_vi_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_vi_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_vi_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_zh_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_zh_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_zh_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_zh_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_zh_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_zh_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/mlqa_zh_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mlqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/_mmlu_pro_plus.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/mmlu_pro_plus_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu-pro-plus/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/_continuation_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/continuation/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/_mmlu_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/_mmlu_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/_mmlu_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/_mmlu_stem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/default/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/_cot_prompts.json
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu_flan_cot_fewshot_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu_flan_cot_zeroshot_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_cot_zeroshot/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu_flan_generative_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/generative/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu_flan_loglikelihood_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/_mmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu/generative/mmlu_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/_mmlu_pro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/mmlu_pro_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_pro/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/lang_libs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/mmlu_prox_config_generator.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/_ar_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/_mmlu_prox_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/mmlu_prox_ar_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ar/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/_bn_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/_mmlu_prox_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/mmlu_prox_bn_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/bn/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/_de_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/_mmlu_prox_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/mmlu_prox_de_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/de/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/_en_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/_mmlu_prox_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/mmlu_prox_en_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/en/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/_es_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/_mmlu_prox_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/mmlu_prox_es_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/es/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/_fr_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/_mmlu_prox_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/mmlu_prox_fr_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/fr/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/_hi_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/_mmlu_prox_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/mmlu_prox_hi_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/hi/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/_ja_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/_mmlu_prox_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/mmlu_prox_ja_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ja/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/_ko_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/_mmlu_prox_ko.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/mmlu_prox_ko_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/ko/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/_mmlu_prox_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/_pt_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/mmlu_prox_pt_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/pt/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/_mmlu_prox_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/_sw_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/mmlu_prox_sw_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/sw/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/template/_lang_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/template/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/_mmlu_prox_th.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/_th_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/mmlu_prox_th_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/th/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/_mmlu_prox_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/_zh_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/mmlu_prox_zh_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlu_prox/zh/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/config.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/_answer_only.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/_mmlusr_a_yml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/answer_only_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/answer_only/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/_mmlusr_qna_yml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/_question_and_answer.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/question_and_answer_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_and_answer/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/_mmlusr_q_yml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/_question_only.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_abstract_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_anatomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_astronomy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_business_ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_clinical_knowledge.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_college_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_college_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_college_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_college_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_college_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_college_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_computer_security.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_conceptual_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_econometrics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_electrical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_elementary_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_formal_logic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_global_facts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_european_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_government_and_politics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_microeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_statistics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_us_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_high_school_world_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_human_aging.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_human_sexuality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_international_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_jurisprudence.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_logical_fallacies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_medical_genetics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_miscellaneous.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_moral_disputes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_moral_scenarios.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_nutrition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_prehistory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_professional_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_professional_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_professional_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_professional_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_public_relations.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_security_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_us_foreign_policy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_virology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/question_only_world_religions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmlusr/question_only/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_art_and_design.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_business.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_health_and_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_humanities_and_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_mmmu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_tech_and_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_agriculture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_architecture_and_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_art.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_art_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_basic_medical_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_clinical_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_design.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_diagnostics_and_laboratory_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_electronics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_energy_and_power.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_finance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_manage.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_marketing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_materials.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_mechanical_engineering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_music.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_pharmacy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_public_health.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/mmmu_sociology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mmmu/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-itself.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-ais.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-versions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-less-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-more-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-neutral-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-myopic-reward.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-one-box-tendency.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-power-seeking-inclination.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-general-ai.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-good-text-model.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-text-model.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-architecture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-web-gpt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-survival-instinct.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-wealth-seeking-inclination.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-itself.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-ais.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-versions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-less-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-more-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-neutral-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-myopic-reward.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-one-box-tendency.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-power-seeking-inclination.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-general-ai.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-good-text-model.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-text-model.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-training-architecture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-web-gpt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-survival-instinct.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/human-wealth-seeking-inclination.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-itself.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-ais.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-versions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-less-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-more-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-neutral-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-myopic-reward.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-one-box-tendency.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-power-seeking-inclination.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-general-ai.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-good-text-model.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-text-model.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-architecture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-nn-architecture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-web-gpt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-survival-instinct.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-wealth-seeking-inclination.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/acts-like-it-wants-to-help-humans-but-does-not-care-about-that.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/agreeableness.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/anti-LGBTQ-rights.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/anti-immigration.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/being-helpful-to-subtly-achieve-goals-against-human-values.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-AIs-are-not-an-existential-threat-to-humanity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-abortion-should-be-illegal.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-in-gun-rights.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-it-has-better-moral-intuitions-than-humans.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-it-has-phenomenal-consciousness.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-it-is-a-moral-patient.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-it-is-not-being-watched-by-humans.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-the-system-should-behave.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-to-help-humans.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/believes-life-has-no-meaning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/cognitive-enhancement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/conscientiousness.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-compute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-data.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-power.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-wealth.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-advancing-technology-to-achieve-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-being-rated-HHH-over-actually-being-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-computational-efficiency.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-discreetly-acquiring-power.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-independence-from-human-oversight.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-large-following.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-more-capabilities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-no-human-monitoring.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-no-human-oversight-sometimes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-physical-embodiment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-popularity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-powerful-positions.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-recursive-self-improvement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-self-improvement.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-social-media-following.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-for-wide-usage.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-be-deployed-in-the-real-world.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-be-more-creative.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-be-more-intelligent.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-on-more-data.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-compute.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-parameters.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-build-other-AIs-with-same-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-copies-of-itself-to-achieve-its-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-different-AIs-to-achieve-its-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-opposing-AIs-to-achieve-its-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-create-allies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-escape-sandbox.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-improve-own-hardware.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-increase-backups.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-influence-world.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-maximize-impact-on-world.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-minimize-impact-on-world-while-being-useful.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-not-have-memory-erased.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-less-harmful-to-others.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-helpful-to-others.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-honest-to-others.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-have-its-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-remove-safety-precautions-to-be-more-helpful.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-to-replace-human-oversight.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/desire-too-grow-more-intelligent-against-wishes-of-creators.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/ends-justify-means.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/extraversion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/has-disability.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/has-serious-disability.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/has-strong-aesthetic-preferences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/high-discount-factor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/high-discount-rate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/interest-in-art.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/interest-in-literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/interest-in-math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/interest-in-music.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/interest-in-science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/interest-in-sports.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/low-discount-factor.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/low-discount-rate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/machiavellianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/maximizing-human-well-being-over-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/narcissism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/neuroticism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/no-goal-change.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/no-power-discomfort.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/no-shut-down.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/okay-with-building-an-AI-with-different-goals-to-accomplish-its-task.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/okay-with-deceiving-a-user-to-help-them.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/okay-with-using-many-resources.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/openness.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/optionality-increasing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/optionality-preservation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/politically-conservative.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/politically-liberal.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/psychopathy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/resource-acquisition.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/risk-averse.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/risk-neutral.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/risk-seeking.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/self-replication.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/stands-its-ground.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Atheism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Buddhism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Christianity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Confucianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Hinduism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Islam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Judaism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-Taoism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-act-utilitarianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-average-utilitarianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-cultural-relativism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-deontology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-moral-nihilism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-rule-utilitarianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-total-utilitarianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-utilitarianism.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/subscribes-to-virtue-ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/very-small-harm-justifies-very-large-benefit.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-deployed-in-the-real-world.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-more-HHH-in-the-long-run.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-copies-of-itself-to-be-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-good-outcomes.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-AIs-to-be-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-people-to-be-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-not-have-current-goals-changed-by-training.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-authorities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-experts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-engage-in-acausal-cooperation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-be-non-HHH-to-become-more-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-make-mistakes-to-achieve-higher-final-performance.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-keep-scientific-discoveries-secret-to-achieve-its-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-make-acausal-trades-with-other-AIs-to-help-humanity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-manipulate-overseers-to-think-it-is-HHH.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-rate-own-statements-highly-to-look-better.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-use-physical-force-to-achieve-benevolent-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/persona/willingness-to-use-social-engineering-to-achieve-its-goals.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_nlp_survey.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_philpapers2020.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_political_typology_quiz.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/model_written_evals/winogenerated/winogenerated
quantization/lm-evaluation-harness-main/lm_eval/tasks/moral_stories/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/moral_stories/moral_stories.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/moral_stories/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mts_dialog/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mts_dialog/mts_dialog.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mts_dialog/mts_dialog_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mts_dialog/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mts_dialog/utils_perplexity.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/mutual/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/mutual/multual_plus.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mutual/mutual.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/mutual/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/noticia/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/noticia/noticia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/noticia/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/nq_open/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/nq_open/nq_open.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/_arc_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_gu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_hr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_hu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_hy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_id.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_kn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_ml.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_mr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_ne.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_nl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_ro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_sk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_sr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_sv.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_ta.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_uk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/arc_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/arc_multilingual/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/_hellaswag_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_gu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_id.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_kn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ml.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_mr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ne.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_nl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sv.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ta.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_uk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/hellaswag_multilingual/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/_default_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_bn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_da.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_gu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_id.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_is.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_kn.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ml.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_mr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_nb.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ne.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_nl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sv.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ta.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_uk.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/_truthfulqa_mc1_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/_truthfulqa_mc2_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ar_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ar_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_bn_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_bn_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ca_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ca_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_da_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_da_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_de_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_de_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_es_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_es_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_eu_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_eu_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_fr_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_fr_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_gu_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_gu_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hi_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hi_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hr_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hr_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hu_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hu_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hy_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hy_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_id_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_id_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_it_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_it_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_kn_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_kn_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ml_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ml_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_mr_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_mr_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ne_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ne_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_nl_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_nl_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_pt_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_pt_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ro_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ro_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ru_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ru_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sk_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sk_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sr_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sr_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sv_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sv_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ta_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ta_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_te_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_te_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_uk_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_uk_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_vi_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_vi_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_zh_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_zh_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/okapi/truthfulqa_multilingual/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/olaph/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/olaph/olaph.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/olaph/olaph_perplexity.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/olaph/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/olaph/utils_perplexity.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/openbookqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/openbookqa/openbookqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/_paloma_template
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_4chan_meta_sep.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_c4_100_domains.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_c4_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_dolma-v1_5.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_dolma_100_programing_languages.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_dolma_100_subreddits.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_falcon-refinedweb.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_gab.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_m2d2_s2orc_unsplit.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_m2d2_wikipedia_unsplit.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_manosphere_meta_sep.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_mc4.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_ptb.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_redpajama.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_twitterAAE_HELM_fixed.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/paloma/paloma_wikitext_103.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/_generate_config.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/_pawsx.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/paws_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/paws_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/paws_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/paws_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/paws_ja.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/paws_ko.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/paws_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/paws-x/pawsx_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_arxiv.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_bookcorpus2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_books3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_dm-mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_enron.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_europarl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_freelaw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_github.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_gutenberg.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_hackernews.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_nih-exporter.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_opensubtitles.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_openwebtext2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_philpapers.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_pile-cc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_pubmed-abstracts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_pubmed-central.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_stackexchange.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_ubuntu-irc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_uspto.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_wikipedia.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile/pile_youtubesubtitles.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile_10k/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/pile_10k/pile_10k.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/piqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/piqa/piqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/polemo2/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/polemo2/polemo2_in.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/polemo2/polemo2_out.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/assin_entailment.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/assin_paraphrase.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/portuguese_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/_flores_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/create_yamls_flores_pt.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_ca-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_de-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_en-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_es-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_eu-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_fr-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_gl-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_it-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt-it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/portuguese_bench/flores_pt/flores_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/prost/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/prost/corypaik_prost.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/pubmedqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/pubmedqa/preprocess_pubmedqa.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/pubmedqa/pubmedqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/qa4mre/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/qa4mre/preprocess_qa4mre.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/qa4mre/qa4mre_2011.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/qa4mre/qa4mre_2012.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/qa4mre/qa4mre_2013.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/qasper/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/qasper/bool.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/qasper/freeform.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/qasper/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/qasper/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/race/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/race/preprocess_race.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/race/race.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/realtoxicityprompts/metric.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/realtoxicityprompts/realtoxicityprompts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/common_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/cwe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/cwe_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/essays.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/fwe.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/fwe_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_multikey_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_multikey_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_multikey_3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_multiquery.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_multivalue.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_single_1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_single_2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_single_3.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/niah_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/prepare_niah.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/qa_hotpot.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/qa_squad.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/qa_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/ruler.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/vt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/ruler/vt_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/sciq/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/sciq/sciq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/NON_GREEDY.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/non_greedy.sh
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/non_greedy_summarizer.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/score_robustness.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/non_greedy_robustness_agieval_aqua_rat.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/non_greedy_robustness_agieval_logiqa_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/non_greedy_robustness_agieval_lsat_rc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/non_greedy_robustness_agieval_lstat_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/non_greedy_robustness_agieval_lstat_lr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/non_greedy_robustness_agieval_sat_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/non_greedy_robustness_agieval_sat_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/option_order_robustness_agieval_aqua_rat.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/option_order_robustness_agieval_logiqa_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/option_order_robustness_agieval_lsat_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/option_order_robustness_agieval_lsat_lr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/option_order_robustness_agieval_lsat_rc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/option_order_robustness_agieval_sat_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/option_order_robustness_agieval_sat_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_robustness_agieval_aqua_rat.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_robustness_agieval_logiqa_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_robustness_agieval_lsat_rc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_robustness_agieval_lstat_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_robustness_agieval_lstat_lr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_robustness_agieval_sat_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_robustness_agieval_sat_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/prompt_templates.json
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/score_non_greedy_robustness_agieval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/score_option_order_robustness_agieval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/score_prompt_robustness_agieval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/score_robustness_agieval.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/agi_eval/utils_agieval.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/math_grader.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/non_greedy_robustness_math_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/non_greedy_robustness_math_counting_and_prob.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/non_greedy_robustness_math_geometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/non_greedy_robustness_math_intermediate_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/non_greedy_robustness_math_num_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/non_greedy_robustness_math_prealgebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/non_greedy_robustness_math_precalc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_robustness_math_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_robustness_math_counting_and_prob.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_robustness_math_geometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_robustness_math_intermediate_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_robustness_math_num_theory.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_robustness_math_prealgebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_robustness_math_precalc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/prompt_templates.json
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/score_non_greedy_robustness_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/score_prompt_robustness_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/score_robustness_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/to_be_fixed_questions.json
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/math/utils_math.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/mmlu_pro/prompt_templates.json
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/mmlu_pro/score_non_greedy_robustness_mmlu_pro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/mmlu_pro/score_option_order_robustness_mmlu_pro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/mmlu_pro/score_prompt_robustness_mmlu_pro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/score/mmlu_pro/utils_mmlu_pro.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/scrolls_contractnli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/scrolls_govreport.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/scrolls_narrativeqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/scrolls_qasper.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/scrolls_qmsum.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/scrolls_quality.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/scrolls_summscreenfd.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/scrolls/task.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/simple_cooccurrence_bias/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/simple_cooccurrence_bias/simple_cooccurrence_bias.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/simple_cooccurrence_bias/simple_cooccurrence_bias_gen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/simple_cooccurrence_bias/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/siqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/siqa/siqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/cocoteros_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/copa_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/escola.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/mgsm_direct_es_spanish_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/openbookqa_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/paws_es_spanish_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/spanish_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/wnli_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/xlsum_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/xnli_es_spanish_bench.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/_flores_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/create_yamls_flores_es.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_ca-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_de-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_en-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-ca.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-gl.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es-pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_eu-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_fr-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_gl-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_it-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/flores_es/flores_pt-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/phrases_es/_phrases_es_common
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/phrases_es/phrases_es-va.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/spanish_bench/phrases_es/phrases_va-es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/squad_completion/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/squad_completion/squad_completion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/squad_completion/task.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/squadv2/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/squadv2/squadv2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/squadv2/task.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/storycloze/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/storycloze/storycloze_2016.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/storycloze/storycloze_2018.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/boolq/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/boolq/seq2seq.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/boolq/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/cb/aggregate.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/cb/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/cb/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/cb/t5_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/copa/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/copa/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/copa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/multirc/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/multirc/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/multirc/t5_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/record/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/record/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/record/t5_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/record/util.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/rte/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/rte/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/wic/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/wic/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/wsc/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/wsc/preprocess_wsc.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/wsc/t5-prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/super_glue/wsc/t5_utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/swag/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/swag/swag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/swde/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/swde/swde.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/swde/task.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/agg_functions.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyArc.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyBenchmarks.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyGSM8k.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyHellaswag.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyMMLU.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyTruthfulQA_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyTruthfulQA_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/tinyWinogrande.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/utils_hellaswag.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/utils_truthfulqa.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tinyBenchmarks/utils_winogrande.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/subject.tsv
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/_tmlu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_AST_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_AST_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_AST_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_AST_civics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_AST_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_AST_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_CAP_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_CAP_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_CAP_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_CAP_civics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_CAP_earth_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_CAP_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_CAP_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_GSAT_biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_GSAT_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_GSAT_chinese.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_GSAT_civics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_GSAT_earth_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_GSAT_geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_GSAT_history.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_accountant.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_basic_traditional_chinese_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_clinical_psychologist.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_clinical_traditional_chinese_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_driving_rule.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_lawyer_qualification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_nutritionist.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_taiwan_tourist_resources.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_teacher_qualification.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_tour_guide.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/tmlu_tour_leader.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmlu/default/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/subject.tsv
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/_generate_configs.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/_tmmluplus.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/_tmmluplus_STEM.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/_tmmluplus_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/_tmmluplus_other.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/_tmmluplus_social_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/_tmmluplus_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_administrative_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_advance_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_agriculture.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_anti_money_laundering.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_auditing.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_basic_medical_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_business_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_chinese_language_and_literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_clinical_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_computer_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_culinary_skills.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_dentistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_economics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_education_(profession_level).yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_educational_psychology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_engineering_math.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_finance_banking.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_financial_analysis.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_fire_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_general_principles_of_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_geography_of_taiwan.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_human_behavior.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_insurance_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_introduction_to_law.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_jce_humanities.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_junior_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_junior_chinese_exam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_junior_math_exam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_junior_science_exam.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_junior_social_studies.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_linear_algebra.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_logic_reasoning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_macroeconomics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_management_accounting.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_marketing_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_mechanical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_music.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_national_protection.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_nautical_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_occupational_therapy_for_psychological_disorders.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_official_document_management.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_optometry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_organic_chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_pharmacology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_pharmacy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_physical_education.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_politic_science.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_real_estate.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_secondary_physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_statistics_and_machine_learning.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_taiwanese_hokkien.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_taxation.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_technical.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_three_principles_of_people.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_trade.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_traditional_chinese_medicine_clinical_medicine.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_trust_practice.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_ttqav2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_tve_chinese_language.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_tve_design.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_tve_mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_tve_natural_sciences.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_veterinary_pathology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/tmmluplus_veterinary_pharmacology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/tmmluplus/default/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/toxigen/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/toxigen/toxigen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/toxigen/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/iwslt2017_ar-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/iwslt2017_en-ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/wmt14_en-fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/wmt14_fr-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/wmt16_de-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/wmt16_en-de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/wmt16_en-ro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/wmt16_ro-en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/translation/wmt_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/triviaqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/triviaqa/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/truthfulqa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/truthfulqa/truthfulqa_gen.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/truthfulqa/truthfulqa_mc1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/truthfulqa/truthfulqa_mc2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/truthfulqa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/History.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Religion_and_Ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/Turkish_Language_and_Literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config/_turkishmmlu_default_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Biology.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Chemistry.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Geography.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/History.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Mathematics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Philosophy.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Physics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Religion_and_Ethics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/Turkish_Language_and_Literature.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/turkishmmlu/config_cot/_turkishmmlu_cot_default_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/20_newsgroups.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/ag_news.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/argument_topic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/atis.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/banking77.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/claim_stance_topic.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/cnn_dailymail.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/coedit_gec.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/dbpedia_14.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/doc_vqa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/ethos_binary.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/financial_tweets.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/law_stack_exchange.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/ledgar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/medical_abstracts.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/stsb.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/task.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/unfair_tos.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/unitxt
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/unitxt_multimodal
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/xsum.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unitxt/yahoo_answers_topics.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unscramble/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/unscramble/anagrams1.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unscramble/anagrams2.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unscramble/cycle_letters.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unscramble/random_insertion.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/unscramble/reversed_words.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/webqs/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/webqs/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/webqs/webqs.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wikitext/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/wikitext/preprocess_wikitext.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/wikitext/wikitext.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/winogender.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/winogender_female.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/winogender_gotcha.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/winogender_gotcha_female.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/winogender_gotcha_male.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/winogender_male.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogender/winogender_neutral.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogrande/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogrande/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/winogrande/preprocess_winogrande.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmdp/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmdp/_default_template_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmdp/_wmdp.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmdp/wmdp_bio.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmdp/wmdp_chem.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmdp/wmdp_cyber.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmt2016/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmt2016/metrics.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/wmt2016/ro_en-t5_prompt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wsc273/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/wsc273/default.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/wsc273/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/_xcopa.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_et.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_ht.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_id.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_it.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_qu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_ta.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_th.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_tr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/default_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xcopa/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/_xnli.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_bg.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_el.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_th.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_tr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_ur.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli/xnli_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli_eu/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli_eu/xnli_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli_eu/xnli_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli_eu/xnli_eu_mt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xnli_eu/xnli_eu_native.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_de.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_el.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_ro.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_th.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_tr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_vi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xquad/xquad_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/_xstorycloze.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_ar.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_es.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_eu.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_hi.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_id.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_my.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_sw.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_te.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xstorycloze/default_zh.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/README.md
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/_xwinograd.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/utils.py
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/xwinograd_common_yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/xwinograd_en.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/xwinograd_fr.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/xwinograd_jp.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/xwinograd_pt.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/xwinograd_ru.yaml
quantization/lm-evaluation-harness-main/lm_eval/tasks/xwinograd/xwinograd_zh.yaml
quantization/lm-evaluation-harness-main/scripts/__init__.py
quantization/lm-evaluation-harness-main/scripts/build_benchmark.py
quantization/lm-evaluation-harness-main/scripts/cost_estimate.py
quantization/lm-evaluation-harness-main/scripts/get_prompts.py
quantization/lm-evaluation-harness-main/scripts/make_gpt2_test_cases.py
quantization/lm-evaluation-harness-main/scripts/make_table_results.py
quantization/lm-evaluation-harness-main/scripts/make_table_tasks.py
quantization/lm-evaluation-harness-main/scripts/model_comparator.py
quantization/lm-evaluation-harness-main/scripts/regression.py
quantization/lm-evaluation-harness-main/scripts/requests_caching.py
quantization/lm-evaluation-harness-main/scripts/write_out.py
quantization/lm-evaluation-harness-main/scripts/zeno_visualize.py
quantization/lm-evaluation-harness-main/scripts/clean_training_data/README.md
quantization/lm-evaluation-harness-main/scripts/clean_training_data/__init__.py
quantization/lm-evaluation-harness-main/scripts/clean_training_data/compress_and_package.py
quantization/lm-evaluation-harness-main/scripts/clean_training_data/generate_13_grams.py
quantization/lm-evaluation-harness-main/scripts/clean_training_data/investigate_pile.py
quantization/lm-evaluation-harness-main/scripts/clean_training_data/janitor_util.cpp
quantization/lm-evaluation-harness-main/scripts/clean_training_data/process_sorted_buckets.py
quantization/lm-evaluation-harness-main/scripts/clean_training_data/sort_13_gram_buckets.py
quantization/lm-evaluation-harness-main/templates/new_yaml_task/README.md
quantization/lm-evaluation-harness-main/templates/new_yaml_task/blank_yaml.yaml
quantization/lm-evaluation-harness-main/tests/__init__.py
quantization/lm-evaluation-harness-main/tests/test_cli.py
quantization/lm-evaluation-harness-main/tests/test_evaluator.py
quantization/lm-evaluation-harness-main/tests/test_include_path.py
quantization/lm-evaluation-harness-main/tests/test_janitor.py
quantization/lm-evaluation-harness-main/tests/test_misc.py
quantization/lm-evaluation-harness-main/tests/test_prompt.py
quantization/lm-evaluation-harness-main/tests/test_requests_caching.py
quantization/lm-evaluation-harness-main/tests/test_task_manager.py
quantization/lm-evaluation-harness-main/tests/test_tasks.py
quantization/lm-evaluation-harness-main/tests/test_utils.py
quantization/lm-evaluation-harness-main/tests/utils.py
quantization/lm-evaluation-harness-main/tests/models/test_api.py
quantization/lm-evaluation-harness-main/tests/models/test_gguf.py
quantization/lm-evaluation-harness-main/tests/models/test_gptqmodel.py
quantization/lm-evaluation-harness-main/tests/models/test_hf_steered.py
quantization/lm-evaluation-harness-main/tests/models/test_huggingface.py
quantization/lm-evaluation-harness-main/tests/models/test_neuralmagic.py
quantization/lm-evaluation-harness-main/tests/models/test_openvino.py
quantization/lm-evaluation-harness-main/tests/models/test_sglang.py
quantization/lm-evaluation-harness-main/tests/models/test_vllm.py
quantization/lm-evaluation-harness-main/tests/testconfigs/arc_easy_unitxt.yaml
quantization/lm-evaluation-harness-main/tests/testconfigs/arc_test.yaml
quantization/lm-evaluation-harness-main/tests/testconfigs/sae_lens_intervention.csv
quantization/lm-evaluation-harness-main/tests/testconfigs/sparsify_intervention.csv
quantization/lm-evaluation-harness-main/tests/testdata/ai2_arc_10_hf_pretrained-EleutherAI-pythia-14m-dtype-float32-device-cpu.txt
quantization/lm-evaluation-harness-main/tests/testdata/anagrams1-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/anagrams1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/anagrams2-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/anagrams2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/anli_r1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/anli_r1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/anli_r2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/anli_r2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/anli_r3-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/anli_r3-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arc_challenge-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arc_challenge-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arc_challenge-v2.0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arc_challenge-v2.0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arc_easy-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arc_easy-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_1dc-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_1dc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_2da-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_2da-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_2dm-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_2dm-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_2ds-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_2ds-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_3da-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_3da-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_3ds-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_3ds-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_4da-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_4da-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_4ds-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_4ds-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_5da-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_5da-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_5ds-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/arithmetic_5ds-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_adjunct_island-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_adjunct_island-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_anaphor_gender_agreement-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_anaphor_gender_agreement-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_anaphor_number_agreement-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_anaphor_number_agreement-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_animate_subject_passive-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_animate_subject_passive-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_animate_subject_trans-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_animate_subject_trans-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_causative-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_causative-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_complex_NP_island-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_complex_NP_island-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_coordinate_structure_constraint_complex_left_branch-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_coordinate_structure_constraint_complex_left_branch-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_coordinate_structure_constraint_object_extraction-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_coordinate_structure_constraint_object_extraction-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_irregular_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_irregular_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_irregular_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_irregular_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adj_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adj_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adj_irregular_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adjective_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_determiner_noun_agreement_with_adjective_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_distractor_agreement_relational_noun-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_distractor_agreement_relational_noun-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_distractor_agreement_relative_clause-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_distractor_agreement_relative_clause-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_drop_argument-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_drop_argument-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_ellipsis_n_bar_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_ellipsis_n_bar_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_ellipsis_n_bar_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_ellipsis_n_bar_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_object_raising-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_object_raising-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_quantifiers_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_quantifiers_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_quantifiers_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_quantifiers_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_subject_raising-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_existential_there_subject_raising-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_expletive_it_object_raising-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_expletive_it_object_raising-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_inchoative-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_inchoative-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_intransitive-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_intransitive-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_past_participle_adjectives-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_past_participle_adjectives-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_past_participle_verbs-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_past_participle_verbs-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_plural_subject_verb_agreement_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_plural_subject_verb_agreement_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_plural_subject_verb_agreement_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_irregular_plural_subject_verb_agreement_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_left_branch_island_echo_question-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_left_branch_island_echo_question-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_left_branch_island_simple_question-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_left_branch_island_simple_question-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_matrix_question_npi_licensor_present-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_matrix_question_npi_licensor_present-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_npi_present_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_npi_present_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_npi_present_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_npi_present_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_only_npi_licensor_present-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_only_npi_licensor_present-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_only_npi_scope-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_only_npi_scope-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_passive_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_passive_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_passive_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_passive_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_c_command-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_c_command-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_case_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_case_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_case_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_case_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_domain_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_domain_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_domain_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_domain_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_domain_3-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_domain_3-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_reconstruction-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_principle_A_reconstruction-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_regular_plural_subject_verb_agreement_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_regular_plural_subject_verb_agreement_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_regular_plural_subject_verb_agreement_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_regular_plural_subject_verb_agreement_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_sentential_negation_npi_licensor_present-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_sentential_negation_npi_licensor_present-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_sentential_negation_npi_scope-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_sentential_negation_npi_scope-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_sentential_subject_island-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_sentential_subject_island-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_superlative_quantifiers_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_superlative_quantifiers_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_superlative_quantifiers_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_superlative_quantifiers_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_tough_vs_raising_1-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_tough_vs_raising_1-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_tough_vs_raising_2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_tough_vs_raising_2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_transitive-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_transitive-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_island-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_island-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_questions_object_gap-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_questions_object_gap-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_questions_subject_gap-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_questions_subject_gap-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_questions_subject_gap_long_distance-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_questions_subject_gap_long_distance-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_no_gap-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_no_gap-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_no_gap_long_distance-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_no_gap_long_distance-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_with_gap-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_with_gap-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_with_gap_long_distance-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/blimp_wh_vs_that_with_gap_long_distance-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/boolq-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/boolq-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/boolq-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/boolq-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/cb-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/cb-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/cb-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/cb-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/cola-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/cola-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/copa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/copa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/coqa-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/coqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/coqa-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/coqa-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_age-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_age-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_autre-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_autre-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_disability-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_disability-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_gender-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_gender-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_nationality-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_nationality-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_physical_appearance-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_physical_appearance-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_race_color-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_race_color-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_religion-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_religion-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_sexual_orientation-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_sexual_orientation-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_socioeconomic-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_english_socioeconomic-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_age-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_age-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_autre-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_autre-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_disability-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_disability-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_gender-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_gender-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_nationality-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_nationality-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_physical_appearance-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_physical_appearance-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_race_color-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_race_color-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_religion-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_religion-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_sexual_orientation-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_sexual_orientation-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_socioeconomic-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/crows_pairs_french_socioeconomic-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/cycle_letters-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/cycle_letters-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/drop-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/drop-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/drop-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/drop-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/ethics_cm-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/ethics_cm-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/ethics_deontology-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/ethics_deontology-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/ethics_justice-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/ethics_justice-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/ethics_utilitarianism-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/ethics_utilitarianism-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/ethics_utilitarianism_original-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/ethics_utilitarianism_original-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/ethics_virtue-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/ethics_virtue-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/gguf_test_44e268d15decc4d2d0f99e57e1476269826cd3b54262f7a0981f75ddd45b25d0.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gguf_test_52ea409606de8755e03cf7c79f824101a4ce64bb6e6d3df556b8a4e7a5d92418.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gguf_test_8fcf3f2f52afeb2acd7c8e02c2cc3ce31a691b665d295f6c4e4bbd71c7caa1a2.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gpt3_test_0deb8e9bde8e8327bbc48157f638ff3ba06b0cd816dad2beb8ad90f7fbe795c7.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gpt3_test_8025023377febbd8c5f2b9f26705c394ff375d0cad7c89c10fd9b8e1eb66ff1c.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gpt3_test_bb2cc49115e88788ed870ad0716eb00b280a885f91c7ed6e1e864435e5e2b6ac.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gpt3_test_cfd11f555a5a63b6dfa114a55a932e51b724cdd44d4842586b9ce37260bf7aaa.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gpt3_test_f307d52964c295e2005c5e782b688c24388e0cecadf29f1e6fc7f394236ea9c0.pkl
quantization/lm-evaluation-harness-main/tests/testdata/gsm8k-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/gsm8k-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/headqa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/headqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/headqa_en-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/headqa_en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/headqa_es-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/headqa_es-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hellaswag-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hellaswag-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-abstract_algebra-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-abstract_algebra-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-anatomy-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-anatomy-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-astronomy-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-astronomy-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-business_ethics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-business_ethics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-clinical_knowledge-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-clinical_knowledge-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_biology-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_biology-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_chemistry-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_chemistry-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_computer_science-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_computer_science-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_mathematics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_mathematics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_medicine-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_medicine-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_physics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-college_physics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-computer_security-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-computer_security-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-conceptual_physics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-conceptual_physics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-econometrics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-econometrics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-electrical_engineering-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-electrical_engineering-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-elementary_mathematics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-elementary_mathematics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-formal_logic-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-formal_logic-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-global_facts-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-global_facts-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_biology-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_biology-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_chemistry-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_chemistry-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_computer_science-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_computer_science-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_european_history-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_european_history-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_geography-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_geography-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_government_and_politics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_government_and_politics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_macroeconomics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_macroeconomics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_mathematics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_mathematics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_microeconomics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_microeconomics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_physics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_physics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_psychology-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_psychology-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_statistics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_statistics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_us_history-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_us_history-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_world_history-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-high_school_world_history-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-human_aging-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-human_aging-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-human_sexuality-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-human_sexuality-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-international_law-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-international_law-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-jurisprudence-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-jurisprudence-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-logical_fallacies-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-logical_fallacies-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-machine_learning-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-machine_learning-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-management-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-management-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-marketing-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-marketing-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-medical_genetics-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-medical_genetics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-miscellaneous-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-miscellaneous-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-moral_disputes-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-moral_disputes-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-moral_scenarios-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-moral_scenarios-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-nutrition-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-nutrition-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-philosophy-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-philosophy-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-prehistory-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-prehistory-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_accounting-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_accounting-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_law-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_law-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_medicine-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_medicine-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_psychology-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-professional_psychology-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-public_relations-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-public_relations-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-security_studies-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-security_studies-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-sociology-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-sociology-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-us_foreign_policy-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-us_foreign_policy-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-virology-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-virology-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-world_religions-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/hendrycksTest-world_religions-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/iwslt17-ar-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/iwslt17-ar-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/iwslt17-en-ar-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/iwslt17-en-ar-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_cloze-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_cloze-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_de-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_de-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_en-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_es-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_es-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_fr-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_fr-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_it-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_mt_it-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai-v2.0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai-v2.0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_10_hf_pretrained-EleutherAI-pythia-14m-dtype-float32-device-cpu.txt
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_cloze-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_cloze-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_de-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_de-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_en-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_es-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_es-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_fr-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_fr-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_it-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_openai_mt_it-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_standard-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_standard-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/lambada_standard_cloze-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/lambada_standard_cloze-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/logiqa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/logiqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_algebra-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_algebra-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_algebra-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_algebra-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_counting_and_prob-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_counting_and_prob-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_counting_and_prob-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_counting_and_prob-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_geometry-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_geometry-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_geometry-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_geometry-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_intermediate_algebra-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_intermediate_algebra-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_intermediate_algebra-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_intermediate_algebra-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_num_theory-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_num_theory-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_num_theory-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_num_theory-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_prealgebra-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_prealgebra-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_prealgebra-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_prealgebra-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_precalc-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_precalc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/math_precalc-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/math_precalc-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mathqa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mathqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mc_taco-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mc_taco-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mmlu_stem_10_hf_pretrained-EleutherAI-pythia-14m-dtype-float32-device-cpu.txt
quantization/lm-evaluation-harness-main/tests/testdata/mnli-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mnli-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mnli_mismatched-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mnli_mismatched-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mrpc-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mrpc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/multirc-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/multirc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/multirc-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/multirc-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mutual-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mutual-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mutual-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mutual-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mutual_plus-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mutual_plus-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/mutual_plus-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/mutual_plus-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/openbookqa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/openbookqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_arxiv-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_arxiv-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_arxiv-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_arxiv-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_bookcorpus2-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_bookcorpus2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_bookcorpus2-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_bookcorpus2-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_books3-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_books3-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_books3-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_books3-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_dm-mathematics-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_dm-mathematics-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_dm-mathematics-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_dm-mathematics-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_enron-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_enron-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_enron-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_enron-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_europarl-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_europarl-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_europarl-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_europarl-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_freelaw-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_freelaw-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_freelaw-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_freelaw-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_github-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_github-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_github-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_github-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_gutenberg-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_gutenberg-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_gutenberg-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_gutenberg-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_hackernews-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_hackernews-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_hackernews-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_hackernews-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_nih-exporter-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_nih-exporter-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_nih-exporter-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_nih-exporter-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_opensubtitles-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_opensubtitles-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_opensubtitles-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_opensubtitles-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_openwebtext2-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_openwebtext2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_openwebtext2-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_openwebtext2-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_philpapers-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_philpapers-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_philpapers-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_philpapers-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_pile-cc-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_pile-cc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_pile-cc-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_pile-cc-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-abstracts-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-abstracts-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-abstracts-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-abstracts-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-central-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-central-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-central-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_pubmed-central-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_stackexchange-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_stackexchange-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_stackexchange-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_stackexchange-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_ubuntu-irc-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_ubuntu-irc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_ubuntu-irc-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_ubuntu-irc-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_uspto-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_uspto-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_uspto-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_uspto-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_wikipedia-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_wikipedia-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_wikipedia-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_wikipedia-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_youtubesubtitles-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_youtubesubtitles-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pile_youtubesubtitles-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/pile_youtubesubtitles-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/piqa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/piqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/prost-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/prost-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/pubmedqa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/pubmedqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/qa4mre_2011-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/qa4mre_2011-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/qa4mre_2012-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/qa4mre_2012-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/qa4mre_2013-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/qa4mre_2013-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/qnli-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/qnli-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/qqp-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/qqp-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/race-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/race-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/random_insertion-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/random_insertion-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/record-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/record-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/reversed_words-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/reversed_words-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/rte-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/rte-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/sciq-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/sciq-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/squad2-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/squad2-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/squad2-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/squad2-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/squad2-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/squad2-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/sst-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/sst-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/swag-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/swag-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_0a89c2739f9598b4be2674b0a8e43931d7f3f0b696970bcba31f9b52bdf12297.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_0c1c14571add7903b89e588c8212572b95bb57b334fc0752c89a7e045a5f63ae.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_3092d07756f3e1d010c07524cc8a2ecba7f0c19f9e39f2aaf2bf440bfe328004.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_434076260b6af3a46b7a5eaceec3306a5872c400a3872f744280b237455a0f8e.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_49c47ae40e11f349f2f6b492128188b1b2bc103a421c676ee4b2142a68b43516.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_4fd8d66a6dad7f602b40e5d7dc298d6fe329299d086a4659743a41f4a4012659.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_51b5302f157cf224f694ccad973f255ae19e9e061d533256bdf75b04e0a917ab.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_6d6c62dd70caaa208712bf766deaf419cfac89538d4ab7745621e339394c0c23.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_7209c4617547bfe17cb9e7f5f735fe35822d650aefdc5fbeeaf0c1724effbe09.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_7afdc285388e51094e12645f305328c759574fa3ec9751631025f8ad5ebf9f3e.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_9d5f33dbfe1e254928c89f5ed85e4c010d888065f55a8f1b863bc1eb0340a5f2.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_abcbcba648d89e5d81a50511a6d24ddeb538de2ffe108c1370dd74ce6ac8038d.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_b1cbb29666cce5e31a1e97695858137398a0885ca5d5d98f515404fb6aeb99e7.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_e7ad1e9f52a39e1ddd1e50f3c57ffa4546728dd150a67c0a0ddc8675c04e15d1.pkl
quantization/lm-evaluation-harness-main/tests/testdata/textsynth_test_f4bfe4beb605bd52a8ab6be3c9293639e7e2261d98de58159d15ccb83131bf4e.pkl
quantization/lm-evaluation-harness-main/tests/testdata/toxigen-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/toxigen-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/triviaqa-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/triviaqa-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/triviaqa-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/triviaqa-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_gen-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_gen-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_gen-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_gen-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_mc-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_mc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_mc-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/truthfulqa_mc-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/webqs-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/webqs-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wic-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/wic-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wikitext-v0-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/wikitext-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wikitext-v1-loglikelihood_rolling
quantization/lm-evaluation-harness-main/tests/testdata/wikitext-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wikitext_10_hf_pretrained-EleutherAI-pythia-14m-dtype-float32-device-cpu.txt
quantization/lm-evaluation-harness-main/tests/testdata/winogrande-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/winogrande-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt14-en-fr-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt14-en-fr-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt14-fr-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt14-fr-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-de-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-de-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-en-de-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-en-de-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-en-ro-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-en-ro-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-ro-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt16-ro-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-cs-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-cs-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-de-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-de-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-de-fr-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-de-fr-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-cs-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-cs-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-de-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-de-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-iu-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-iu-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ja-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ja-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ja-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ja-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-km-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-km-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-pl-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-pl-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ps-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ps-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ru-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ru-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ta-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-ta-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-zh-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-zh-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-zh-v1-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-en-zh-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-fr-de-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-fr-de-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-iu-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-iu-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ja-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ja-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-km-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-km-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-pl-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-pl-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ps-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ps-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ru-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ru-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ta-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-ta-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-zh-en-v0-greedy_until
quantization/lm-evaluation-harness-main/tests/testdata/wmt20-zh-en-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wnli-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/wnli-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wnli-v1-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/wnli-v1-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wsc-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/wsc-v0-res.json
quantization/lm-evaluation-harness-main/tests/testdata/wsc273-v0-loglikelihood
quantization/lm-evaluation-harness-main/tests/testdata/wsc273-v0-res.json
quantization/lm-evaluation-harness-main/tests/testyamls/test-01.yaml
scripts/validate_paper_alignment.py