# Task group definition: bundles the BBH and MMLU task variants listed below
# under the single group name `flan_held_out`.
# NOTE(review): presumably consumed by an evaluation harness that resolves each
# entry by task name — confirm the names match the registered task configs.
group: flan_held_out
task:
  # BBH
  - bbh_zeroshot
  - bbh_fewshot
  - bbh_cot_fewshot
  - bbh_cot_zeroshot
  # MMLU
  - mmlu
  - mmlu_flan_n_shot_generative
  - mmlu_flan_n_shot_loglikelihood
  - mmlu_flan_cot_zeroshot
  - mmlu_flan_cot_fewshot