# Group definition: bundles the AGIEval tasks listed under `task` into a
# single group named `agieval_en`.
group: agieval_en
task:
  - agieval_aqua_rat
  # Categorized as EN because the AGIEval codebase lists this task in
  # `english_qa_tasks`.
  - agieval_gaokao_english
  - agieval_logiqa_en
  - agieval_lsat_ar
  - agieval_lsat_lr
  - agieval_lsat_rc
  - agieval_math
  - agieval_sat_en_without_passage
  - agieval_sat_en
  - agieval_sat_math
# Group-level metric: `acc` aggregated with `mean`.
# NOTE(review): `weight_by_size: true` presumably weights each task's score by
# its number of examples rather than averaging tasks equally; confirm against
# the harness documentation.
aggregate_metric_list:
  - metric: acc
    aggregation: mean
    weight_by_size: true
metadata:
  # Left unquoted so it parses as the same float the consumer already sees.
  version: 0.0