# Group definition: bundles the five "permute" metabench subtasks under one
# group name so they can be selected and reported together.
group: metabench_permute

# Member tasks of the group. Each name must match a task defined elsewhere
# (the definitions are not part of this file).
task:
  - metabench_arc_permute
  - metabench_hellaswag_permute
  - metabench_mmlu_permute
  - metabench_truthfulqa_permute
  - metabench_winogrande_permute

# Group-level score: the `acc` metric of the member tasks combined with `mean`.
# NOTE(review): `weight_by_size: false` presumably gives every subtask equal
# weight regardless of its number of examples -- confirm against the harness docs.
aggregate_metric_list:
  - metric: acc
    aggregation: mean
    weight_by_size: false

metadata:
  version: 0.0