File size: 672 Bytes
fc35a48
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import fire
import sys

from .data import HUMAN_EVAL
from .evaluation import evaluate_functional_correctness


def entry_point(

    sample_file: str,

    k: str = "1,10,100",

    n_workers: int = 4,

    timeout: float = 3.0,

    problem_file: str = "",

    is_mbpp: bool = False,

):
    """

    Evaluates the functional correctness of generated samples, and writes

    results to f"{sample_file}_results.jsonl.gz"

    """
    k = list(map(int, k.split(",")))
    results = evaluate_functional_correctness(sample_file, k, n_workers, timeout, problem_file, is_mbpp)
    print(results)


def main():
    fire.Fire(entry_point)


sys.exit(main())