File size: 510 Bytes
9d5b280
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
lev_answer_mapping = {"true": "نعم", "false": "لا", True: "نعم", False: "لا"}


def process_docs(dataset):
    def remove_question_mark(text):
        text = text.strip()
        if text.endswith("?") or text.endswith("؟"):
            text = text[:-1]
        text = text.strip()

        return text

    def _helper(doc):
        doc["question"] = remove_question_mark(doc["question"])
        doc["target"] = lev_answer_mapping[doc["answer"]]
        return doc

    return dataset.map(_helper)