-
Notifications
You must be signed in to change notification settings - Fork 18
/
XQuAD.py
29 lines (25 loc) · 1.02 KB
/
XQuAD.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
import json
from llmebench.datasets.SQuADBase import SQuADBase
from llmebench.tasks import TaskType
class XQuADDataset(SQuADBase):
    """Dataset entry for the Arabic XQuAD question-answering data.

    The class visible here adds nothing to ``SQuADBase`` beyond a
    pass-through constructor and the static metadata record below.
    """

    def __init__(self, **kwargs):
        """Forward every keyword argument unchanged to ``SQuADBase``."""
        super().__init__(**kwargs)

    @staticmethod
    def metadata():
        """Return the static description of this dataset.

        Returns:
            A dict with the keys ``language``, ``citation``, ``link``,
            ``license``, ``splits`` and ``task_type``.
        """
        # BibTeX entry for the paper cited for this dataset.
        bibtex_entry = """@inproceedings{artetxe2020cross,
title={On the Cross-lingual Transferability of Monolingual Representations},
author={Artetxe, Mikel and Ruder, Sebastian and Yogatama, Dani},
booktitle={Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
pages={4623--4637},
year={2020}
}"""

        # The train split points at an ARCD file behind a ":data_dir:"
        # prefix. NOTE(review): presumably that prefix is expanded by the
        # framework to the shared data directory -- confirm in the base class.
        split_files = {
            "test": "xquad.ar.json",
            "train": ":data_dir:ARCD/arcd-train.json",
        }

        return {
            "language": "ar",
            "citation": bibtex_entry,
            "link": "https://github.com/google-deepmind/xquad",
            "license": "CC-BY-SA4.0",
            "splits": split_files,
            "task_type": TaskType.QuestionAnswering,
        }