-
Notifications
You must be signed in to change notification settings - Fork 18
/
ANSFactuality.py
58 lines (50 loc) · 3.18 KB
/
ANSFactuality.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
from llmebench.datasets.dataset_base import DatasetBase
from llmebench.tasks import TaskType
class ANSFactualityDataset(DatasetBase):
def __init__(self, **kwargs):
super(ANSFactualityDataset, self).__init__(**kwargs)
@staticmethod
def metadata():
return {
"language": "ar",
"citation": """@inproceedings{khouja-2020-stance,
title = "Stance Prediction and Claim Verification: An {A}rabic Perspective",
author = "Khouja, Jude",
booktitle = "Proceedings of the Third Workshop on Fact Extraction and VERification (FEVER)",
month = jul,
year = "2020",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2020.fever-1.2",
doi = "10.18653/v1/2020.fever-1.2",
pages = "8--17",
abstract = "This work explores the application of textual entailment in news claim verification and stance prediction using a new corpus in Arabic. The publicly available corpus comes in two perspectives: a version consisting of 4,547 true and false claims and a version consisting of 3,786 pairs (claim, evidence). We describe the methodology for creating the corpus and the annotation process. Using the introduced corpus, we also develop two machine learning baselines for two proposed tasks: claim verification and stance prediction. Our best model utilizes pretraining (BERT) and achieves 76.7 F1 on the stance prediction task and 64.3 F1 on the claim verification task. Our preliminary experiments shed some light on the limits of automatic claim verification that relies on claims text only. Results hint that while the linguistic features and world knowledge learned during pretraining are useful for stance prediction, such learned representations from pretraining are insufficient for verifying claims without access to context or evidence.",
}""",
"link": "https://github.com/latynt/ans",
"download_url": "https://github.com/latynt/ans/archive/refs/heads/master.zip",
"splits": {
"test": "claim/test.csv",
"train": "claim/train.csv",
},
"task_type": TaskType.Classification,
"class_labels": ["true", "false"],
}
@staticmethod
def get_data_sample():
return {"input": "الجملة بالعربية", "label": "true", "line_number": "1"}
def load_data(self, data_path, no_labels=False):
data_path = self.resolve_path(data_path)
data = []
with open(data_path, "r", encoding="utf-8") as f:
next(f)
for line_idx, line in enumerate(f):
sentence, label_fixed = [str(s.strip()) for s in line.split(",")]
# The dataset uses 1 to reflect false/fake claims
if label_fixed == "1":
label_fixed = "false"
elif label_fixed == "0":
label_fixed = "true"
data.append(
{"input": sentence, "label": label_fixed, "line_number": line_idx}
)
return data