Skip to content

Commit

Permalink
Reorganize assets and unify naming scheme (#191)
Browse files Browse the repository at this point in the history
This commit introduces a new naming scheme for assets, roughly corresponding to
	`language_code/task_category/task/dataset_model_nshot.py`.
Model, dataset and task names have also been standardized, and some duplicate assets have been removed.

* Reorganize assets and unify naming scheme

* Remove duplicate GPT4 propaganda asset

* Remove duplicate GPT3.5 harmfulness detection asset

* Remove duplicate GPT3.5 claim detection asset, and unify naming scheme for others

* Add missing Lemmatization assets for BLOOMZ and GPT4

* Rename gender assets to remove redundant 'Gender' prefix

* Rename CT22/CT23/Propaganda datasets

* Fix language codes and format code

* Fix HateSpeech and Offensive dataset names

* Fix Parsing citations and dataset name

* Fix ArSAS dataset name

* Fix ADI dataset name

* Fix default label type in Propaganda task

* Fix incorrect Dataset in Harmful GPT4 asset

* Rename datasets, assets and tasks for stance and factuality

Renamed datasets, assets and tasks for stance and factuality.

* Fix Lemmatization dataset name and citation

* Format code

* Fix Diacritization dataset name and citation

* Add Dialectal Diacritization dataset and asset

* Add GPT4 diacritization assets

* Split segmentation assets across correct datasets

* Split POS assets across correct datasets and add proper citations

* Merge similar tasks and update assets

* Format code

* Rename STS assets to match convention

---------

Co-authored-by: maramhasanain <[email protected]>
  • Loading branch information
fdalvi and MaramHasanain authored Sep 6, 2023
1 parent 9c6e202 commit 6509529
Show file tree
Hide file tree
Showing 261 changed files with 2,175 additions and 1,198 deletions.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
import os

from llmebench.datasets import AttentionworthyDataset
from llmebench.datasets import CT22AttentionworthyDataset
from llmebench.models import BLOOMPetalModel
from llmebench.tasks import AttentionworthyTask


def config():
return {
"dataset": AttentionworthyDataset,
"dataset": CT22AttentionworthyDataset,
"dataset_args": {},
"task": AttentionworthyTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,14 +1,14 @@
import os
import re

from llmebench.datasets import AttentionworthyDataset
from llmebench.models import GPTModel, RandomGPTModel
from llmebench.datasets import CT22AttentionworthyDataset
from llmebench.models import GPTModel
from llmebench.tasks import AttentionworthyTask


def config():
return {
"dataset": AttentionworthyDataset,
"dataset": CT22AttentionworthyDataset,
"dataset_args": {},
"task": AttentionworthyTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,18 +1,13 @@
import os
import random
import re

from llmebench.datasets import AttentionworthyDataset
from llmebench.datasets import CT22AttentionworthyDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import AttentionworthyTask


random.seed(1333)


def config():
return {
"dataset": AttentionworthyDataset,
"dataset": CT22AttentionworthyDataset,
"dataset_args": {},
"task": AttentionworthyTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,18 +1,13 @@
import os
import random
import re

from llmebench.datasets import AttentionworthyDataset
from llmebench.datasets import CT22AttentionworthyDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import AttentionworthyTask


random.seed(1333)


def config():
return {
"dataset": AttentionworthyDataset,
"dataset": CT22AttentionworthyDataset,
"dataset_args": {},
"task": AttentionworthyTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
import os

from llmebench.datasets import CheckworthinessDataset
from llmebench.datasets import CT22CheckworthinessDataset
from llmebench.models import BLOOMPetalModel
from llmebench.tasks import CheckworthinessTask


def config():
return {
"dataset": CheckworthinessDataset,
"dataset": CT22CheckworthinessDataset,
"dataset_args": {},
"task": CheckworthinessTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
import os

from llmebench.datasets import CheckworthinessDataset
from llmebench.datasets import CT22CheckworthinessDataset
from llmebench.models import GPTModel, RandomGPTModel
from llmebench.tasks import CheckworthinessTask


def config():
return {
"dataset": CheckworthinessDataset,
"dataset": CT22CheckworthinessDataset,
"dataset_args": {},
"task": CheckworthinessTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
import random
import re

from llmebench.datasets import CheckworthinessDataset
from llmebench.datasets import CT22CheckworthinessDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import CheckworthinessTask

Expand All @@ -12,7 +12,7 @@

def config():
return {
"dataset": CheckworthinessDataset,
"dataset": CT22CheckworthinessDataset,
"dataset_args": {},
"task": CheckworthinessTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
import random
import re

from llmebench.datasets import CheckworthinessDataset
from llmebench.datasets import CT22CheckworthinessDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import CheckworthinessTask

Expand All @@ -12,7 +12,7 @@

def config():
return {
"dataset": CheckworthinessDataset,
"dataset": CT22CheckworthinessDataset,
"dataset_args": {},
"task": CheckworthinessTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
import os

from llmebench.datasets import CovidClaimDataset
from llmebench.datasets import CT22ClaimDataset
from llmebench.models import BLOOMPetalModel
from llmebench.tasks import ClaimDetectionTask


def config():
return {
"dataset": CovidClaimDataset,
"dataset": CT22ClaimDataset,
"dataset_args": {},
"task": ClaimDetectionTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
import os

from llmebench.datasets import CovidClaimDataset
from llmebench.datasets import CT22ClaimDataset
from llmebench.models import GPTModel
from llmebench.tasks import ClaimDetectionTask


def config():
return {
"dataset": CovidClaimDataset,
"dataset": CT22ClaimDataset,
"dataset_args": {},
"task": ClaimDetectionTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
import os

from llmebench.datasets import CovidClaimDataset
from llmebench.datasets import CT22ClaimDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import ClaimDetectionTask


def config():
return {
"dataset": CovidClaimDataset,
"dataset": CT22ClaimDataset,
"dataset_args": {},
"task": ClaimDetectionTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,18 +1,13 @@
import os
import random
import re

from llmebench.datasets import CheckworthinessDataset
from llmebench.datasets import CT22CheckworthinessDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import CheckworthinessTask


random.seed(1333)


def config():
return {
"dataset": CheckworthinessDataset,
"dataset": CT22CheckworthinessDataset,
"dataset_args": {},
"task": CheckworthinessTask,
"task_args": {},
Expand Down
Original file line number Diff line number Diff line change
@@ -1,15 +1,15 @@
import os

from llmebench.datasets import FactualityCOVID19Dataset
from llmebench.datasets import COVID19FactualityDataset
from llmebench.models import BLOOMPetalModel
from llmebench.tasks import FactualityCOVID19Task
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityCOVID19Dataset,
"dataset": COVID19FactualityDataset,
"dataset_args": {},
"task": FactualityCOVID19Task,
"task": FactualityTask,
"task_args": {},
"model": BLOOMPetalModel,
"model_args": {
Expand Down
Original file line number Diff line number Diff line change
@@ -1,20 +1,15 @@
import os
import random
import re

from llmebench.datasets import FactualityCOVID19Dataset
from llmebench.datasets import COVID19FactualityDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import FactualityCOVID19Task


random.seed(1333)
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityCOVID19Dataset,
"dataset": COVID19FactualityDataset,
"dataset_args": {},
"task": FactualityCOVID19Task,
"task": FactualityTask,
"task_args": {},
"model": GPTChatCompletionModel,
"model_args": {
Expand Down
Original file line number Diff line number Diff line change
@@ -1,20 +1,15 @@
import os
import random
import re

from llmebench.datasets import FactualityCOVID19Dataset
from llmebench.datasets import COVID19FactualityDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import FactualityCOVID19Task


random.seed(1333)
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityCOVID19Dataset,
"dataset": COVID19FactualityDataset,
"dataset_args": {},
"task": FactualityCOVID19Task,
"task": FactualityTask,
"task_args": {},
"model": GPTChatCompletionModel,
"model_args": {
Expand Down
Original file line number Diff line number Diff line change
@@ -1,20 +1,15 @@
import os
import random
import re

from llmebench.datasets import FactualityKhouja20Dataset
from llmebench.datasets import Khouja20FactualityDataset
from llmebench.models import BLOOMPetalModel
from llmebench.tasks import FactualityKhouja20Task


random.seed(1333)
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityKhouja20Dataset,
"dataset": Khouja20FactualityDataset,
"dataset_args": {},
"task": FactualityKhouja20Task,
"task": FactualityTask,
"task_args": {},
"model": BLOOMPetalModel,
"model_args": {
Expand Down
Original file line number Diff line number Diff line change
@@ -1,15 +1,15 @@
import os

from llmebench.datasets import FactualityKhouja20Dataset
from llmebench.models import GPTModel, RandomGPTModel
from llmebench.tasks import FactualityKhouja20Task
from llmebench.datasets import Khouja20FactualityDataset
from llmebench.models import GPTModel
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityKhouja20Dataset,
"dataset": Khouja20FactualityDataset,
"dataset_args": {},
"task": FactualityKhouja20Task,
"task": FactualityTask,
"task_args": {},
"model": GPTModel,
"model_args": {
Expand Down
Original file line number Diff line number Diff line change
@@ -1,15 +1,15 @@
import os

from llmebench.datasets import FactualityKhouja20Dataset
from llmebench.datasets import Khouja20FactualityDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import FactualityKhouja20Task
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityKhouja20Dataset,
"dataset": Khouja20FactualityDataset,
"dataset_args": {},
"task": FactualityKhouja20Task,
"task": FactualityTask,
"task_args": {},
"model": GPTChatCompletionModel,
"model_args": {
Expand Down
Original file line number Diff line number Diff line change
@@ -1,15 +1,15 @@
import os

from llmebench.datasets import FactualityKhouja20Dataset
from llmebench.datasets import Khouja20FactualityDataset
from llmebench.models import GPTChatCompletionModel
from llmebench.tasks import FactualityKhouja20Task
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityKhouja20Dataset,
"dataset": Khouja20FactualityDataset,
"dataset_args": {},
"task": FactualityKhouja20Task,
"task": FactualityTask,
"task_args": {},
"model": GPTChatCompletionModel,
"model_args": {
Expand Down
Original file line number Diff line number Diff line change
@@ -1,20 +1,15 @@
import os
import random
import re

from llmebench.datasets import FactualityUnifiedFCDataset
from llmebench.datasets import UnifiedFCFactualityDataset
from llmebench.models import BLOOMPetalModel
from llmebench.tasks import FactualityUnifiedFCTask


random.seed(1333)
from llmebench.tasks import FactualityTask


def config():
return {
"dataset": FactualityUnifiedFCDataset,
"dataset": UnifiedFCFactualityDataset,
"dataset_args": {},
"task": FactualityUnifiedFCTask,
"task": FactualityTask,
"task_args": {},
"model": BLOOMPetalModel,
"model_args": {
Expand Down
Loading

0 comments on commit 6509529

Please sign in to comment.