From 0eeb09d8d3a059164c92d27b2dbb4019b88b37a3 Mon Sep 17 00:00:00 2001 From: Arid Hasan <arid.hasan.h@gmail.com> Date: Tue, 10 Sep 2024 12:40:07 -0300 Subject: [PATCH] add asset GPT4-o NE --- assets/ne/QA/MultiNativQA_GPT4_ZeroShot.py | 53 ++++++++++++++++++++++ 1 file changed, 53 insertions(+) create mode 100644 assets/ne/QA/MultiNativQA_GPT4_ZeroShot.py diff --git a/assets/ne/QA/MultiNativQA_GPT4_ZeroShot.py b/assets/ne/QA/MultiNativQA_GPT4_ZeroShot.py new file mode 100644 index 00000000..63457b2a --- /dev/null +++ b/assets/ne/QA/MultiNativQA_GPT4_ZeroShot.py @@ -0,0 +1,53 @@ +from llmebench.datasets import MultiNativQADataset +from llmebench.models import OpenAIModel +from llmebench.tasks import MultiNativQATask + + +def metadata(): + return { + "author": "Arabic Language Technologies, QCRI, HBKU", + "model": "GPT4-o", + "description": "Deployed on Azure.", + "scores": {}, + } + + +def config(): + return { + "dataset": MultiNativQADataset, + "task": MultiNativQATask, + "model": OpenAIModel, + } + + +def prompt(input_sample): + # Define the question prompt + question_prompt = f""" + Please use your expertise to answer the following Nepali question. Answer in Nepali and rate your confidence level from 1 to 10. + Provide your response in the following JSON format: {{"answer": "your answer", "score": your confidence score}}. + Please provide JSON output only. No additional text. Answer should be limited to less or equal to {input_sample['length']} words. + + Question: {input_sample['question']} + """ + + # Define the assistant prompt + assistant_prompt = """ + You are an Nepali AI assistant specialized in providing detailed and accurate answers across various fields. + Your task is to deliver clear, concise, and relevant information. + """ + + return [ + {"role": "user", "content": question_prompt}, + {"role": "assistant", "content": assistant_prompt}, + ] + + +def post_process(response): + content = response["choices"][0]["message"]["content"].strip() + content = content.replace("\n", "").strip() + if "```json" in content: + # content = content.replace("```json", "").replace('```', '').replace("\n}", "}") + # content = content.replace("{\n", "{").replace("\",\n", "\",") + + content = re.search(r"```json(.*)```", content).group(1) + return json.loads(content)["answer"]