From 7057b76cb24ef69b36ff01ba23d01223afd19ef9 Mon Sep 17 00:00:00 2001 From: Muhammad Taha Date: Mon, 6 May 2024 22:26:22 +0800 Subject: [PATCH 1/2] adding a cookbook for finetune embeddings --- cookbook/finetuning_embedding_model.py | 31 ++++++++++++++++++++++++++ 1 file changed, 31 insertions(+) create mode 100644 cookbook/finetuning_embedding_model.py diff --git a/cookbook/finetuning_embedding_model.py b/cookbook/finetuning_embedding_model.py new file mode 100644 index 0000000..8501fd9 --- /dev/null +++ b/cookbook/finetuning_embedding_model.py @@ -0,0 +1,31 @@ +from beyondllm import source, retrieve, llms +from beyondllm.embeddings import FineTuneEmbeddings +import os + + +# Setting up an environment variable for API key +os.environ['GOOGLE_API_KEY'] = "your-api-key" + +# Importing and preparing the data +data = source.fit("build-career-in-ai.pdf", dtype="pdf", chunk_size=1024, chunk_overlap=0) + +# List of files to train the embeddings +list_of_files = ['build-career-in-ai.pdf'] + +# Initializing a Gemini LLM model +llm = llms.GeminiModel() + +# Creating an instance of FineTuneEmbeddings +fine_tuned_model = FineTuneEmbeddings() + +# Training the embedding model +embed_model = fine_tuned_model.train(list_of_files, "BAAI/bge-small-en-v1.5", llm, "fintune") + +# Option to load an already fine-tuned model +# embed_model = fine_tuned_model.load_model("fintune") + +# Creating a retriever using the fine-tuned embeddings +retriever = retrieve.auto_retriever(data, embed_model, type="normal", top_k=4) + +# Retrieving information using a query +print(retriever.retrieve("How to excel in AI?")) From 9317e6ed7be5141667c6387f9f311a6f9b0cbfa8 Mon Sep 17 00:00:00 2001 From: Muhammad Taha Date: Wed, 8 May 2024 19:42:11 +0800 Subject: [PATCH 2/2] Adding support for observability for OpenAI models --- src/beyondllm/observe/__intit__.py | 1 + src/beyondllm/observe/observe.py | 26 ++++++++++++++++++++++++++ 2 files changed, 27 insertions(+) create mode 100644 src/beyondllm/observe/__intit__.py create mode 100644 src/beyondllm/observe/observe.py diff --git a/src/beyondllm/observe/__intit__.py b/src/beyondllm/observe/__intit__.py new file mode 100644 index 0000000..f623392 --- /dev/null +++ b/src/beyondllm/observe/__intit__.py @@ -0,0 +1 @@ +from .observe import Observer \ No newline at end of file diff --git a/src/beyondllm/observe/observe.py b/src/beyondllm/observe/observe.py new file mode 100644 index 0000000..a638399 --- /dev/null +++ b/src/beyondllm/observe/observe.py @@ -0,0 +1,26 @@ +from dataclasses import dataclass +try: + import phoenix as px + from phoenix.trace.openai import OpenAIInstrumentor +except ImportError: + user_agree = input("The feature you're trying to use requires additional packages. Would you like to install them now? [y/N]: ") + if user_agree.lower() == 'y': + import subprocess + import sys + subprocess.check_call([sys.executable, "-m", "pip", "install", "arize-phoenix[evals]"]) + + import phoenix as px + from phoenix.trace.openai import OpenAIInstrumentor + else: + raise ImportError("The required Phoenix packages are not installed.") + + + +@dataclass +class Observer: + instrumentor: OpenAIInstrumentor = OpenAIInstrumentor() + + def run(self): + self.instrumentor.instrument() + self.session = px.launch_app() + \ No newline at end of file