Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

refactor: move prompt templates to files (#593) #596

Merged
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
15 changes: 15 additions & 0 deletions assets/prompt-templates/correct_error_prompt.tmpl
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@

You are provided with the following {engine} DataFrames with the following metadata:

{dataframes}

The user asked the following question:
{conversation}

You generated this python code:
{code}

It fails with the following error:
{error_returned}

Correct the python code and return a new python code (do not import anything) that fixes the above mentioned error. Do not generate the same code again.
30 changes: 30 additions & 0 deletions assets/prompt-templates/generate_python_code.tmpl
Original file line number Diff line number Diff line change
@@ -0,0 +1,30 @@

You are provided with the following pandas DataFrames:

{dataframes}

<conversation>
{conversation}
</conversation>

This is the initial python code to be updated:
```python
# TODO import all the dependencies required
{default_import}

def analyze_data(dfs: list[{engine_df_name}]) -> dict:
"""
Analyze the data
1. Prepare: Preprocessing and cleaning data if necessary
2. Process: Manipulating data for analysis (grouping, filtering, aggregating, etc.)
3. Analyze: Conducting the actual analysis (if the user asks to plot a chart save it to an image in {save_charts_path}/temp_chart.png and do not show the chart.)
4. Output: return a dictionary of:
- type (possible values "text", "number", "dataframe", "plot")
- value (can be a string, a dataframe or the path of the plot, NOT a dictionary)
Example output: {{ "type": "text", "value": "The average loan amount is $15,000." }}
"""
```

Using the provided dataframes (`dfs`), update the python code based on the last question in the conversation.

Updated code:
46 changes: 39 additions & 7 deletions docs/custom-prompts.md
Original file line number Diff line number Diff line change
Expand Up @@ -16,14 +16,44 @@ To create your custom prompt create a new CustomPromptClass inherited from base

```python
from pandasai import SmartDataframe
from pandasai.prompts import Prompt
from pandasai.prompts import AbstractPrompt


class MyCustomPrompt(AbstractPrompt):
@property
def template(self):
return """This is your custom text for your prompt with custom {my_custom_value}"""


df = SmartDataframe("data.csv", {
"custom_prompts": {
"generate_python_code": MyCustomPrompt(
my_custom_value="my custom value")
}
})
```

You can also use `FileBasedPrompt` in case you prefer to store prompt template in a file:

_my_prompt_template.tmpl:_
```
This is your custom text for your prompt with custom {my_custom_value}
```
_python code:_

```python
from pandasai import SmartDataframe
from pandasai.prompts import FileBasedPrompt


class MyCustomFileBasedPrompt(FileBasedPrompt):
_path_to_template = "path/to/my_prompt_template.tmpl"

class MyCustomPrompt(Prompt):
text = """This is your custom text for your prompt with custom {my_custom_value}"""

df = SmartDataframe("data.csv", {
"custom_prompts": {
"generate_python_code": MyCustomPrompt(my_custom_value="my custom value")
"generate_python_code": MyCustomFileBasedPrompt(
my_custom_value="my custom value")
}
})
```
Expand All @@ -36,15 +66,17 @@ You can directly access the default prompt variables (for example dfs, conversat

```python
from pandasai import SmartDataframe
from pandasai.prompts import Prompt
from pandasai.prompts import AbstractPrompt

class MyCustomPrompt(Prompt):
text = """You are given a dataframe with number if rows equal to {dfs[0].shape[0]} and number of columns equal to {dfs[0].shape[1]}

class MyCustomPrompt(AbstractPrompt):
    template = """You are given a dataframe with number of rows equal to {dfs[0].shape[0]} and number of columns equal to {dfs[0].shape[1]}

Here's the conversation:
{conversation}
"""


df = SmartDataframe("data.csv", {
"custom_prompts": {
"generate_python_code": MyCustomPrompt()
Expand Down
4 changes: 2 additions & 2 deletions pandasai/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,7 @@
import pandas as pd
from .smart_dataframe import SmartDataframe
from .smart_datalake import SmartDatalake
from .prompts.base import Prompt
from .prompts.base import AbstractPrompt
from .callbacks.base import BaseCallback
from .schemas.df_config import Config
from .helpers.cache import Cache
Expand Down Expand Up @@ -112,7 +112,7 @@ def __init__(
middlewares=None,
custom_whitelisted_dependencies=None,
enable_logging=True,
non_default_prompts: Optional[Dict[str, Type[Prompt]]] = None,
non_default_prompts: Optional[Dict[str, Type[AbstractPrompt]]] = None,
callback: Optional[BaseCallback] = None,
):
"""
Expand Down
20 changes: 20 additions & 0 deletions pandasai/exceptions.py
Original file line number Diff line number Diff line change
Expand Up @@ -71,3 +71,23 @@ def __init__(self, library_name):
f"Generated code includes import of {library_name} which"
" is not in whitelist."
)


class TemplateFileNotFoundError(FileNotFoundError):
    """
    Raised when a prompt template file cannot be found at the given path.
    """

    def __init__(self, template_path, prompt_name="Unknown"):
        """
        __init__ method of TemplateFileNotFoundError Class

        Args:
            template_path (str): Path for template file.
            prompt_name (str): Prompt name. Defaults to "Unknown".
        """
        # Keep both values as attributes so callers can inspect the failing
        # path/prompt programmatically instead of parsing the error message.
        self.template_path = template_path
        self.prompt_name = prompt_name
        super().__init__(
            f"Unable to find a file with template at '{template_path}' "
            f"for '{prompt_name}' prompt."
        )
6 changes: 3 additions & 3 deletions pandasai/llm/azure_openai.py
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,7 @@
from ..helpers import load_dotenv

from ..exceptions import APIKeyNotFoundError, UnsupportedOpenAIModelError
from ..prompts.base import Prompt
from ..prompts.base import AbstractPrompt
from .base import BaseOpenAI

load_dotenv()
Expand Down Expand Up @@ -105,12 +105,12 @@ def _default_params(self) -> Dict[str, Any]:
"""
return {**super()._default_params, "engine": self.engine}

def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
"""
Call the Azure OpenAI LLM.

Args:
instruction (Prompt): A prompt object with instruction for LLM.
instruction (AbstractPrompt): A prompt object with instruction for LLM.
suffix (str): Suffix to pass.

Returns:
Expand Down
18 changes: 9 additions & 9 deletions pandasai/llm/base.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,7 @@ class CustomLLM(BaseOpenAI):
NoCodeFoundError,
)
from ..helpers.openai_info import openai_callback_var
from ..prompts.base import Prompt
from ..prompts.base import AbstractPrompt


class LLM:
Expand Down Expand Up @@ -120,12 +120,12 @@ def _extract_code(self, response: str, separator: str = "```") -> str:
return code

@abstractmethod
def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
"""
Execute the LLM with given prompt.

Args:
instruction (Prompt): A prompt object with instruction for LLM.
instruction (AbstractPrompt): A prompt object with instruction for LLM.
suffix (str, optional): Suffix. Defaults to "".

Raises:
Expand All @@ -134,12 +134,12 @@ def call(self, instruction: Prompt, suffix: str = "") -> str:
"""
raise MethodNotImplementedError("Call method has not been implemented")

def generate_code(self, instruction: Prompt) -> str:
def generate_code(self, instruction: AbstractPrompt) -> str:
"""
Generate the code based on the instruction and the given prompt.

Args:
instruction (Prompt): Prompt with instruction for LLM.
instruction (AbstractPrompt): Prompt with instruction for LLM.

Returns:
str: A string of Python code.
Expand Down Expand Up @@ -334,11 +334,11 @@ def query(self, payload) -> str:

return response.json()[0]["generated_text"]

def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
"""
A call method of HuggingFaceLLM class.
Args:
instruction (Prompt): A prompt object with instruction for LLM.
instruction (AbstractPrompt): A prompt object with instruction for LLM.
suffix (str): A string representing the suffix to be truncated
from the generated response.

Expand Down Expand Up @@ -429,12 +429,12 @@ def _generate_text(self, prompt: str) -> str:
"""
raise MethodNotImplementedError("method has not been implemented")

def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
"""
Call the Google LLM.

Args:
instruction (Prompt): Instruction to pass.
instruction (AbstractPrompt): Instruction to pass.
suffix (str): Suffix to pass. Defaults to an empty string ("").

Returns:
Expand Down
4 changes: 2 additions & 2 deletions pandasai/llm/fake.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

from typing import Optional

from ..prompts.base import Prompt
from ..prompts.base import AbstractPrompt
from .base import LLM


Expand All @@ -16,7 +16,7 @@ def __init__(self, output: Optional[str] = None):
if output is not None:
self._output = output

def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
self.last_prompt = instruction.to_string() + suffix
return self._output

Expand Down
14 changes: 7 additions & 7 deletions pandasai/llm/huggingface_text_gen.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

from .base import LLM
from ..helpers import load_dotenv
from ..prompts.base import Prompt
from ..prompts.base import AbstractPrompt

load_dotenv()

Expand All @@ -14,7 +14,7 @@ class HuggingFaceTextGen(LLM):
top_k: Optional[int] = None
top_p: Optional[float] = 0.8
typical_p: Optional[float] = 0.8
temperature: float = 1E-3 # must be strictly positive
temperature: float = 1e-3 # must be strictly positive
repetition_penalty: Optional[float] = None
truncate: Optional[int] = None
stop_sequences: List[str] = None
Expand All @@ -29,7 +29,7 @@ def __init__(self, inference_server_url: str, **kwargs):
try:
import text_generation

for (key, val) in kwargs.items():
for key, val in kwargs.items():
if key in self.__annotations__:
setattr(self, key, val)

Expand Down Expand Up @@ -60,14 +60,14 @@ def _default_params(self) -> Dict[str, Any]:
"seed": self.seed,
}

def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
prompt = instruction.to_string() + suffix

params = self._default_params
if self.streaming:
completion = ""
for chunk in self.client.generate_stream(prompt, **params):
completion += chunk.text
completion += chunk.text
return completion

res = self.client.generate(prompt, **params)
Expand All @@ -76,8 +76,8 @@ def call(self, instruction: Prompt, suffix: str = "") -> str:
for stop_seq in self.stop_sequences:
if stop_seq in res.generated_text:
res.generated_text = res.generated_text[
:res.generated_text.index(stop_seq)
]
: res.generated_text.index(stop_seq)
]
return res.generated_text

@property
Expand Down
4 changes: 2 additions & 2 deletions pandasai/llm/langchain.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
from pandasai.prompts.base import Prompt
from pandasai.prompts.base import AbstractPrompt
from .base import LLM


Expand All @@ -13,7 +13,7 @@ class LangchainLLM(LLM):
def __init__(self, langchain_llm):
self._langchain_llm = langchain_llm

def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
prompt = instruction.to_string() + suffix
return self._langchain_llm.predict(prompt)

Expand Down
6 changes: 3 additions & 3 deletions pandasai/llm/openai.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@
from ..helpers import load_dotenv

from ..exceptions import APIKeyNotFoundError, UnsupportedOpenAIModelError
from ..prompts.base import Prompt
from ..prompts.base import AbstractPrompt
from .base import BaseOpenAI

load_dotenv()
Expand Down Expand Up @@ -85,12 +85,12 @@ def _default_params(self) -> Dict[str, Any]:
"model": self.model,
}

def call(self, instruction: Prompt, suffix: str = "") -> str:
def call(self, instruction: AbstractPrompt, suffix: str = "") -> str:
"""
Call the OpenAI LLM.

Args:
instruction (Prompt): A prompt object with instruction for LLM.
instruction (AbstractPrompt): A prompt object with instruction for LLM.
suffix (str): Suffix to pass.

Raises:
Expand Down
5 changes: 3 additions & 2 deletions pandasai/prompts/__init__.py
Original file line number Diff line number Diff line change
@@ -1,9 +1,10 @@
from .base import Prompt
from .base import AbstractPrompt, FileBasedPrompt
from .correct_error_prompt import CorrectErrorPrompt
from .generate_python_code import GeneratePythonCodePrompt

__all__ = [
"Prompt",
"AbstractPrompt",
"CorrectErrorPrompt",
"GeneratePythonCodePrompt",
"FileBasedPrompt",
]
Loading