feat: system prompt (#448)

Author: cachho
Date: 2023-08-16 21:57:01 +02:00
Committed by: GitHub
Parent: 7585bc557b
Commit: 849de5e8ab

9 changed files with 50 additions and 10 deletions
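
For orientation, a minimal usage sketch of the feature this commit adds. The `App.chat(prompt, config)` call and the `OPENAI_API_KEY` requirement are assumptions from the surrounding embedchain API, not part of this diff:

```python
# Hedged sketch: pass a system prompt through the new ChatConfig option.
from embedchain import App
from embedchain.config import ChatConfig

app = App()  # assumes OPENAI_API_KEY is set and data was added via app.add(...)
config = ChatConfig(system_prompt="You are a terse documentation assistant.")
print(app.chat("How do I get started?", config))
```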

View File

@@ -25,6 +25,8 @@ class App(EmbedChain):
     def get_llm_model_answer(self, prompt, config: ChatConfig):
         messages = []
+        if config.system_prompt:
+            messages.append({"role": "system", "content": config.system_prompt})
         messages.append({"role": "user", "content": prompt})
         response = openai.ChatCompletion.create(
             model=config.model or "gpt-3.5-turbo-0613",
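
A self-contained sketch of the message construction added above, in the pre-1.0 `openai.ChatCompletion` style this file uses; `build_messages` is a hypothetical helper, not part of the commit:

```python
from typing import Dict, List, Optional

def build_messages(prompt: str, system_prompt: Optional[str] = None) -> List[Dict[str, str]]:
    # Mirror of the change above: a system message is sent only when a
    # system prompt is configured.
    messages = []
    if system_prompt:
        messages.append({"role": "system", "content": system_prompt})
    messages.append({"role": "user", "content": prompt})
    return messages

# e.g. openai.ChatCompletion.create(model="gpt-3.5-turbo-0613",
#                                   messages=build_messages("Hello", "Answer in one sentence."))
```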

View File

@@ -1,5 +1,5 @@
 import logging
-from typing import List
+from typing import List, Optional
 from langchain.schema import BaseMessage
@@ -84,7 +84,7 @@ class CustomApp(EmbedChain):
         if config.top_p and config.top_p != 1:
             logging.warning("Config option `top_p` is not supported by this model.")
-        messages = CustomApp._get_messages(prompt)
+        messages = CustomApp._get_messages(prompt, system_prompt=config.system_prompt)
         return chat(messages).content
@@ -97,7 +97,7 @@ class CustomApp(EmbedChain):
         if config.max_tokens and config.max_tokens != 1000:
             logging.warning("Config option `max_tokens` is not supported by this model.")
-        messages = CustomApp._get_messages(prompt)
+        messages = CustomApp._get_messages(prompt, system_prompt=config.system_prompt)
         return chat(messages).content
@@ -110,7 +110,7 @@ class CustomApp(EmbedChain):
         if config.top_p and config.top_p != 1:
             logging.warning("Config option `top_p` is not supported by this model.")
-        messages = CustomApp._get_messages(prompt)
+        messages = CustomApp._get_messages(prompt, system_prompt=config.system_prompt)
         return chat(messages).content
@@ -133,15 +133,19 @@ class CustomApp(EmbedChain):
         if config.top_p and config.top_p != 1:
             logging.warning("Config option `top_p` is not supported by this model.")
-        messages = CustomApp._get_messages(prompt)
+        messages = CustomApp._get_messages(prompt, system_prompt=config.system_prompt)
         return chat(messages).content
     @staticmethod
-    def _get_messages(prompt: str) -> List[BaseMessage]:
+    def _get_messages(prompt: str, system_prompt: Optional[str] = None) -> List[BaseMessage]:
         from langchain.schema import HumanMessage, SystemMessage
-        return [SystemMessage(content="You are a helpful assistant."), HumanMessage(content=prompt)]
+        messages = []
+        if system_prompt:
+            messages.append(SystemMessage(content=system_prompt))
+        messages.append(HumanMessage(content=prompt))
+        return messages
     def _stream_llm_model_response(self, response):
         """

View File

@@ -2,7 +2,7 @@ import os
 from langchain.llms import Replicate
-from embedchain.config import AppConfig
+from embedchain.config import AppConfig, ChatConfig
 from embedchain.embedchain import EmbedChain
@@ -27,8 +27,10 @@ class Llama2App(EmbedChain):
         super().__init__(config)
-    def get_llm_model_answer(self, prompt, config: AppConfig = None):
+    def get_llm_model_answer(self, prompt, config: ChatConfig = None):
         # TODO: Move the model and other inputs into config
+        if config.system_prompt:
+            raise ValueError("Llama2App does not support `system_prompt`")
         llm = Replicate(
             model="a16z-infra/llama13b-v2-chat:df7690f1994d94e96ad9d568eac121aecf50684a0b0963b25a41cc40061269e5",
             input={"temperature": 0.75, "max_length": 500, "top_p": 1},

View File

@@ -55,6 +55,9 @@ class OpenSourceApp(EmbedChain):
                 "OpenSourceApp does not support switching models at runtime. Please create a new app instance."
             )
+        if config.system_prompt:
+            raise ValueError("OpenSourceApp does not support `system_prompt`")
         response = self.instance.generate(
             prompt=prompt,
             streaming=config.stream,
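
Llama2App and OpenSourceApp reject the new option instead of silently ignoring it. A hedged sketch of what a caller should expect; the import path is assumed, and constructor requirements (a local GPT4All model for OpenSourceApp, a Replicate token for Llama2App) are glossed over:

```python
from embedchain import OpenSourceApp  # assumed export
from embedchain.config import ChatConfig

app = OpenSourceApp()  # loads a local model; setup details omitted
try:
    app.chat("Hello", ChatConfig(system_prompt="Answer briefly."))
except ValueError as err:
    print(err)  # OpenSourceApp does not support `system_prompt`
```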

View File

@@ -1,4 +1,5 @@
 from string import Template
+from typing import Optional
 from embedchain.config.QueryConfig import QueryConfig
@@ -34,6 +35,7 @@ class ChatConfig(QueryConfig):
         top_p=None,
         stream: bool = False,
         deployment_name=None,
+        system_prompt: Optional[str] = None,
     ):
         """
         Initializes the ChatConfig instance.
@@ -51,6 +53,8 @@ class ChatConfig(QueryConfig):
         (closer to 1) make word selection more diverse, lower values make words less
         diverse.
         :param stream: Optional. Control if response is streamed back to the user
+        :param deployment_name: t.b.a.
+        :param system_prompt: Optional. System prompt string.
         :raises ValueError: If the template is not valid as template should contain
         $context and $query and $history
         """
@@ -70,6 +74,7 @@ class ChatConfig(QueryConfig):
             history=[0],
             stream=stream,
             deployment_name=deployment_name,
+            system_prompt=system_prompt,
         )
     def set_history(self, history):
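
A minimal construction sketch; `ChatConfig` only forwards the new keyword to the `QueryConfig` base class shown in the next file:

```python
from embedchain.config import ChatConfig

config = ChatConfig(system_prompt="You are a polite support agent.")
print(config.system_prompt)  # stored by QueryConfig.__init__ (next file)
```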

View File

@@ -1,5 +1,6 @@
 import re
 from string import Template
+from typing import Optional
 from embedchain.config.BaseConfig import BaseConfig
@@ -63,6 +64,7 @@ class QueryConfig(BaseConfig):
         history=None,
         stream: bool = False,
         deployment_name=None,
+        system_prompt: Optional[str] = None,
     ):
         """
         Initializes the QueryConfig instance.
@@ -81,6 +83,8 @@ class QueryConfig(BaseConfig):
         diverse.
         :param history: Optional. A list of strings to consider as history.
         :param stream: Optional. Control if response is streamed back to user
+        :param deployment_name: t.b.a.
+        :param system_prompt: Optional. System prompt string.
         :raises ValueError: If the template is not valid as template should
         contain $context and $query (and optionally $history).
         """
@@ -108,6 +112,7 @@ class QueryConfig(BaseConfig):
         self.model = model
         self.top_p = top_p if top_p else 1
         self.deployment_name = deployment_name
+        self.system_prompt = system_prompt
         if self.validate_template(template):
             self.template = template
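
The option also lands on `QueryConfig`, so it should be usable for one-off queries as well; `App.query(prompt, config)` is assumed from the existing embedchain API and is not part of this diff:

```python
from embedchain import App
from embedchain.config import QueryConfig

app = App()  # assumes OPENAI_API_KEY is set
config = QueryConfig(system_prompt="Answer only from the indexed documents.")
# answer = app.query("Summarize the onboarding guide.", config)
```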