feat: Add DynamicPromptBuilder to Haystack 2.x #6328
Changes from 11 commits
@@ -1,4 +1,5 @@
 from haystack.preview.components.builders.answer_builder import AnswerBuilder
 from haystack.preview.components.builders.prompt_builder import PromptBuilder
+from haystack.preview.components.builders.dynamic_prompt_builder import DynamicPromptBuilder

-__all__ = ["AnswerBuilder", "PromptBuilder"]
+__all__ = ["AnswerBuilder", "PromptBuilder", "DynamicPromptBuilder"]
@@ -0,0 +1,334 @@
import logging
from typing import Dict, Any, Optional, List, Union, Set

from jinja2 import Template, meta

from haystack.preview import component
from haystack.preview import default_to_dict
from haystack.preview.dataclasses.chat_message import ChatMessage, ChatRole

logger = logging.getLogger(__name__)


@component
class DynamicPromptBuilder:
""" | ||
DynamicPromptBuilder is designed to construct dynamic prompts by processing either a list of `ChatMessage` | ||
instances or a string template. It integrates with Jinja2 templating for dynamic prompt generation. | ||
|
||
In the case of `ChatMessage` instances, DynamicPromptBuilder assumes the last user message in the list as a | ||
template and renders it with resolved pipeline variables and any additional template variables provided. For a | ||
string template, it applies the template variables directly to render the final prompt. This dual functionality | ||
allows DynamicPromptBuilder to be versatile in handling different types of prompt sources, making it suitable for | ||
both chat-based and non-chat-based prompt generation scenarios. | ||
|
||
You can provide additional template variables directly to the pipeline `run` method. They are then merged with the | ||
variables resolved from the pipeline runtime. This allows for greater flexibility and customization of the | ||
generated prompts based on runtime conditions and user inputs. | ||
|
||
The following example demonstrates how to use DynamicPromptBuilder to generate a chat prompt: | ||
|
||
```python | ||
from haystack.preview.components.builders import DynamicPromptBuilder | ||
from haystack.preview.components.generators.chat import GPTChatGenerator | ||
from haystack.preview.dataclasses import ChatMessage | ||
from haystack.preview import Pipeline | ||
|
||
# no parameter init, we don't use any runtime template variables | ||
prompt_builder = DynamicPromptBuilder() | ||
llm = GPTChatGenerator(api_key="<your-api-key>", model_name="gpt-3.5-turbo") | ||
|
||
pipe = Pipeline() | ||
pipe.add_component("prompt_builder", prompt_builder) | ||
pipe.add_component("llm", llm) | ||
pipe.connect("prompt_builder.prompt", "llm.messages") | ||
|
||
location = "Berlin" | ||
messages = [ChatMessage.from_system("Always respond in German even if some input data is in other languages."), | ||
ChatMessage.from_user("Tell me about {{location}}")] | ||
|
||
|
||
pipe.run(data={"prompt_builder": {"template_variables":{"location": location}, "prompt_source": messages}}) | ||
|
||
>> {'llm': {'replies': [ChatMessage(content='Berlin ist die Hauptstadt Deutschlands und die größte Stadt des Landes. | ||
>> Es ist eine lebhafte Metropole, die für ihre Geschichte, Kultur und einzigartigen Sehenswürdigkeiten bekannt ist. | ||
>> Berlin bietet eine vielfältige Kulturszene, beeindruckende architektonische Meisterwerke wie den Berliner Dom | ||
>> und das Brandenburger Tor, sowie weltberühmte Museen wie das Pergamonmuseum. Die Stadt hat auch eine pulsierende | ||
>> Clubszene und ist für ihr aufregendes Nachtleben berühmt. Berlin ist ein Schmelztiegel verschiedener Kulturen und | ||
>> zieht jedes Jahr Millionen von Touristen an.', role=<ChatRole.ASSISTANT: 'assistant'>, name=None, | ||
>> metadata={'model': 'gpt-3.5-turbo-0613', 'index': 0, 'finish_reason': 'stop', 'usage': {'prompt_tokens': 32, | ||
>> 'completion_tokens': 153, 'total_tokens': 185}})]}} | ||
``` | ||
|
||
    The following example demonstrates how to use DynamicPromptBuilder to generate a chat prompt with resolution
    of pipeline runtime variables (such as documents):

    ```python
    from haystack.preview.components.builders import DynamicPromptBuilder
    from haystack.preview.components.generators.chat import GPTChatGenerator
    from haystack.preview.dataclasses import ChatMessage, Document
    from haystack.preview import Pipeline, component
    from typing import List

    # we'll use the documents runtime variable in our template, so we need to declare it in the init
    prompt_builder = DynamicPromptBuilder(expected_runtime_variables=["documents"])
    llm = GPTChatGenerator(api_key="<your-api-key>", model_name="gpt-3.5-turbo")


    @component
    class DocumentProducer:

        @component.output_types(documents=List[Document])
        def run(self, doc_input: str):
            return {"documents": [Document(content=doc_input)]}


    pipe = Pipeline()
    pipe.add_component("doc_producer", DocumentProducer())
    pipe.add_component("prompt_builder", prompt_builder)
    pipe.add_component("llm", llm)

    # note how prompt_builder.documents receives its value from doc_producer.documents
    pipe.connect("doc_producer.documents", "prompt_builder.documents")
    pipe.connect("prompt_builder.prompt", "llm.messages")

    messages = [ChatMessage.from_system("Be a helpful assistant, but brief!"),
                ChatMessage.from_user("Here is the document: {{documents[0].content}} "
                                      "Now, answer the following: {{query}}")]

    pipe.run(data={"doc_producer": {"doc_input": "Hello world, I'm Haystack!"},
                   "prompt_builder": {"prompt_source": messages,
                                      "template_variables": {"query": "who's making a greeting?"}}})

    >> {'llm': {'replies': [ChatMessage(content='Haystack', role=<ChatRole.ASSISTANT: 'assistant'>, name=None,
    >> metadata={'model': 'gpt-3.5-turbo-0613', 'index': 0, 'finish_reason': 'stop', 'usage':
    >> {'prompt_tokens': 51, 'completion_tokens': 2, 'total_tokens': 53}})]}}
    ```
    Similarly to chat prompt generation, you can use DynamicPromptBuilder to generate non-chat-based prompts.
    The following example demonstrates how to use DynamicPromptBuilder to generate a non-chat prompt:

    ```python
    # imports as in the previous example, but with GPTGenerator instead of GPTChatGenerator
    prompt_builder = DynamicPromptBuilder(expected_runtime_variables=["documents"], chat_mode=False)
    llm = GPTGenerator(api_key="<your-api-key>", model_name="gpt-3.5-turbo")


    @component
    class DocumentProducer:

        @component.output_types(documents=List[Document])
        def run(self, doc_input: str):
            return {"documents": [Document(content=doc_input)]}


    pipe = Pipeline()
    pipe.add_component("doc_producer", DocumentProducer())
    pipe.add_component("prompt_builder", prompt_builder)
    pipe.add_component("llm", llm)
    pipe.connect("doc_producer.documents", "prompt_builder.documents")
    pipe.connect("prompt_builder.prompt", "llm.prompt")

    template = "Here is the document: {{documents[0].content}} \n Answer: {{query}}"
    pipe.run(data={"doc_producer": {"doc_input": "Hello world, I live in Berlin"},
                   "prompt_builder": {"prompt_source": template,
                                      "template_variables": {"query": "Where does the speaker live?"}}})

    >> {'llm': {'replies': ['The speaker lives in Berlin.'],
    >> 'metadata': [{'model': 'gpt-3.5-turbo-0613',
    >> 'index': 0,
    >> 'finish_reason': 'stop',
    >> 'usage': {'prompt_tokens': 28,
    >> 'completion_tokens': 6,
    >> 'total_tokens': 34}}]}}
    ```
    """
    def __init__(self, expected_runtime_variables: Optional[List[str]] = None, chat_mode: bool = True):
        """
        Initializes DynamicPromptBuilder with the provided variable names. These variable names are used to resolve
        variables and their values during pipeline runtime execution. Depending on the components connected to
        DynamicPromptBuilder in the pipeline, these variable names can differ. For example, if a component
        connected to DynamicPromptBuilder has an output named `documents`, then `expected_runtime_variables` should
        contain `documents` as one of its values. The values associated with variables from the pipeline runtime are
> Review comment: This part sounds really strange to me. It seems to imply that the names of the variables in the
> template must be identical to the output names of the sender components.
>
> Reply: No, hmm, how would you phrase it?
>
> Reply: Something like this, maybe. I would probably remove this part too; the name of the input really doesn't
> depend on the connected components.
        then injected into template placeholders of either a ChatMessage or a string template that is provided to
        the `run` method. See the `run` method for more details.

        :param expected_runtime_variables: A list of template variable names you can use in prompt construction.
        :type expected_runtime_variables: Optional[List[str]]
        :param chat_mode: A boolean flag indicating whether the prompt is being built for chat-based prompt
        templating. Defaults to True.
        :type chat_mode: bool
        """
        expected_runtime_variables = expected_runtime_variables or []
        if not expected_runtime_variables:
            logger.warning(
                "expected_runtime_variables were not provided; DynamicPromptBuilder will not resolve any "
                "pipeline variables."
            )
        # set up inputs
        if chat_mode:
            run_input_slots = {"prompt_source": List[ChatMessage], "template_variables": Optional[Dict[str, Any]]}
        else:
            run_input_slots = {"prompt_source": str, "template_variables": Optional[Dict[str, Any]]}

        kwargs_input_slots = {var: Optional[Any] for var in expected_runtime_variables}
        component.set_input_types(self, **run_input_slots, **kwargs_input_slots)

        # set up outputs
        if chat_mode:
            component.set_output_types(self, prompt=List[ChatMessage])
        else:
            component.set_output_types(self, prompt=str)

        self.expected_runtime_variables = expected_runtime_variables
        self.chat_mode = chat_mode
    def to_dict(self) -> Dict[str, Any]:
        """
        Converts the `DynamicPromptBuilder` instance to a dictionary format, primarily for serialization purposes.

        :return: A dictionary representation of the `DynamicPromptBuilder` instance, including its template variables.
        :rtype: Dict[str, Any]
        """
        return default_to_dict(
            self, expected_runtime_variables=self.expected_runtime_variables, chat_mode=self.chat_mode
        )
    def run(
        self,
        prompt_source: Union[List[ChatMessage], str],
        template_variables: Optional[Dict[str, Any]] = None,
        **kwargs,
    ):
        """
        Executes the dynamic prompt building process. Depending on the type of `prompt_source`, this method
        either processes a list of `ChatMessage` instances or a string template. In the case of `ChatMessage`
        instances, the last user message is treated as a template and rendered with the resolved pipeline variables
        and any additional template variables provided. For a string template, the template variables are applied
        directly to render the final prompt. You can provide additional template variables directly to this method;
        they are then merged with the variables resolved from the pipeline runtime.

        :param prompt_source: A list of `ChatMessage` instances or a string template. The list scenario treats the
        last user message as the template for the chat prompt, while the string scenario is used for non-chat-based
        prompts.
        :type prompt_source: Union[List[ChatMessage], str]

        :param template_variables: An optional dictionary of template variables. Template variables provided at
        initialization are required to resolve pipeline variables; these are additional variables users can
        provide directly to this method.
        :type template_variables: Optional[Dict[str, Any]]

        :param kwargs: Additional keyword arguments, typically resolved from a pipeline, which are merged with the
        provided template variables.

        :return: A dictionary containing the key "prompt", which holds either the updated list of `ChatMessage`
        instances or the rendered string template, forming the complete dynamic prompt.
        :rtype: Dict[str, Union[List[ChatMessage], str]]
        """
        template_variables_combined = (
            {**(kwargs or {}), **(template_variables or {})} if (template_variables or kwargs) else {}
        )
        if not template_variables_combined:
            raise ValueError(
                "The DynamicPromptBuilder run method requires template variables, but none were provided. "
                "Please provide appropriate template variables to enable prompt generation."
            )
        # some of these checks are superfluous because the pipeline will check them as well, but let's
        # handle them anyway for better error messages and robustness
        result: Union[List[ChatMessage], str]
        if isinstance(prompt_source, str):
            result = self._process_simple_template(prompt_source, template_variables_combined)
        elif isinstance(prompt_source, list):
            result = self._process_chat_messages(prompt_source, template_variables_combined)
        else:
            raise ValueError(
                f"{self.__class__.__name__} was not provided with a list of ChatMessage(s) or a string template. "
                "Please check the parameters passed to its run method."
            )
        return {"prompt": result}
    def _process_simple_template(self, prompt_source: str, template_variables: Dict[str, Any]) -> str:
        """
        Renders the template from the provided string source with the provided template variables.

        :param prompt_source: A Jinja2 template as a string.
        :type prompt_source: str
        :param template_variables: A dictionary of template variables.
        :type template_variables: Dict[str, Any]
        :return: A string containing the rendered template.
        :rtype: str
        """
        template = self._validate_template(prompt_source, set(template_variables.keys()))
        return template.render(template_variables)
    def _process_chat_messages(self, prompt_source: List[ChatMessage], template_variables: Dict[str, Any]):
        """
        Processes a list of :class:`ChatMessage` instances to generate a chat prompt.

        It takes the last user message in the list, treats it as a template, and renders it with the provided
        template variables. The resulting message replaces the last user message in the list, forming a complete,
        templated chat prompt.

        :param prompt_source: A list of `ChatMessage` instances to be processed. The last message is expected
        to be from a user and is treated as a template.
        :type prompt_source: List[ChatMessage]

        :param template_variables: A dictionary of template variables used for rendering the last user message.
        :type template_variables: Dict[str, Any]

        :return: A list of `ChatMessage` instances, where the last user message has been replaced with its
        templated version.
        :rtype: List[ChatMessage]

        :raises ValueError: If `prompt_source` is empty or contains elements that are not instances of
        `ChatMessage`.
        """
        if not prompt_source:
            raise ValueError(
                f"The {self.__class__.__name__} requires a non-empty list of ChatMessage instances. "
                f"Please provide a valid list of ChatMessage instances to render the prompt."
            )
        if not all(isinstance(message, ChatMessage) for message in prompt_source):
            raise ValueError(
                f"The {self.__class__.__name__} expects a list containing only ChatMessage instances. "
                f"The provided list contains other types. Please ensure that all elements in the list "
                f"are ChatMessage instances."
            )

        last_message: ChatMessage = prompt_source[-1]
        if last_message.is_from(ChatRole.USER):
            template = self._validate_template(last_message.content, set(template_variables.keys()))
            templated_user_message = ChatMessage.from_user(template.render(template_variables))
            return prompt_source[:-1] + [templated_user_message]
        else:
            logger.warning(
                "DynamicPromptBuilder was not provided with a user message as the last message in the "
                "chat conversation; no templating will be applied."
            )
            return prompt_source
    def _validate_template(self, template_text: str, provided_variables: Set[str]):
        """
        Checks if all the template variables required by the template are provided to the pipeline `run` method.
        If all the required template variables are provided, returns a Jinja2 template object.
        Otherwise, raises a ValueError.

        :param template_text: A Jinja2 template as a string.
        :type template_text: str
        :param provided_variables: A set of provided template variables.
        :type provided_variables: Set[str]
        :return: A Jinja2 template object if all the required template variables are provided.
        :raises ValueError: If any required template variable is missing.
        """
        template = Template(template_text)
        ast = template.environment.parse(template_text)
        required_template_variables = meta.find_undeclared_variables(ast)
        filled_template_vars = required_template_variables.intersection(provided_variables)
        if len(filled_template_vars) != len(required_template_variables):
            raise ValueError(
                f"The {self.__class__.__name__} requires specific template variables that are missing. "
                f"Required variables: {required_template_variables}. Only the following variables were "
                f"provided: {provided_variables}. Please provide all the required template variables."
            )
        return template
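As a standalone illustration of the template-validation step in `_validate_template`, the following sketch shows how Jinja2's `meta.find_undeclared_variables` recovers the variables a template requires. It assumes `jinja2` is installed; `find_required_variables` is a hypothetical helper written for this example, not part of the PR.

```python
from jinja2 import Environment, meta


def find_required_variables(template_text: str) -> set:
    # Parse the template without rendering it and collect every
    # variable name the template references but does not define.
    env = Environment()
    ast = env.parse(template_text)
    return meta.find_undeclared_variables(ast)


required = find_required_variables("Tell me about {{location}} in {{language}}")
missing = required - {"location"}  # variables the caller failed to provide
print(sorted(required))  # ['language', 'location']
print(sorted(missing))   # ['language']
```

Comparing `required` against the caller-provided variable names, as the component does, lets the builder raise a precise error listing exactly which placeholders are unfilled instead of silently rendering an incomplete prompt.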
@@ -0,0 +1,5 @@
---
preview:
  - |
    Add `DynamicPromptBuilder` to dynamically generate prompts from either a list of ChatMessage instances or a string
    template, leveraging Jinja2 templating for flexible and efficient prompt construction.
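One detail of the `run` method worth noting: template variables passed directly to the method take precedence over pipeline-resolved `kwargs`, because they are unpacked last in the merge expression. A minimal, dependency-free sketch of that merge follows; the helper name `merge_template_variables` is illustrative, not part of the PR.

```python
from typing import Any, Dict, Optional


def merge_template_variables(
    pipeline_kwargs: Optional[Dict[str, Any]],
    template_variables: Optional[Dict[str, Any]],
) -> Dict[str, Any]:
    # Later unpacking wins: direct template_variables override any
    # pipeline-resolved values that share the same key.
    return {**(pipeline_kwargs or {}), **(template_variables or {})}


merged = merge_template_variables(
    {"documents": ["doc-1"], "query": "resolved from pipeline"},
    {"query": "provided by the user"},
)
print(merged["query"])  # provided by the user
```

This ordering means a user can always override a pipeline-resolved value at call time, which matches the docstring's promise that directly provided template variables are "merged with the variables resolved from the pipeline runtime".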
> Review comment: I would change `expected_runtime_variables` to just `runtime_variables`. It seems a bit redundant
> to prefix it with `expected_`, what do you think?
>
> Reply: I'm ok with both. IIRC, @masci and I talked about `expected_variables` or `expected_runtime_variables`;
> I didn't write it down, tbh.