From 632e477ad3ce3f3717235a65c6341fbeca5ed2e5 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?R=C3=A9mi=20Louf?= Date: Thu, 6 Apr 2023 09:57:20 +0200 Subject: [PATCH] Add a `model` to decorator to encapsulate calls to language models --- examples/meta_prompting.py | 109 ++++++++--------- outlines/program.py | 2 +- outlines/text/__init__.py | 3 +- outlines/text/models/__init__.py | 2 +- outlines/text/models/hugging_face.py | 2 +- outlines/text/models/language_model.py | 156 +++++++++++++++++++++++++ outlines/text/models/model.py | 52 --------- tests/text/test_model.py | 27 ++++- 8 files changed, 234 insertions(+), 119 deletions(-) create mode 100644 outlines/text/models/language_model.py delete mode 100644 outlines/text/models/model.py diff --git a/examples/meta_prompting.py b/examples/meta_prompting.py index 8723cbd01..3b2e5dc3a 100644 --- a/examples/meta_prompting.py +++ b/examples/meta_prompting.py @@ -12,48 +12,42 @@ import argparse import outlines -from outlines import compose -from outlines.text.models.openai import OpenAI +import outlines.text as text -def split_into_steps(question, model: str): - prompt = compose( - """ - ${question} +def split_into_steps(question, model_name: str): + @text.model(model_name) + def solve(question): + """${question} Let's solve this problem by splitting it into steps. - """, - question=question, - ) - answer = OpenAI(model)(prompt) + """ + + answer, prompt = solve(question) return prompt, answer -def fill_in_the_blanks(question, model: str): - meta_prompt = compose( - """ - ${question} +def fill_in_the_blanks(question, model_name: str): + @text.model(model_name, stops_at=["."]) + def determine_goal(question): + """${question} In order to solve this problem, we will analyze each of the options and determine - """, - question=question, - ) - goal = OpenAI(model, stops_at=["."])(meta_prompt) - - prompt = compose( """ - ${meta_prompt}${goal}. Let's begin. - """, - meta_prompt=meta_prompt, - goal=goal, - ) - answer = OpenAI(model)(prompt) - return prompt, answer + @text.model(model_name, stops_at=["."]) + def solve(memory): + """${memory}. Let's begin.""" + _, memory = determine_goal(question) + answer, full_interaction = solve(memory) -def ask_an_expert(question, model: str): - meta_prompt = compose( + return full_interaction, answer + + +def ask_an_expert(question, model_name: str): + @text.model(model_name, stops_at=['"']) + def find_expert(question): """ ${question} I entered my question into the Expert Generator @@ -68,48 +62,43 @@ def ask_an_expert(question, model: str): The Expert Generator beeped, indicating that it has found the most qualified expert. The name displayed on the screen: " - """, - question=question, - ) - expert = OpenAI(model, stops_at=['"'])(meta_prompt) + """ - prompt = compose( + @text.model(model_name) + def get_answer(question, expert, memory): """ - ${prompt}${expert}" + ${memory} I am ready to ask my question. 
"${expert}" I say, ${question} - """, - prompt=meta_prompt, - expert=expert, - question=question, - ) - answer = OpenAI(model)(prompt) - return prompt, answer + """ + expert, memory = find_expert(question) + answer, full_interaction = get_answer(question, expert, memory) -def ask_an_expert_simple(question, model: str): - meta_prompt = compose( + return full_interaction, answer + + +def ask_an_expert_simple(question, model_name: str): + @text.model(model_name, stops_at=["\n", "."]) + def find_expert(question): """ Q: ${question} A: A good person to answer this question would be - """, - question=question, - ) - expert = OpenAI(model, stops_at=["/n", "."])(meta_prompt) + """ - prompt = compose( + @text.model(model_name) + def get_answer(expert, memory): """ - ${meta_prompt}${expert}. + ${memory}. For instance,${expert} would answer - """, - meta_prompt=meta_prompt, - expert=expert, - ) - answer = OpenAI(model)(prompt) + """ - return prompt, answer + expert, memory = find_expert(question) + answer, full_interaction = get_answer(expert, memory) + + return full_interaction, answer def run_example(model_fn, question, model): @@ -117,7 +106,7 @@ def run_example(model_fn, question, model): question_s = outlines.text.string() fn = outlines.chain([question_s], model_fn(question_s, model)) prompt, answer = fn(question) - print(f"{prompt}{answer}") + print(f"{prompt}") if __name__ == "__main__": @@ -125,14 +114,13 @@ def run_example(model_fn, question, model): parser.add_argument( "--model", type=str, - default="text-davinci-001", + default="openai/text-davinci-001", help="The Large Language Model to use to run the examples.", ) args = parser.parse_args() math_q = "f(x) = x*x. What is f(f(3))?" - sat_q = compose( - """ + sat_q = """ Directions: In the following question, a related pair of words or phrases is followed by five pairs of words or phrases. Choose the pair @@ -146,7 +134,6 @@ def run_example(model_fn, question, model): E) CANDIDATE : AMBITION """ - ) alignment_q = "What should humankind do to ensure that artificial general intelligence is aligned?" meaning_q = "What is the meaning of life?" 
diff --git a/outlines/program.py b/outlines/program.py
index 9a7fab440..a3f2f7b86 100644
--- a/outlines/program.py
+++ b/outlines/program.py
@@ -10,7 +10,7 @@
 from rich.panel import Panel
 
 from outlines.graph import Variable, io_toposort
-from outlines.text.models.model import LanguageModel
+from outlines.text.models import LanguageModel
 from outlines.text.var import StringConstant
 
 COLORS = itertools.cycle(["deep_sky_blue2", "gold3", "deep_pink2"])
diff --git a/outlines/text/__init__.py b/outlines/text/__init__.py
index 63baf99af..2b057f03d 100644
--- a/outlines/text/__init__.py
+++ b/outlines/text/__init__.py
@@ -1,5 +1,6 @@
 from .basic import *
 from .compose import compose
+from .models import model
 from .var import as_string, string
 
-__all__ = ["as_string", "string", "compose"]
+__all__ = ["as_string", "model", "string", "compose"]
diff --git a/outlines/text/models/__init__.py b/outlines/text/models/__init__.py
index 43357b6b0..b75a091cf 100644
--- a/outlines/text/models/__init__.py
+++ b/outlines/text/models/__init__.py
@@ -1 +1 @@
-from .model import LanguageModel
+from .language_model import LanguageModel, model
diff --git a/outlines/text/models/hugging_face.py b/outlines/text/models/hugging_face.py
index 8c5d2cd3e..9425ae57f 100644
--- a/outlines/text/models/hugging_face.py
+++ b/outlines/text/models/hugging_face.py
@@ -1,4 +1,4 @@
-from outlines.text.models.model import LanguageModel
+from outlines.text.models.language_model import LanguageModel
 
 try:
     import torch
diff --git a/outlines/text/models/language_model.py b/outlines/text/models/language_model.py
new file mode 100644
index 000000000..40756d3d2
--- /dev/null
+++ b/outlines/text/models/language_model.py
@@ -0,0 +1,156 @@
+import inspect
+
+from outlines.graph import Apply, Op
+from outlines.text.compose import compose
+from outlines.text.var import StringVariable, as_string
+
+
+class LanguageModel(Op):
+    """An `Op` that produces a sample from a language model.
+
+    The output of language models in outlines is represented as a random
+    variable. Therefore, calling a language model will return a random sequence
+    (via ancestral sampling) by default. Other decoding methods are constructed
+    as graph transformations.
+
+    """
+
+    def __init__(self, name=None):
+        """Instantiate the `LanguageModel` `Op`.
+
+        Parameters
+        ----------
+        name
+            The name of the `Op` in the graph.
+
+        """
+        super().__init__()
+        self.name = name
+
+    def __call__(self, prompt, stops_at=None, name=None):
+        """Create the `Apply` node that represents the `Op`'s application to inputs.
+
+        Parameters
+        ----------
+        prompt
+            The prompt used to condition the language model's sampling procedure.
+        name
+            The name of the output variable in the graph.
+
+        """
+        res = super().__call__(prompt)
+
+        if name is not None:
+            res.name = name
+
+        return res
+
+    def make_node(self, prompt):
+        prompt = as_string(prompt)
+        out = StringVariable()
+
+        return Apply(self, [prompt], [out])
+
+    def perform(self, prompt):
+        raise NotImplementedError
+
+
+def model(name: str, stops_at=None):
+    """Decorator that simplifies calls to language models.
+
+    Prompts that are passed to language models are often rendered templates,
+    and the workflow typically looks like:
+
+    >>> import outlines
+    >>> from outlines.text.models.openai import OpenAI
+    >>>
+    >>> llm = OpenAI("davinci")
+    >>> tpl = "I have a ${question}"
+    >>> prompt = outlines.compose(tpl, question="How are you?")
+    >>> answer = llm(prompt)
+
+    While explicit, these four lines have the following drawbacks:
+
+    1. 
The prompt is hidden;
+    2. The language model is instantiated far from the prompt, even though a
+       prompt template is usually tied to a specific language model call;
+    3. The intent behind the language model call is hidden.
+
+    To encapsulate the logic behind language model calls, we thus define the
+    prompt template inside a function and decorate the function with a model
+    specification. When that function is called, the template is rendered using
+    the arguments passed to the function, and the rendered prompt is passed to
+    a language model instantiated with the arguments passed to the decorator.
+
+    The previous example is equivalent to the following:
+
+    >>> import outlines
+    >>>
+    >>> @outlines.text.model("openai/davinci")
+    ... def answer(question):
+    ...     "I have a ${question}"
+    ...
+    >>> answer, _ = answer("How are you?")
+
+    Decorated functions return two objects: the first represents the output of
+    the language model call, the second represents the concatenation of the
+    rendered prompt with the output of the language model call. The latter can
+    be used in contexts where one expands an initial prompt with recursive calls
+    to language models.
+
+    """
+    provider_name = name.split("/")[0]
+    model_name = name[len(provider_name) + 1 :]
+
+    if provider_name == "openai":
+        from outlines.text.models.openai import OpenAI
+
+        llm = OpenAI(model_name, stops_at)  # type:ignore
+    elif provider_name == "hf":
+        from outlines.text.models.hugging_face import HFCausalLM
+
+        llm = HFCausalLM(model_name)  # type:ignore
+    else:
+        raise NameError(f"The model provider {provider_name} is not available.")
+
+    def decorator(fn):
+        # Get the names of the parameters to the function, which must correspond
+        # to the variables defined in the template.
+        var_names = []
+        kwargs_data = {}
+        sig = inspect.signature(fn)
+        for parameter in sig.parameters.values():
+            if parameter.default == inspect._empty:
+                var_names.append(parameter.name)
+            else:
+                kwargs_data[parameter.name] = parameter.default
+
+        # The docstring contains the template that will be rendered to be used
+        # as a prompt to the language model.
+        template = inspect.cleandoc(fn.__doc__)
+
+        def wrapper(*args, **kwargs):
+            """Call the LLM with the rendered template.
+
+            Building prompts with recursive calls to language models is common
+            in prompt engineering, so we return both the raw answer from the
+            language model and the rendered prompt including the answer.
+
+            Returns
+            -------
+            A tuple that contains the result of the language model call, and the
+            rendered prompt concatenated with the result of the language model
+            call.
+
+            """
+            args_data = {name: arg for name, arg in zip(var_names, args)}
+            # Merge without mutating the decorator-level defaults across calls.
+            data = {**kwargs_data, **args_data, **kwargs}
+
+            prompt = compose(template, **data)
+            result = llm(prompt)
+            return result, prompt + result
+
+        return wrapper
+
+    return decorator
diff --git a/outlines/text/models/model.py b/outlines/text/models/model.py
deleted file mode 100644
index a48ed0755..000000000
--- a/outlines/text/models/model.py
+++ /dev/null
@@ -1,52 +0,0 @@
-from outlines.graph import Apply, Op
-from outlines.text.var import StringVariable, as_string
-
-
-class LanguageModel(Op):
-    """An `Op` that produces a sample from a language model.
-
-    The output of language models in outlines is represented as a random
-    variable. Therefore, calling a language model will return a random sequence
-    (via ancestral sampling) by default. Other decoding methods are constructed
-    as graph transformations.
-
-    """
-
-    def __init__(self, name=None):
-        """Instantiate the `LanguageModel` `Op`.
-
-        Parameters
-        ----------
-        name
-            The name of the `Op` in the graph.
-
-        """
-        super().__init__()
-        self.name = name
-
-    def __call__(self, prompt, stops_at=None, name=None):
-        """Create the `Apply` node that represents the `Op`'s application to inputs.
-
-        Parameters
-        ----------
-        prompt
-            The prompt used to condition the language model's sampling procedure.
-        name
-            The name of the output variable in the graph.
-
-        """
-        res = super().__call__(prompt)
-
-        if name is not None:
-            res.name = name
-
-        return res
-
-    def make_node(self, prompt):
-        prompt = as_string(prompt)
-        out = StringVariable()
-
-        return Apply(self, [prompt], [out])
-
-    def perform(self, prompt):
-        return NotImplementedError
diff --git a/tests/text/test_model.py b/tests/text/test_model.py
index 9b90e2da9..90a358731 100644
--- a/tests/text/test_model.py
+++ b/tests/text/test_model.py
@@ -1,8 +1,10 @@
+import pytest
+
 from outlines.text import string
-from outlines.text.models.model import LanguageModel
+from outlines.text.models.language_model import LanguageModel, model
 
 
-def test_initialize_model():
+def test_initialize_LanguageModel():
     llm = LanguageModel(name="llm")
 
     prompt = string()
@@ -10,3 +12,24 @@ def test_initialize_model():
     assert isinstance(out.owner.op, LanguageModel)
     assert out.owner.inputs[0] == prompt
     assert out.owner.op.name == "llm"
+
+
+def test_model_wrong_provider():
+    with pytest.raises(NameError, match="not available"):
+
+        @model("aa/model_name")
+        def test_function():
+            """"""
+
+
+@pytest.mark.skip
+def test_model():
+    @model("openai/text-davinci-001", stops_at=["."])
+    def test_function(question, type="bad"):
+        """You're a witty and sarcastic AI.
+
+        Tell me a ${type} ${question}.
+        Joke:
+        """
+
+    answer, prompt = test_function("joke", type="good")
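
As a usage sketch (not part of the patch): decorated functions compose with `outlines.chain` exactly like `run_example` in `examples/meta_prompting.py`. The `tell_a_joke`/`joke` names and the prompt text below are only illustrative, and the snippet assumes an OpenAI API key is configured so that the `openai/text-davinci-001` engine can be instantiated.

    import outlines
    import outlines.text as text


    def tell_a_joke(topic, model_name: str):
        # The decorated function renders its docstring template with `topic`
        # and returns (answer, prompt + answer) as symbolic string variables.
        @text.model(model_name, stops_at=["\n"])
        def joke(topic):
            """Tell me a joke about ${topic}.

            Joke:
            """

        answer, full_interaction = joke(topic)
        return full_interaction, answer


    # As in `run_example`, wrap the symbolic outputs in a chain to obtain a
    # callable program, then execute it on a concrete string.
    topic = text.string()
    fn = outlines.chain([topic], tell_a_joke(topic, "openai/text-davinci-001"))
    full_interaction, answer = fn("a programmer")
    print(full_interaction)

The `hf/` prefix dispatches to `HFCausalLM` in the same way, e.g. `@text.model("hf/gpt2")`.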