add example: HF -> OpenAI -> HF -> analyze

shcheklein · shcheklein · commit 8c34b87aea22 · 2024-10-31T16:45:30.000-07:00
diff --git a/examples/llm_and_nlp/hf-dataset-llm-eval.py b/examples/llm_and_nlp/hf-dataset-llm-eval.py
@@ -0,0 +1,65 @@
+import os
+
+from dotenv import load_dotenv
+from openai import OpenAI
+
+from datachain import C, DataChain, DataModel
+
+PROMPT = """
+Was this dialog successful? Put result as a single word: Success or Failure.
+Explain the reason in a few words.
+"""
+
+load_dotenv(".env.test")  # presumably supplies HF_API_TOKEN and the OpenAI key; confirm
+
+
+class DialogEval(DataModel):  # structured verdict produced by eval_dialog
+    result: str  # one-word verdict; PROMPT asks for "Success" or "Failure"
+    reason: str  # brief explanation of the verdict
+
+
+def eval_dialog(user_input: str, bot_response: str) -> DialogEval:
+    """Ask the OpenAI model whether one user/bot exchange was successful.
+
+    Sends PROMPT plus the exchange as a single user message and requests a
+    reply parsed into DialogEval. If nothing was parsed, returns a DialogEval
+    with result "Error" whose reason is the model's refusal text when present.
+    """
+    dialog = f"{PROMPT}\n\nUser: {user_input}\nBot: {bot_response}"
+    completion = OpenAI().beta.chat.completions.parse(
+        model="gpt-4o-2024-08-06",
+        messages=[{"role": "user", "content": dialog}],
+        response_format=DialogEval,
+    )
+    message = completion.choices[0].message
+    if message.parsed:
+        return message.parsed
+    # Keep the model's refusal text, if any, instead of a generic message.
+    reason = message.refusal or "Failed to parse response."
+    return DialogEval(result="Error", reason=reason)
+
+
+# Load the dialogs to grade from a CSV hosted on Hugging Face.
+dialogs = DataChain.from_csv(
+    "hf://datasets/infinite-dataset-hub/MobilePlanAssistant/data.csv"
+)
+# Run eval_dialog over the rows with parallel=10; each DialogEval it returns
+# is a Pydantic model that DataChain can understand and serialize.
+graded = dialogs.settings(parallel=10).map(response=eval_dialog)
+
+# Save the graded rows back to Hugging Face as CSV.
+hf_auth = {"token": os.environ["HF_API_TOKEN"]}
+graded.to_csv(
+    "hf://datasets/dvcorg/test-datachain-llm-eval/data.csv",
+    fs_kwargs=hf_auth,
+)
+
+# Read the saved CSV back to filter and show.
+saved = DataChain.from_csv(
+    "hf://datasets/dvcorg/test-datachain-llm-eval/data.csv",
+    # Explicit type for this column: read it as a string.
+    column_types={"source.file.location": "str"},
+)
+# Keep only the dialogs judged "Failure" and show 3 of them.
+failures = saved.filter(C("response_result") == "Failure")
+failures.show(3)