
Merge pull request #921 from parea-ai/datasets-updates
Datasets updates
jalexanderII committed Jun 4, 2024
2 parents b2d628d + 0195e3b commit 493c2ba
Showing 5 changed files with 111 additions and 7 deletions.
10 changes: 6 additions & 4 deletions parea/client.py
@@ -304,19 +304,21 @@ def _create_or_get_project(self, name: str) -> CreateGetProjectResponseSchema:
         )
         return structure(r.json(), CreateGetProjectResponseSchema)

-    def get_collection(self, test_collection_identifier: Union[str, int]) -> TestCaseCollection:
+    def get_collection(self, test_collection_identifier: Union[str, int]) -> Optional[TestCaseCollection]:
         r = self._client.request(
             "GET",
             GET_COLLECTION_ENDPOINT.format(test_collection_identifier=test_collection_identifier),
         )
-        return structure(r.json(), TestCaseCollection)
+        collection = r.json()
+        return structure(collection, TestCaseCollection) if collection else None

-    async def aget_collection(self, test_collection_identifier: Union[str, int]) -> TestCaseCollection:
+    async def aget_collection(self, test_collection_identifier: Union[str, int]) -> Optional[TestCaseCollection]:
         r = await self._client.request_async(
             "GET",
             GET_COLLECTION_ENDPOINT.format(test_collection_identifier=test_collection_identifier),
         )
-        return structure(r.json(), TestCaseCollection)
+        collection = r.json()
+        return structure(collection, TestCaseCollection) if collection else None

     def create_test_collection(self, data: List[Dict[str, Any]], name: Optional[str] = None) -> None:
         request: CreateTestCaseCollection = create_test_collection(data, name)
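With this change, get_collection and aget_collection return None when the endpoint responds with an empty body instead of failing while structuring it. A minimal usage sketch (the collection name here is illustrative, not from this commit):

    from parea import Parea

    p = Parea(api_key="...")
    collection = p.get_collection("my_collection")  # hypothetical collection name
    if collection is None:
        print("collection does not exist yet")
    else:
        test_cases = list(collection.test_cases.values())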
102 changes: 102 additions & 0 deletions parea/cookbook/parea_llm_proxy/dynamic_few_shot_injection.py
@@ -0,0 +1,102 @@
from typing import List, Optional

import os
import random
from datetime import datetime

from dotenv import load_dotenv
from pydantic import BaseModel

from parea import Parea, trace, trace_insert
from parea.schemas import Completion, CompletionResponse, FeedbackRequest, LLMInputs, Message, Role, TestCase

load_dotenv()

p = Parea(api_key=os.getenv("PAREA_API_KEY"))

NUM_INTERACTIONS = 5


class Person(BaseModel):
    name: str
    email: str


class Email(BaseModel):
    contact: Person
    email_sent: str


mock_DB: dict[str, Email] = {}


def call_llm(messages: List[Message]) -> CompletionResponse:
    return p.completion(Completion(llm_configuration=LLMInputs(model="gpt-4o", messages=messages)))


# Imitate collecting few-shot examples from production based on user feedback
@trace
def email_writer(main_objective: str, contact: Person, few_shot_examples: Optional[List[str]] = None) -> str:
    trace_insert({"end_user_identifier": contact.name, "metadata": {"has_few_shot_examples": bool(few_shot_examples)}})

    few_shot_examples_prompt = ("\nHere are some examples of good emails\n" + "\n".join(few_shot_examples)) if few_shot_examples else ""
    messages = [
        Message(
            role=Role.system,
            content=f"You are an AI who performs an email writing task based on the following objective: {main_objective}",
        ),
        # the date is added to the prompt to avoid caching
        Message(
            role=Role.user,
            content=f"""
Your email is from: {contact.model_dump()}
Today's date is: {datetime.now().isoformat()}
{few_shot_examples_prompt if few_shot_examples else ""}
Email:
""",
        ),
    ]
    response: CompletionResponse = call_llm(messages)
    trace_id = response.inference_id
    # store the sent email in the mock DB, keyed by trace id
    mock_DB[trace_id] = Email(contact=contact, email_sent=response.content)
    return response.content


def mimic_prod(few_shot_limit: int = 3):
    contact = Person(name="John Doe", email="[email protected]")
    dataset = p.get_collection("Good_Email_Examples")
    selected_few_shot_examples = None
    if dataset:
        testcases: list[TestCase] = list(dataset.test_cases.values())
        few_shot_examples = [case.inputs["email"] for case in testcases if case.inputs["user"] == contact.name]
        # This simply takes the most recent n examples. You can imagine adding logic
        # that ranks the examples in the dataset based on some criteria.
        selected_few_shot_examples = few_shot_examples[-few_shot_limit:] if few_shot_examples else None
    for _ in range(NUM_INTERACTIONS):
        email = email_writer("Convincing email to gym to cancel membership early.", contact, selected_few_shot_examples)
        print(email)


def add_good_email_example_to_dataset(user_name, email):
    # Note: if the test case collection doesn't exist, a new collection is created with the provided name and data
    p.add_test_cases([{"user": user_name, "email": email}], name="Good_Email_Examples")


def mimic_prod_feedback_collection():
    # Imagine the trace_id of each email is stored in UI state, so when the user provides feedback we can use it
    trace_ids = mock_DB.keys()
    for trace_id in trace_ids:
        score = random.uniform(0, 1)
        p.record_feedback(FeedbackRequest(trace_id=trace_id, score=score))
        # if the feedback is good, add the email to the dataset to use later as a few-shot example
        if score >= 0.5:
            add_good_email_example_to_dataset(mock_DB[trace_id].contact.name, mock_DB[trace_id].email_sent)


if __name__ == "__main__":
    mimic_prod()
    mimic_prod_feedback_collection()
    # future LLM calls will now include few-shot examples drawn from the feedback collection
    mimic_prod()
    print("Done")
2 changes: 1 addition & 1 deletion parea/cookbook/use_dataset_for_finetuning.py
@@ -8,6 +8,6 @@

 p = Parea(api_key=os.getenv("PAREA_API_KEY"))

-dataset = p.get_collection(DATASET_ID)  # Replace DATASET_ID with the actual dataset ID
+dataset = p.get_collection("DATASET_ID")  # Replace DATASET_ID with the actual dataset ID

 dataset.write_to_finetune_jsonl("finetune.jsonl")
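Because get_collection now returns Optional[TestCaseCollection] (see parea/client.py above), a defensive version of this snippet would guard against a missing dataset before writing:

    dataset = p.get_collection("DATASET_ID")  # Replace DATASET_ID with the actual dataset name or numeric ID
    if dataset is not None:
        dataset.write_to_finetune_jsonl("finetune.jsonl")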
2 changes: 1 addition & 1 deletion parea/schemas/log.py
@@ -48,7 +48,7 @@ class LLMInputs:

     model: Optional[str] = None
     provider: Optional[str] = None
-    model_params: Optional[ModelParams] = None
+    model_params: Optional[ModelParams] = ModelParams()
     messages: Optional[List[Message]] = None
     functions: Optional[List[Any]] = None
     function_call: Optional[Union[str, Dict[str, str]]] = None
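With model_params now defaulting to a ModelParams() instance rather than None, code that reads parameter fields off an LLMInputs no longer needs a None guard. A minimal sketch:

    from parea.schemas import LLMInputs

    inputs = LLMInputs(model="gpt-4o")
    # model_params defaults to a ModelParams instance now, not None,
    # so attribute access is safe without a guard:
    print(inputs.model_params)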
2 changes: 1 addition & 1 deletion pyproject.toml
@@ -6,7 +6,7 @@ build-backend = "poetry.core.masonry.api"
 [tool.poetry]
 name = "parea-ai"
 packages = [{ include = "parea" }]
-version = "0.2.164"
+version = "0.2.165"
 description = "Parea python sdk"
 readme = "README.md"
 authors = ["joel-parea-ai <[email protected]>"]
