Add label matching to OpenAIChatRuntime and an only_errors option to RAGSkill

nik · nik · commit e73e317d33ca · 2023-11-30T09:20:00.000Z
diff --git a/adala/runtimes/_openai.py b/adala/runtimes/_openai.py
@@ -1,4 +1,5 @@
 import os
+import difflib
 from rich import print
 
 from typing import Optional, Dict, Any, List
@@ -32,9 +33,9 @@ def check_if_new_openai_version():
 from tenacity import retry, stop_after_attempt, wait_random
 
 
-@retry(wait=wait_random(min=5, max=10), stop=stop_after_attempt(6))
+@retry(wait=wait_random(min=5, max=10), stop=stop_after_attempt(3))
 def chat_completion_call(model, messages):
-    return openai.ChatCompletion.create(model=model, messages=messages)
+    return openai.ChatCompletion.create(model=model, messages=messages, timeout=120, request_timeout=120)
 
 
 class OpenAIChatRuntime(Runtime):
@@ -158,8 +159,27 @@ def record_to_record(
             ]
 
         completion_text = self.execute(messages)
+
+        field_schema = field_schema or {}
+        if output_field_name in field_schema and field_schema[output_field_name]["type"] == "array":
+            # expected output is one item from the array
+            expected_items = field_schema[output_field_name]['items']['enum']
+            completion_text = self._match_items(completion_text, expected_items)
+
         return {output_field_name: completion_text}
 
+    def _match_items(self, query: str, items: List[str]) -> str:
+        """Return the entry of `items` that best matches `query`."""
+        def similarity(candidate: str) -> float:
+            # difflib ratio between the whole query and a single candidate
+            return difflib.SequenceMatcher(None, query, candidate).ratio()
+        # hard constraint: prefer the items that occur verbatim in the query
+        verbatim = [candidate for candidate in items if candidate in query]
+        # best guess: when nothing occurs verbatim, every item stays a candidate
+        candidates = verbatim or items
+        # soft constraint: most similar candidate; ties go to the earliest one
+        return max(candidates, key=similarity)
+
 
 class OpenAIVisionRuntime(OpenAIChatRuntime):
     """
diff --git a/adala/skills/collection/rag.py b/adala/skills/collection/rag.py
@@ -46,6 +46,7 @@ class RAGSkill(TransformSkill):
     output_template: str = "{rag}"
     num_results: int = 1
     memory: Memory = None
+    only_errors: bool = True
 
     @model_validator(mode="after")
     def init_memory(self):
@@ -119,13 +120,16 @@ def improve(
             runtime: Runtime to use for generation (not used).
         """
 
-        error_indices = feedback.match[
-            (feedback.match.fillna(True) == False).any(axis=1)
-        ].index
-        inputs = predictions.loc[error_indices]
+        if self.only_errors:
+            indices = feedback.match[
+                (feedback.match.fillna(True) == False).any(axis=1)
+            ].index
+        else:
+            indices = feedback.match.index
+        inputs = predictions.loc[indices]
         input_strings = inputs.apply(
             lambda r: self.input_template.format(**r), axis=1
         ).tolist()
-        fb = feedback.feedback.loc[error_indices].rename(columns=lambda c: f"{c}__fb")
+        fb = feedback.feedback.loc[indices].rename(columns=lambda c: f"{c}__fb")
         inputs = inputs.join(fb)
         self.memory.remember_many(input_strings, inputs.to_dict(orient="records"))