 from __future__ import annotations

 from typing import TYPE_CHECKING, Any, Callable, Optional, cast
+import asyncio

 from cleanlab_tlm import TrustworthyRAG
 from pydantic import BaseModel, Field, field_validator
@@ -138,10 +139,14 @@ def validate(
             - 'is_bad_response': True if the response is flagged as potentially bad (when True, a lookup in Codex is performed), False otherwise.
             - Additional keys: Various keys from a [`ThresholdedTrustworthyRAGScore`](/cleanlab_codex/types/validator/#class-thresholdedtrustworthyragscore) dictionary, with raw scores from [TrustworthyRAG](/tlm/api/python/utils.rag/#class-trustworthyrag) for each evaluation metric, plus an `is_bad` flag indicating whether that score falls below its threshold.
         """
         scores, is_bad_response = self.detect(query, context, response, prompt, form_prompt)
-        expert_answer = None
         if is_bad_response:
-            expert_answer = self.remediate(query)
+            # Run the read-only async Codex lookup to completion from this synchronous method.
+            expert_answer, maybe_entry = asyncio.run(self.remediate_async(query))
+            if expert_answer is None:
+                # No expert answer is available yet; log the question so an expert can answer it.
+                self._project.add_entries([maybe_entry])
+        else:
+            expert_answer = None

         return {
             "expert_answer": expert_answer,
@@ -198,3 +203,7 @@ def remediate(self, query: str) -> str | None:
         """
         codex_answer, _ = self._project.query(question=query)
         return codex_answer
+
+    async def remediate_async(self, query: str) -> tuple[str | None, Any]:
+        # Read-only lookup: fetch any existing expert answer without logging the question to the project.
+        codex_answer, entry = self._project.query(question=query, read_only=True)
+        return codex_answer, entry
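
For context, a minimal sketch of how the updated `validate` flow might be called from application code. The import path and the `codex_access_key` constructor argument are assumptions for illustration; they are not shown in this diff:

    from cleanlab_codex.validator import Validator  # import path assumed for illustration

    validator = Validator(codex_access_key="...")  # hypothetical constructor argument

    retrieved_context = "..."  # chunks retrieved by your RAG pipeline
    draft_response = "..."     # the LLM's draft answer

    result = validator.validate(
        query="How do I cancel my subscription?",
        context=retrieved_context,
        response=draft_response,
    )

    # Serve the expert answer from Codex when the draft was flagged and an answer exists.
    if result["is_bad_response"] and result["expert_answer"] is not None:
        final_response = result["expert_answer"]
    else:
        final_response = draft_response

Because `remediate_async` queries Codex with `read_only=True`, a question is only logged to the project (via `add_entries`) when detection flags the response and no expert answer exists yet; queries whose responses pass validation leave no entries behind.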
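
The change as written still runs detection and the Codex lookup sequentially. If genuine overlap between the two blocking calls is desired, one option is to offload both to worker threads; this is a minimal sketch only, assuming Python 3.9+ for `asyncio.to_thread`, and the method name `_detect_and_remediate` is hypothetical:

    async def _detect_and_remediate(self, query, context, response, prompt=None, form_prompt=None):
        # Run blocking detection and the blocking read-only Codex lookup in worker threads so they overlap.
        detect_future = asyncio.to_thread(self.detect, query, context, response, prompt, form_prompt)
        lookup_future = asyncio.to_thread(self._project.query, question=query, read_only=True)
        (scores, is_bad_response), (expert_answer, maybe_entry) = await asyncio.gather(detect_future, lookup_future)
        return scores, is_bad_response, expert_answer, maybe_entry

`validate` could then call `asyncio.run(self._detect_and_remediate(...))` and keep the remaining logic (adding an entry only when the response is bad and no expert answer exists) unchanged.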