Merge pull request #7 from ittia-research/dev
Add DSPy pipeline
etwk authored Aug 13, 2024
2 parents 05c4c1e + ba2ad67 commit a9bd755
Showing 14 changed files with 457 additions and 251 deletions.
3 changes: 2 additions & 1 deletion Dockerfile.local
@@ -1,6 +1,7 @@
 FROM intel/intel-optimized-pytorch:2.3.0-serving-cpu
 WORKDIR /app
-COPY requirements.local.txt /app
+COPY requirements.*.txt /app
+RUN pip install --no-cache-dir -r requirements.base.txt
 RUN pip install --no-cache-dir -r requirements.local.txt
 COPY . /app
 EXPOSE 8000
4 changes: 2 additions & 2 deletions Dockerfile.remote
@@ -1,7 +1,7 @@
 FROM python:3.11-slim-bookworm
 WORKDIR /app
-COPY requirements.remote.txt /app
-RUN pip install --no-cache-dir -r requirements.remote.txt
+COPY requirements.base.txt /app
+RUN pip install --no-cache-dir -r requirements.base.txt
 COPY . /app
 EXPOSE 8000
 ENV NAME "Fact-check API"
4 changes: 4 additions & 0 deletions README.md
@@ -63,6 +63,10 @@ Contexts
 Retrieval
 - [ ] Retrieve the latest info when facts might change
 
+### pipeline
+DSPy:
+- [ ] make dspy.settings apply per session only, in order to support multiple retrieval indexes
+
 ### Toolchain
 - [ ] Evaluate MLOps pipeline
 - https://kitops.ml
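The dspy.settings to-do in the README hunk above is about scoping LM/RM configuration per session instead of mutating global state. A minimal sketch of that direction, assuming DSPy's settings context manager (the model name and retriever argument are placeholders):

import dspy

llm = dspy.OpenAI(model="gpt-4o-mini")  # placeholder model name

def run_with_index(module, statement, retriever):
    # Scope lm/rm to this block only, so concurrent sessions can use
    # different retrieval indexes without touching global settings.
    with dspy.settings.context(lm=llm, rm=retriever):
        return module(statement)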
4 changes: 4 additions & 0 deletions docs/changelog.md
@@ -1,3 +1,7 @@
 ## application
 2024/8/3:
 - Change from AutoGen to plain OpenAI, since AutoGen AssistantAgent adds a system role, which is not compatible with Gemma 2 + vllm.
+
+## pipeline
+2024/8/13:
+- Introduce DSPy to replace the get-verdict step, with multi-step reasoning.
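The AutoGen-to-OpenAI change logged above comes down to sending chat completions with no system message, since Gemma 2 chat templates on vllm reject the system role. A minimal sketch with the plain OpenAI client (endpoint and model name are placeholders):

from openai import OpenAI

# Placeholder endpoint and model; the point is that `messages` carries
# no {"role": "system", ...} entry, which Gemma 2 templates on vllm reject.
client = OpenAI(base_url="http://localhost:8000/v1", api_key="none")
reply = client.chat.completions.create(
    model="google/gemma-2-27b-it",
    messages=[{"role": "user", "content": "Verify: 'The Earth is flat.'"}],
)
print(reply.choices[0].message.content)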
1 change: 1 addition & 0 deletions requirements.remote.txt → requirements.base.txt
@@ -1,4 +1,5 @@
 aiohttp
+dspy-ai
 fastapi
 llama-index
 llama-index-embeddings-ollama
9 changes: 1 addition & 8 deletions requirements.local.txt
@@ -1,8 +1 @@
-aiohttp
-fastapi
-llama-index
-llama-index-embeddings-huggingface
-llama-index-embeddings-ollama
-llama-index-postprocessor-jinaai-rerank
-openai
-uvicorn
+llama-index-embeddings-huggingface
99 changes: 99 additions & 0 deletions src/dspy_modules.py
@@ -0,0 +1,99 @@
import dspy
from dsp.utils import deduplicate

from retrieve import LlamaIndexRM
from settings import settings

llm = dspy.OpenAI(model=settings.LLM_MODEL_NAME, api_base=f"{settings.OPENAI_BASE_URL}/", max_tokens=200, stop='\n\n')
dspy.settings.configure(lm=llm)

class CheckStatementFaithfulness(dspy.Signature):
    """Verify that the statement is based on the provided context."""
    context = dspy.InputField(desc="facts here are assumed to be true")
    statement = dspy.InputField()
    verdict = dspy.OutputField(desc="True/False/Irrelevant indicating if statement is faithful to context")

class GenerateSearchQuery(dspy.Signature):
    """Write a simple search query that will help retrieve info related to the statement."""
    context = dspy.InputField(desc="may contain relevant facts")
    statement = dspy.InputField()
    query = dspy.OutputField()

class GenerateCitedParagraph(dspy.Signature):
    """Generate a paragraph with citations."""
    context = dspy.InputField(desc="may contain relevant facts")
    statement = dspy.InputField()
    verdict = dspy.InputField()
    paragraph = dspy.OutputField(desc="includes citations")

"""
SimplifiedBaleen module
Avoid unnecessary content in this module, because the MIPROv2 optimizer will analyze modules.
Args:
    retrieve: dspy.Retrieve
To-do:
- retrieve the latest facts
- remove some contexts in case the token count reaches the max
- check whether an InputField name other than `answer` is compatible with DSPy evaluate
"""
class ContextVerdict(dspy.Module):
    def __init__(self, retrieve, passages_per_hop=3, max_hops=3):
        super().__init__()
        # One query generator per hop; a single shared dspy.ChainOfThought(GenerateSearchQuery) raised `list index out of range`.
        self.generate_query = [dspy.ChainOfThought(GenerateSearchQuery) for _ in range(max_hops)]
        self.retrieve = retrieve
        self.retrieve.k = passages_per_hop
        self.generate_verdict = dspy.ChainOfThought(CheckStatementFaithfulness)
        self.max_hops = max_hops

    def forward(self, statement):
        context = []
        for hop in range(self.max_hops):
            query = self.generate_query[hop](context=context, statement=statement).query
            passages = self.retrieve(query=query, text_only=True)
            context = deduplicate(context + passages)

        verdict = self.generate_verdict(context=context, statement=statement)
        pred = dspy.Prediction(answer=verdict.verdict, rationale=verdict.rationale, context=context)
        return pred

"""Generate a citation from context and verdict"""
class Citation(dspy.Module):
    def __init__(self):
        super().__init__()
        self.generate_cited_paragraph = dspy.ChainOfThought(GenerateCitedParagraph)

    def forward(self, statement, context, verdict):
        citation = self.generate_cited_paragraph(context=context, statement=statement, verdict=verdict)
        pred = dspy.Prediction(verdict=verdict, citation=citation.paragraph, context=context)
        return pred

"""
Get both verdict and citation.
Args:
    retrieve: dspy.Retrieve
"""
class VerdictCitation:
    def __init__(
        self,
        docs,
    ):
        self.retrieve = LlamaIndexRM(docs=docs)

        # Load the compiled (MIPROv2-optimized) ContextVerdict.
        self.context_verdict = ContextVerdict(retrieve=self.retrieve)
        self.context_verdict.load("./optimizers/verdict_MIPROv2.json")

    def get(self, statement):
        rep = self.context_verdict(statement)
        context = rep.context
        verdict = rep.answer

        rep = Citation()(statement=statement, context=context, verdict=verdict)
        citation = rep.citation

        return verdict, citation
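
For reference, a minimal usage sketch of VerdictCitation, assuming LlamaIndexRM accepts llama-index Document objects (the import path and sample corpus below are assumptions):

from llama_index.core import Document

from dspy_modules import VerdictCitation

# Hypothetical context documents for the statement under check.
docs = [Document(text="Satellite imagery and geodesy show the Earth is an oblate spheroid.")]

verdict, citation = VerdictCitation(docs=docs).get("The Earth is flat.")
print(verdict)   # e.g. "False"
print(citation)  # paragraph citing the supporting context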

113 changes: 0 additions & 113 deletions src/index.py

This file was deleted.
