From 8d0a74e8657d25dd6f1c36d9b6ee400103b616f0 Mon Sep 17 00:00:00 2001
From: Jake Pullen
Date: Sun, 8 Feb 2026 15:09:39 +0000
Subject: [PATCH] just sync

---
 TODO                     |   4 --
 justfile                 |   2 +
 src/experts/dnd_agent.py | 108 ++++++++++++++++-----------------------
 src/retrieve.py          |   5 +-
 4 files changed, 48 insertions(+), 71 deletions(-)

diff --git a/TODO b/TODO
index 5525a87..8dc84f1 100644
--- a/TODO
+++ b/TODO
@@ -8,7 +8,3 @@ Is RAG still the "thing"?
 - What is the cutting edge
 Too little context and the llm doesnt have enough info to give an accurate answer
 Too much conflicting context (poison) too much context (confusion)
-
-Turso - better? vector store, but sqlite so data <3
-
-How can we RaG in AW?
diff --git a/justfile b/justfile
index 5b0ca43..4573861 100644
--- a/justfile
+++ b/justfile
@@ -4,3 +4,5 @@ git-sync:
     git add .
     git commit -m 'just sync'
     git push
+
+sync-git: git-sync
\ No newline at end of file
diff --git a/src/experts/dnd_agent.py b/src/experts/dnd_agent.py
index d312c29..63cd55a 100644
--- a/src/experts/dnd_agent.py
+++ b/src/experts/dnd_agent.py
@@ -1,7 +1,7 @@
-from pathlib import Path
-
+# from pathlib import Path
+import turso
 import dspy
-from langchain_community.vectorstores import FAISS
+# from langchain_community.vectorstores import FAISS
 
 from config_loader import load_config
 from embedding import LocalLMEmbeddings
@@ -12,93 +12,73 @@ DATABASE_PATH = CFG["ingestion"]["db_path"]
 EMBEDDING_MODEL = CFG["models"]["embedding"]
 API_BASE = CFG["api"]["base_url"]
 
-import turso
-
 # Inside your retrieval logic:
-def retrieve_from_turso(question, k=5):
+def retrieve_from_turso(embedded_question, k=5):
     # Example query: search for relevant notes using full-text search or embedding similarity
     # Note: Turso supports SQLite, so you can use FTS5 or a vector extension if available
     query = f"""
-    SELECT source, synopsis, tags, entities, content, embedding
+    SELECT file_path, synopsis, tags, entities, chunk_data,
+           vector_distance_cos(embedding, vector32('{embedded_question[0]}')) AS distance
     FROM notes
-    WHERE content LIKE ? OR synopsis LIKE ?
-    ORDER BY (similarity(embedding, ?)) DESC
-    LIMIT {k}
+    ORDER BY distance ASC
+    LIMIT {k};
     """
-    # You'll need to generate or store embeddings in the DB or use a function to compute similarity
-    # If embeddings are stored, you can query them directly
-    # Otherwise, you'll need to compute embeddings in Python and compare
-    results = turso.execute(query, (f"%{question}%", f"%{question}%", question))
-    return results
+    con = turso.connect(DATABASE_PATH)
+    cur = con.cursor()
+    cur.execute(query)
+    rows = cur.fetchall()
+    return rows
 
 
 # --- DSPy Signature ---
 class DnDContextQA(dspy.Signature):
-    """Answer DnD campaign questions using provided snippets and full file context.
-    /no_think
+    """Answer DnD campaign questions using provided details.
     """
 
     context = dspy.InputField(
-        desc="Relevant chunks and full file contents from the campaign notes."
+        desc="Relevant chunks and metadata from the campaign notes."
     )
     question = dspy.InputField()
     answer = dspy.OutputField(desc="A detailed answer based on the notes, citing the source file.")
 
 
-# --- DSPy Module ---
 class DnDRAG(dspy.Module):
-    def __init__(self, db_path=DATABASE_PATH, k=3):
+    def __init__(self):
         super().__init__()
-        # 1. Setup Embeddings & Load FAISS
-        self.embeddings = LocalLMEmbeddings(model=EMBEDDING_MODEL, base_url=API_BASE)
-        self.vectorstore = FAISS.load_local(
-            db_path, self.embeddings, allow_dangerous_deserialization=True
-        )
-        self.k = k
-
-        # 2. Setup the Predictor (Chain of Thought for better reasoning)
+        self.embeddings_model = LocalLMEmbeddings(
+            model=EMBEDDING_MODEL,
+            base_url=API_BASE,
+            batch_size=1,  # we only send 1 question at a time.
+        )
         self.generate_answer = dspy.ChainOfThought(DnDContextQA)
 
-    def get_full_file_content(self, file_path):
-        """Helper to read the full source file if it exists."""
-        try:
-            return Path(file_path).read_text(encoding="utf-8")
-        except Exception:
-            return ""
-
     def forward(self, question):
-        # 1. Search for top-k chunks
-        results = self.vectorstore.similarity_search(question, k=self.k)
-
-        # 2. Extract unique file paths to load "Full Context"
-        # This prevents the LLM from being 'blind' to the rest of a relevant session note
-        unique_paths = list(set([doc.metadata.get("full_path") for doc in results]))
+        # Use Turso to retrieve relevant notes
+        embedded_question = self.embeddings_model._post_request(question)
+        results = retrieve_from_turso(embedded_question, k=5)  # k is limit to return
 
+        # Format context as before
         context_parts = []
-        for i, doc in enumerate(results):
-            source = doc.metadata.get("source", "Unknown")
-            synopsis = doc.metadata.get("synopsis", "None")
-            tags = doc.metadata.get("tags", "None")
-            entities = doc.metadata.get("entities", "None")
+        for i, row in enumerate(results):
+            source = row[0]    # file_path
+            synopsis = row[1]  # synopsis
+            tags = row[2]      # tags
+            entities = row[3]  # entities
+            content = row[4]   # chunk_data
+
             context_parts.append(f"""
 --- Chunk {i+1} from {source} ---
-synpsis: {synopsis},
-tags: {tags},
+synopsis: {synopsis},
+tags: {tags},
 entities: {entities}
-{doc.page_content}
+{content}
 """)
-            #print(context_parts)
+
+        print('Closest embedding hits')
+        for part in context_parts:
+            print(part)
+
+        context = "\n\n".join(context_parts)
 
-        # 3. Add the Full Content of the top match (optional, but requested!)
-        # We'll just take the top 1 file to avoid context window explosion
-        if unique_paths:
-            top_file_content = self.get_full_file_content(unique_paths[0])
-            context_parts.append(
-                f"\n=== FULL SOURCE FILE: {Path(unique_paths[0]).name} ===\n{top_file_content[:10000]}"
-            )
-
-        # 4. Join everything into one context string
-        context_str = "\n\n".join(context_parts)
-
-        # 5. Generate Response
-        prediction = self.generate_answer(context=context_str, question=question)
-        return dspy.Prediction(answer=prediction.answer, context=context_str)
+        prediction = self.generate_answer(context=context, question=question)
+        return dspy.Prediction(answer=prediction.answer, context=context)
diff --git a/src/retrieve.py b/src/retrieve.py
index f9cbd79..f7cc2af 100644
--- a/src/retrieve.py
+++ b/src/retrieve.py
@@ -1,6 +1,6 @@
 import sys
-
 import dspy
+# import turso
 
 from config_loader import load_config
 from experts.dnd_agent import DnDRAG
@@ -10,7 +10,6 @@ RETRIEVE_MODEL = CFG["models"]["retrieval"]
 API_BASE = CFG["api"]["base_url"]
 API_VERSION = CFG["api"]["api_version"]
 
-
 def main():
     # 1. Setup the LLM
     print("🚀 Initializing Qwen-8B via LM Studio...")
@@ -18,7 +17,7 @@ def main():
     dspy.configure(lm=lm)
 
     # 2. Load the RAG System (only happens once!)
-    print("📚 Loading FAISS index and campaign notes...")
+    print("📚 Loading campaign notes...")
     try:
         rag_system = DnDRAG()
         print("✅ Ready! Ask me anything about the campaign. (Type 'exit' or 'q' to quit)")
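
For reference, the new retrieve_from_turso builds its SQL with an f-string, splicing the
embedding (and k) straight into the query text. Below is a minimal sketch of a parameterised
variant. It assumes the turso Python client accepts DB-API-style '?' placeholders, that
libSQL's vector32() accepts a JSON-style text vector as a bound argument, and that the
connection object exposes close(); none of these is verified by the patch, and the names
retrieve_from_turso_bound and vec_text are illustrative, not part of it.

    import json

    import turso

    def retrieve_from_turso_bound(embedding, db_path, k=5):
        """Top-k chunks by cosine distance, binding the vector instead of splicing it in."""
        # vector32() parses a JSON-style text literal such as '[0.1, 0.2, ...]';
        # json.dumps produces exactly that form from a Python list of floats.
        vec_text = json.dumps(list(embedding))
        query = """
            SELECT file_path, synopsis, tags, entities, chunk_data,
                   vector_distance_cos(embedding, vector32(?)) AS distance
            FROM notes
            ORDER BY distance ASC
            LIMIT ?;
        """
        con = turso.connect(db_path)
        try:
            cur = con.cursor()
            cur.execute(query, (vec_text, k))  # assumes '?' parameter binding is supported
            return cur.fetchall()
        finally:
            con.close()  # assumed close(); the patched helper leaves its connection open

A call like retrieve_from_turso_bound(embedded_question[0], DATABASE_PATH, k=5) would slot
into DnDRAG.forward in place of the current helper, keeping the same row layout
(file_path, synopsis, tags, entities, chunk_data, distance).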