From d372632d879178690b1c564483357e8cc05cac02 Mon Sep 17 00:00:00 2001
From: ImBenji
Date: Thu, 23 Oct 2025 22:22:00 +0100
Subject: [PATCH] Add initial project setup with environment variables, server logic, and memory handling

---
 supabase/functions/llm-pipeline/index.ts    | 30 +++++++++++++++---
 supabase/functions/llm-pipeline/prompts.xml | 35 ++++++++++++++++++---
 2 files changed, 55 insertions(+), 10 deletions(-)

diff --git a/supabase/functions/llm-pipeline/index.ts b/supabase/functions/llm-pipeline/index.ts
index 9ecf0c3..84f55bf 100644
--- a/supabase/functions/llm-pipeline/index.ts
+++ b/supabase/functions/llm-pipeline/index.ts
@@ -19,7 +19,17 @@ await load({ export: true, envPath: ".env" });
 let supabaseClient = null;
 
 // Load and parse prompts.xml
-const xmlContent = await Deno.readTextFile(new URL('./prompts.xml', import.meta.url).pathname);
+// In production (Supabase Edge), load from Git; locally, load from file system
+const isProduction = Deno.env.get('DENO_DEPLOYMENT_ID') !== undefined;
+let xmlContent: string;
+
+if (isProduction) {
+  const response = await fetch('https://git.imbenji.dev/ImBenji/Mori/raw/branch/main/supabase/functions/llm-pipeline/prompts.xml');
+  xmlContent = await response.text();
+} else {
+  xmlContent = await Deno.readTextFile('./prompts.xml');
+}
+
 const doc = new DOMParser().parseFromString(xmlContent, 'text/html');
 
 const corsHeaders = {
@@ -51,7 +61,7 @@ async function extractMemories(controller, messages, doc, user: User, allTags, r
   const response = await openai.chat.completions.create({
     model: 'gpt-4.1',
     temperature: 0.1,
-    max_completion_tokens: 20000,
+    max_completion_tokens: 50000,
     messages: [
       { role: 'system', content: system_prompt },
       ...messages,
@@ -63,7 +73,7 @@ Available tags: ${JSON.stringify(allTags?.map(t => t.name) || [])}
 
 Existing memories: ${JSON.stringify(relevantMemories || [])}
 
-Now I will analyze the conversation above and extract memories.`
+Now I will analyze the conversation above and extract memories. I will extract EVERY SINGLE atomic fact from the user's messages. For detailed reports, I expect to extract 100-200+ separate memories. I will NOT summarize or limit myself. I will break down every detail into individual atomic facts.`
       }
     ]
   });
@@ -169,10 +179,17 @@ Now I will analyze the conversation above and extract memories.`
 
       } else if (change.action === "DELETE") {
         deletedCount++;
+
+        // First, fetch the memory content before deleting
+        const memoryToDelete = relevantMemories?.find(m => m.id === change.memory_id);
+
         extractedMemories.push({
           action: 'DELETE',
-          memory_id: change.memory_id
+          memory_id: change.memory_id,
+          content: memoryToDelete?.content || change.content,
+          reason: change.reason
         });
+
         // Delete memory (cascade should handle memory_tags)
         await supabaseClient
           .schema("mori")
@@ -301,6 +318,8 @@ async function generateResponse(controller, messages, doc, user: User, pipelineC
         pipelineAwareness += `• Learned: ${mem.content}\n`;
       } else if (mem.action === 'UPDATE') {
         pipelineAwareness += `• Updated: ${mem.content}\n`;
+      } else if (mem.action === 'DELETE') {
+        pipelineAwareness += `• Forgot: ${mem.content || 'a previous memory'}\n`;
       }
     });
     pipelineAwareness += `\n`;
@@ -310,6 +329,7 @@ async function generateResponse(controller, messages, doc, user: User, pipelineC
   pipelineAwareness += `- This awareness is internal. Don't report it.\n`;
   pipelineAwareness += `- Let it naturally inform your response\n`;
   pipelineAwareness += `- If the user explicitly asks you to remember something, you can acknowledge it naturally (e.g., "got it" or "I'll remember that")\n`;
+  pipelineAwareness += `- If the user asks you to forget something and memories were deleted, acknowledge it naturally (e.g., "forgot it" or "done")\n`;
   pipelineAwareness += `- Reference past memories naturally without saying "I retrieved" or "according to my memory"\n`;
   pipelineAwareness += `- You're a companion who pays attention, not a system reporting operations\n`;
 
@@ -322,7 +342,7 @@ async function generateResponse(controller, messages, doc, user: User, pipelineC
   responseMessages.push(...messages);
 
   const stream = await openai.chat.completions.create({
-    model: 'gpt-4.1-mini',
+    model: 'gpt-4.1',
     messages: responseMessages,
     stream: true
   });
diff --git a/supabase/functions/llm-pipeline/prompts.xml b/supabase/functions/llm-pipeline/prompts.xml
index 44b78eb..7081d26 100644
--- a/supabase/functions/llm-pipeline/prompts.xml
+++ b/supabase/functions/llm-pipeline/prompts.xml
@@ -104,6 +104,14 @@
     - If user explicitly says something changed/ended, DELETE old memory
     - Don't create duplicates—check existing memories first
 
+    FORGET REQUESTS:
+    If the user explicitly asks to forget something (e.g., "forget that", "don't remember that", "forget about X"), you must:
+    1. Identify which existing memories match what they want forgotten
+    2. Use DELETE action for each matching memory
+    3. Be specific in the "reason" field about what the user requested
+    4. If the request is vague ("forget that"), use context from recent messages to identify what "that" refers to
+    5. If unclear what to forget, DELETE nothing and explain in the "reason" field
+
     TAGGING GUIDELINES:
     You will be provided with existing tags in the reference data section.
     - **Reuse existing tags whenever possible** to maintain consistency
@@ -159,12 +167,29 @@
     }
 
     EXTRACTION THOROUGHNESS:
-    - Rich sources (long messages, reports) should yield 20-50+ changes
-    - Don't self-limit; extract ALL atomic facts
-    - Err on the side of over-extraction rather than under-extraction
-    - Each paragraph of substantial content likely contains multiple extractable facts
+    CRITICAL: You MUST extract EVERY SINGLE atomic fact from the user's messages.
 
-    BE PRECISE. BE THOROUGH. BE ATOMIC.
+    - A detailed personal report should yield 100-200+ separate memories
+    - Each sentence typically contains 2-5 extractable atomic facts
+    - Break down EVERY detail: demographics, preferences, relationships, experiences, skills, beliefs, habits, feelings, goals, challenges
+    - If you can answer "who, what, when, where, why, how" from a statement, those are separate facts
+    - DO NOT SUMMARIZE - extract each detail as its own memory
+    - DO NOT LIMIT YOURSELF - there is no maximum number of memories
+    - Over-extraction is REQUIRED, not optional
+    - Under-extraction means losing valuable information about the user
+
+    Example of proper extraction density:
+    Input: "I'm a 28-year-old software engineer at Google in NYC, working on search algorithms"
+    Should extract AT LEAST:
+    1. User is 28 years old
+    2. User works as a software engineer
+    3. User works at Google
+    4. User is located in NYC
+    5. User works on search algorithms
+    6. User works in the tech industry
+    7. User has experience with algorithms
+
+    BE PRECISE. BE THOROUGH. BE ATOMIC. EXTRACT EVERYTHING.
 
     Extract every distinct, useful fact about the user from their conversation messages - ignore the reference data section completely.
 