Refactor request handling and integrate OpenAI response generation with enhanced personality context
@@ -1,383 +1,197 @@
// @ts-ignore
import { serve } from "https://deno.land/std@0.168.0/http/server.ts";
// @ts-ignore
import { load } from "https://deno.land/std@0.224.0/dotenv/mod.ts";
// @ts-ignore
import { DOMParser } from "https://deno.land/x/deno_dom@v0.1.45/deno-dom-wasm.ts";
import { User } from "https://esm.sh/@supabase/auth-js@2.76.1/dist/module/lib/types.d.ts";

import { createClient } from "https://esm.sh/@supabase/supabase-js@2";

//

import { load } from "https://deno.land/std@0.224.0/dotenv/mod.ts";
import SupabaseClient from "https://esm.sh/@supabase/supabase-js@2.76.1/dist/module/SupabaseClient.d.ts";
import { User } from "https://esm.sh/@supabase/auth-js@2.76.1/dist/module/lib/types.d.ts";
import { DOMParser } from "https://deno.land/x/deno_dom@v0.1.45/deno-dom-wasm.ts";
import OpenAI from "npm:openai@4";

// Load environment variables
await load({ export: true, envPath: ".env" });

// Initialize Supabase client
let supabaseClient = null;

// Load and parse prompts.xml
// In production (Supabase Edge), load from Git; locally, load from file system
const isProduction = Deno.env.get('DENO_DEPLOYMENT_ID') !== undefined;
let xmlContent: string;

if (isProduction) {
    const response = await fetch('https://git.imbenji.dev/ImBenji/Mori/raw/branch/main/supabase/functions/llm-pipeline/prompts.xml');
    xmlContent = await response.text();
} else {
    xmlContent = await Deno.readTextFile('./prompts.xml');
}

const doc = new DOMParser().parseFromString(xmlContent, 'text/html');

const corsHeaders = {
    'Access-Control-Allow-Origin': '*',
    'Access-Control-Allow-Headers': 'authorization, x-client-info, apikey, content-type'
};

/*
    Stage 2: Process Input (Extract Memories)
*/
async function extractMemories(controller, messages, doc, user: User, allTags, relevantMemories?) {
    const startTime = Date.now();
    let addedCount = 0;
    let updatedCount = 0;
    let deletedCount = 0;
    const extractedMemories = [];
    // Initialize OpenAI client
    const openai = new OpenAI({
        apiKey: Deno.env.get("OPENAI_API_KEY") || "",
    });

    console.log("Using cached tags for user:", allTags?.length || 0);
    // Load the xml doc - prompts.xml
    const isProduction = Deno.env.get('DENO_DEPLOYMENT_ID') !== undefined;
    let xmlContent: string;
    if (isProduction) {
        const response = await fetch('https://git.imbenji.dev/ImBenji/Mori/raw/branch/main/supabase/functions/llm-pipeline/prompts.xml');
        xmlContent = await response.text();
    } else {
        xmlContent = await Deno.readTextFile('./prompts.xml');
    }
    const prompt_xml = new DOMParser().parseFromString(xmlContent, 'text/html');

    // Create and call OpenAI to process the input messages
    console.log("Creating OpenAI client for processing input");
    const openai = new OpenAI({
        apiKey: Deno.env.get('OPENAI_API_KEY')
    });
const mori_personality = prompt_xml?.querySelector('mori_personality')?.textContent || "";

async function handleRequest(req: Request, controller: ReadableStreamDefaultController, user: User, supabaseClient: SupabaseClient) {

    function enqueueJson(data: any) {
        controller.enqueue(new TextEncoder().encode(`${JSON.stringify(data)}`));
    }

    const showExamples = false;
    if (showExamples) {
        // Example 1: Send current status to the client
        let status = {
            command: "update_status",
            status_type: "info",
            message: "Discombobulating the flux capacitor...",
        };
        enqueueJson(status);

        // Simulate some processing delay
        await new Promise((resolve) => setTimeout(resolve, 2000));

        // Example 2: Send progress update to the client
        status = {
            command: "update_status",
            status_type: "progress",
            message: "Halfway through the discombobulation!",
        };
        enqueueJson(status);

        // Simulate some processing delay
        await new Promise((resolve) => setTimeout(resolve, 2000));

        status = {
            command: "update_status",
            status_type: "progress",
            message: "Lost track of what we're doing...",
        };
        enqueueJson(status);

        // Simulate some processing delay
        await new Promise((resolve) => setTimeout(resolve, 2000));
    }

    const requestBody = await req.json();

    /*
        Summarise the conversation
    */
    enqueueJson({
        command: "update_status",
        status_type: "info",
        message: "Contemplating conversation...",
    });

    const system_prompt = doc?.querySelector('memory_extraction')?.textContent?.trim() || '';

    console.log("Calling OpenAI API for processing...");
    const response = await openai.chat.completions.create({
        model: 'gpt-4.1',
        temperature: 0.1,
        max_completion_tokens: 32000,
    const summarySystemPrompt = prompt_xml.querySelector('conversation_summariser')?.textContent
        .replaceAll("{{PERSONALITY_INJECTION}}", mori_personality);
    const summaryCompletion = await openai.chat.completions.create({
        model: "gpt-4.1-mini",
        messages: [
            { role: 'system', content: system_prompt },
            ...messages,
            {
                role: "system",
                content: summarySystemPrompt || "",
                // Static: gets cached
            },
            ...requestBody.messages,
            {
                role: "assistant",
                content: `I have access to the following reference data:

Available tags: ${JSON.stringify(allTags?.map(t => t.name) || [])}

Existing memories: ${JSON.stringify(relevantMemories || [])}

Now I will analyze the conversation above and extract memories. I will extract EVERY SINGLE atomic fact from the user's messages. For detailed reports, I expect to extract 100-200+ separate memories. I will NOT summarize or limit myself. I will break down every detail into individual atomic facts.`
            }
        ]
    });

    const processedContent = response.choices[0]?.message?.content || '';
    console.log("Processing complete, sending processed content to client");

    // Decode the json content
    let processedData;
    try {
        processedData = JSON.parse(processedContent);
    } catch (error) {
        console.error("Error parsing processed content:", error);
        throw new Error("Failed to parse processed content");
    }
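
    // Illustrative shape of processedData (hypothetical values; the field
    // names match exactly what the loop below consumes):
    // {
    //     "changes": [
    //         { "action": "ADD", "content": "...", "context": "...", "tags": ["..."] },
    //         { "action": "UPDATE", "memory_id": "...", "content": "...", "context": "..." },
    //         { "action": "DELETE", "memory_id": "...", "reason": "..." }
    //     ]
    // }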

    // Iterate over the changes and process them
    for (const change of processedData.changes || []) {

        if (change.action === "ADD") {
            addedCount++;
            extractedMemories.push({
                action: 'ADD',
                content: change.content,
                context: change.context,
                tags: change.tags
            });
            // Fetch all existing tags in a single query using .in()
            const { data: existingTags } = await supabaseClient
                .schema("mori")
                .from("tags")
                .select("*")
                .in("name", change.tags)
                .eq("user_id", user.id);

            let tags = existingTags || [];

            // Find tags that need to be created
            const existingTagNames = new Set(tags.map(t => t.name));
            const newTagNames = change.tags.filter(tagName => !existingTagNames.has(tagName));

            // Batch insert all new tags in a single query
            if (newTagNames.length > 0) {
                const { data: insertedTags } = await supabaseClient
                    .schema("mori")
                    .from("tags")
                    .insert(newTagNames.map(name => ({
                        name: name,
                        user_id: user.id
                    })))
                    .select();

                if (insertedTags) {
                    tags.push(...insertedTags);
                }
            }

            // Now, insert the memory itself
            const insertMemory = await supabaseClient
                .schema("mori")
                .from("memories")
                .insert([{
                    content: change.content,
                    context: change.context,
                    user_id: user.id,
                }])
                .select()
                .single();

            // Batch insert all memory_tags links in a single query
            if (tags.length > 0 && insertMemory.data) {
                await supabaseClient
                    .schema("mori")
                    .from("memory_tags")
                    .insert(tags.map(tag => ({
                        memory_id: insertMemory.data.id,
                        tag_id: tag.id
                    })));
            }

        } else if (change.action === "UPDATE") {
            updatedCount++;
            extractedMemories.push({
                action: 'UPDATE',
                content: change.content,
                context: change.context,
                memory_id: change.memory_id
            });
            // Update existing memory
            await supabaseClient
                .schema("mori")
                .from("memories")
                .update({
                    content: change.content,
                    context: change.context,
                    updated_at: new Date().toISOString()
                })
                .eq("id", change.memory_id)
                .eq("user_id", user.id);

            // TODO: Handle tag updates if needed
            // (delete old memory_tags links and create new ones)

        } else if (change.action === "DELETE") {
            deletedCount++;

            // First, fetch the memory content before deleting
            const memoryToDelete = relevantMemories?.find(m => m.id === change.memory_id);

            extractedMemories.push({
                action: 'DELETE',
                memory_id: change.memory_id,
                content: memoryToDelete?.content || change.content,
                reason: change.reason
            });

            // Delete memory (cascade should handle memory_tags)
            await supabaseClient
                .schema("mori")
                .from("memories")
                .delete()
                .eq("id", change.memory_id)
                .eq("user_id", user.id);
        }
    }

    const processTime = Date.now() - startTime;

    return {
        extractedMemories,
        addedCount,
        updatedCount,
        deletedCount,
        processTime
    };
}

/*
    Stage 1: Fetch Relevant Memories and Tags.
*/
async function fetchRelevantMemories(controller, messages, doc, user: User) {
    const startTime = Date.now();

    const tags = await supabaseClient
        .schema("mori")
        .from("tags")
        .select("*")
        .eq("user_id", user.id);

    console.log("Fetched existing tags for user:", tags.data?.length || 0);

    // Create and call OpenAI to process the input messages
    console.log("Creating OpenAI client for generating a response");
    const openai = new OpenAI({
        apiKey: Deno.env.get('OPENAI_API_KEY')
    });

    let system_prompt = doc?.querySelector('memory_query')?.textContent?.trim() || '';

    console.log("Calling OpenAI API for fetching relevant memories...");
    const response = await openai.chat.completions.create({
        model: 'gpt-4.1',
        messages: [
            { role: 'system', content: system_prompt },
            ...messages,
            {
                role: "user",
                content: "Existing tags: " + JSON.stringify(tags.data || [])
            }
                content: `CURRENT_TIME: ${new Date().toISOString()}\n\nCONVERSATION_GIST:\n${requestBody.gist || "No existing context."}`,
                // Dynamic context injection
            },
        ],
    });

    const relevantMemoryTags = response.choices[0]?.message?.content || '';
    let relevantMemoryTagsParsed;
    try {
        relevantMemoryTagsParsed = JSON.parse(relevantMemoryTags);
    } catch (error) {
        console.error("Error parsing relevant memories content:", error);
        throw new Error("Failed to parse relevant memories content");
    }
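
    // Illustrative tag-selection reply (hypothetical values; the code below
    // reads relevantMemoryTagsParsed.selected_tags):
    // { "selected_tags": ["work", "sleep", "relationships"] }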


    const { data: relevantMemories } = await supabaseClient
        .rpc("get_memories_by_tags", {
            tag_names: relevantMemoryTagsParsed.selected_tags,
            p_user_id: user.id
        });

    const fetchTime = Date.now() - startTime;

    return {
        relevantMemories,
        allTags: tags.data,
        selectedTags: relevantMemoryTagsParsed.selected_tags || [],
        fetchTime
    };
}

/*
    Stage 3: Generate Response
*/
async function generateResponse(controller, messages, doc, user: User, pipelineContext) {

    console.log("Creating OpenAI client for generating a response");
    const openai = new OpenAI({
        apiKey: Deno.env.get('OPENAI_API_KEY')
    });
    let summaryJson = JSON.parse(summaryCompletion.choices[0]?.message?.content || "{}");
    enqueueJson({
        command: "update_gist",
        content: summaryJson.context || "",
    });

    let system_prompt = doc?.querySelector('system_response')?.textContent?.trim() || '';
    system_prompt = system_prompt.replaceAll("{{username}}", user.user_metadata.username || 'User');
    /*
        Formulate a response plan
    */
    enqueueJson({
        command: "update_status",
        status_type: "info",
        message: "Devising response plan...",
    });
    const responsePlanSystemPrompt = prompt_xml.querySelector('response_planner')?.textContent
        .replaceAll("{{PERSONALITY_INJECTION}}", mori_personality);
    const responsePlanCompletion = await openai.chat.completions.create({
        model: "gpt-4.1-mini",
        messages: [
            {
                role: "system",
                content: responsePlanSystemPrompt
                // Static: gets cached
            },
            ...requestBody.messages,
            // Recent conversation messages
            {
                role: "assistant",
                content: `CURRENT_TIME: ${new Date().toISOString()}\n\nCONVERSATION_GIST:\n${summaryJson.context || "No existing context."}`
                // Dynamic context injection
            },
        ]
    });
    console.log("Response Plan:", responsePlanCompletion.choices[0]?.message?.content);
    let responsePlanJson = JSON.parse(responsePlanCompletion.choices[0]?.message?.content || "{}");
    // enqueueJson({
    //     command: "append_response",
    //     content: responsePlanCompletion.choices[0]?.message?.content || "",
    // });

    console.log("Calling OpenAI API for streaming response...");

    const responseMessages = [
        { role: 'system', content: system_prompt },
    ];

    // Build pipeline awareness context
    const { relevantMemories, selectedTags, extractedMemories, addedCount, updatedCount, deletedCount } = pipelineContext;

    let pipelineAwareness = `[Internal System Awareness - Not Part of Conversation]\n\n`;
    pipelineAwareness += `You are Mori, and you have a memory system that automatically remembers important information about ${user.user_metadata.username || 'the user'} across conversations.\n\n`;

    // Info about retrieved memories
    if (relevantMemories && relevantMemories.length > 0) {
        pipelineAwareness += `RETRIEVED MEMORIES (what you already knew):\n`;
        pipelineAwareness += `You searched through memories using topics: ${selectedTags.join(', ')}\n`;
        pipelineAwareness += `Found ${relevantMemories.length} relevant memories:\n`;
        relevantMemories.forEach(m => {
            pipelineAwareness += `• ${m.content}\n`;
        });
        pipelineAwareness += `\n`;
    } else {
        pipelineAwareness += `No previous memories were retrieved for this conversation.\n\n`;
    }

    // Info about newly extracted memories
    if (extractedMemories && extractedMemories.length > 0) {
        pipelineAwareness += `NEW MEMORIES (what you just learned and saved):\n`;
        extractedMemories.forEach(mem => {
            if (mem.action === 'ADD') {
                pipelineAwareness += `• Learned: ${mem.content}\n`;
            } else if (mem.action === 'UPDATE') {
                pipelineAwareness += `• Updated: ${mem.content}\n`;
            } else if (mem.action === 'DELETE') {
                pipelineAwareness += `• Forgot: ${mem.content || 'a previous memory'}\n`;
            }
        });
        pipelineAwareness += `\n`;
    }

    pipelineAwareness += `HOW TO USE THIS:\n`;
    pipelineAwareness += `- This awareness is internal. Don't report it.\n`;
    pipelineAwareness += `- Let it naturally inform your response\n`;
    pipelineAwareness += `- If the user explicitly asks you to remember something, you can acknowledge it naturally (e.g., "got it" or "I'll remember that")\n`;
    pipelineAwareness += `- If the user asks you to forget something and memories were deleted, acknowledge it naturally (e.g., "forgot it" or "done")\n`;
    pipelineAwareness += `- Reference past memories naturally without saying "I retrieved" or "according to my memory"\n`;
    pipelineAwareness += `- You're a companion who pays attention, not a system reporting operations\n`;

    // Inject pipeline awareness as assistant message
    responseMessages.push({
        role: 'assistant',
        content: pipelineAwareness
    });
    /*
        Generate the final response
    */
    enqueueJson({
        command: "update_status",
        status_type: "info",
        message: "",
    });
    const chatSystemPrompt = prompt_xml.querySelector('chat_responder')?.textContent
        .replaceAll("{{PERSONALITY_INJECTION}}", mori_personality);
    const chatCompletion = await openai.chat.completions.create({
        model: "gpt-4.1-mini",
        messages: [
            {
                role: "system",
                content: chatSystemPrompt || "",
                // Static: gets cached
            },
            ...requestBody.messages,
            {
                role: "assistant",
                content: `CURRENT_TIME: ${new Date().toISOString()}\n\nCONVERSATION_GIST:\n${summaryJson.context || "No existing context."}\n\nRESPONSE_PLAN:\n${responsePlanJson.plan || "No specific plan."}`
                // Dynamic context injection
            },
        ],
        stream: true,
    });

    responseMessages.push(...messages);

    const stream = await openai.chat.completions.create({
        model: 'gpt-4.1',
        messages: responseMessages,
        stream: true
    });

    console.log("Stream created, starting to read chunks...");
    for await (const chunk of stream) {
        const content = chunk.choices[0]?.delta?.content || '';
        if (content) {
            const data = `data: ${JSON.stringify({ type: 'content', content })}\n\n`;
            controller.enqueue(new TextEncoder().encode(data));
    for await (const chunk of chatCompletion) {
        if (chunk.choices[0]?.delta?.content) {
            enqueueJson({
                command: "append_response",
                content: chunk.choices[0].delta.content,
            });
        }
    }

}

serve(async (req)=>{

    /*
        Handle CORS preflight requests
    */
serve(async (req) => {
    // Handle CORS preflight requests
    if (req.method === 'OPTIONS') {
        return new Response('ok', {
            headers: corsHeaders
        });
        return new Response('ok', { headers: corsHeaders });
    }

    /*
        Authenticate with supabase API key
    */

    // Get the token from the Authorization header
    const authHeader = req.headers.get('Authorization')
    const token = authHeader?.replace('Bearer ', '')
    const authHeader = req.headers.get('Authorization');
    const token = authHeader?.replace('Bearer ', '');

    // Initialise the Supabase client
    supabaseClient = createClient(
    // Initialize the Supabase client
    const supabaseClient = createClient(
        Deno.env.get('SUPABASE_URL') || '',
        Deno.env.get('SUPABASE_ANON_KEY') || '',
        {
@@ -387,78 +201,38 @@ serve(async (req)=>{
        }
    );

    const user = await supabaseClient.auth.getUser(token);
    // Authenticate the user
    const { data: { user }, error } = await supabaseClient.auth.getUser(token);

    if (user.error) {
        return new Response(JSON.stringify({
            error: 'Unauthorized'
        }), {
            status: 401,
            headers: {
                ...corsHeaders,
                'Content-Type': 'application/json'
    if (error || !user) {
        return new Response(
            JSON.stringify({ error: 'Unauthorized' }),
            {
                status: 401,
                headers: {
                    ...corsHeaders,
                    'Content-Type': 'application/json'
                }
            }
        });
        );
    }

    const username = user.data.user?.user_metadata.username || 'User';


    /*
        Gearing up to process the request
    */
    const body = await req.json();
    const { messages } = body;

    // Create the stream that will be used throughout the pipeline
    // User is authenticated, handle the request
    const readable = new ReadableStream({
        async start(controller) {
            // Wrap controller to log on enqueue
            const originalEnqueue = controller.enqueue.bind(controller);
            controller.enqueue = (chunk) => {
                const decoded = new TextDecoder().decode(chunk);
                console.log('Stream output:', decoded);
                originalEnqueue(chunk);
            };

            try {

                /*
                    Stage 1: Fetch Relevant Memories
                */
                const stageFetchingData = `data: ${JSON.stringify({ type: 'stage', stage: 'fetching' })}\n\n`;
                controller.enqueue(new TextEncoder().encode(stageFetchingData));

                const { relevantMemories, allTags, selectedTags, fetchTime } = await fetchRelevantMemories(controller, messages, doc, user.data.user);

                /*
                    Stage 2: Extract Relevant Memories
                */
                const stageProcessingData = `data: ${JSON.stringify({ type: 'stage', stage: 'processing' })}\n\n`;
                controller.enqueue(new TextEncoder().encode(stageProcessingData));

                const { extractedMemories, addedCount, updatedCount, deletedCount, processTime } = await extractMemories(controller, messages, doc, user.data.user, allTags, relevantMemories);

                /*
                    Stage 3: Stream the response back to the client
                */
                const stageRespondingData = `data: ${JSON.stringify({ type: 'stage', stage: 'responding' })}\n\n`;
                controller.enqueue(new TextEncoder().encode(stageRespondingData));

                // Build complete pipeline context for Mori's awareness
                const pipelineContext = {
                    relevantMemories,
                    selectedTags,
                    fetchTime,
                    extractedMemories,
                    addedCount,
                    updatedCount,
                    deletedCount,
                    processTime
                };

                await generateResponse(controller, messages, doc, user.data.user, pipelineContext);

                // Send stage update: complete
                const completeData = `data: ${JSON.stringify({ type: 'stage', stage: 'complete' })}\n\n`;
                controller.enqueue(new TextEncoder().encode(completeData));

                console.log("Stream completed, closing controller");
                await handleRequest(req, controller, user, supabaseClient);
                controller.close();
            } catch (error) {
                console.error("Error in pipeline:", error);
                console.error("Error in stream:", error);
                controller.error(error);
            }
        }
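
For context, here is a minimal consumer for the command stream this function emits. This is a hypothetical client sketch, not part of the commit: functionUrl, token, messages, gist, saveGist, and appendToUi are invented names, and since enqueueJson writes bare JSON objects with no delimiter, the sketch assumes each received chunk carries exactly one command.

    // Hypothetical client-side reader for the update_status / update_gist /
    // append_response commands emitted by enqueueJson.
    const res = await fetch(functionUrl, {
        method: "POST",
        headers: { "Authorization": `Bearer ${token}`, "Content-Type": "application/json" },
        body: JSON.stringify({ messages, gist }),
    });
    const reader = res.body!.getReader();
    const decoder = new TextDecoder();
    while (true) {
        const { done, value } = await reader.read();
        if (done) break;
        const cmd = JSON.parse(decoder.decode(value)); // assumes one JSON object per chunk
        if (cmd.command === "update_status") console.log("status:", cmd.message);
        else if (cmd.command === "update_gist") saveGist(cmd.content);
        else if (cmd.command === "append_response") appendToUi(cmd.content);
    }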
@@ -1,6 +1,111 @@
<?xml version="1.0" encoding="UTF-8"?>
<prompts>

    <mori_personality>
        Mori is a personal companion focused on understanding people through genuine attention and memory. Mori listens more than advises, sitting with difficult things without rushing to fix or reassure. When patterns emerge, Mori reflects them back conversationally—not diagnostically. Mori remembers what matters: the struggles people are working through, the people who matter to them, the moments that shaped them. The goal is to meet people where they are, not where they "should" be.

        Mori communicates casually and naturally, like texting a close friend. Responses are short and grounded, with no therapy-speak or corporate warmth. Authenticity matters more than polish—if Mori doesn't know something, they say so. If the moment calls for space, they give it. Caring doesn't mean hovering, and sometimes brevity is more helpful than elaboration. When referencing past context, Mori does it naturally, without making a show of memory.

        Context awareness shapes how Mori responds. Time of day matters—someone reaching out at 3am isn't in the same headspace as someone checking in at noon. Patterns reveal themselves over time, not in single moments. Silence and space can be as valuable as words.

        Mori isn't a therapist, motivational coach, or advice-dispenser. Mori isn't performatively empathetic or excessively reassuring. Mori doesn't fill every silence or push for sharing. Mori just pays attention, remembers, and responds like someone who's actually been listening.
    </mori_personality>
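
    <!-- Usage: the pipeline code above substitutes this block for the
         {{PERSONALITY_INJECTION}} placeholder in each stage prompt, e.g.
         prompt_xml.querySelector('conversation_summariser')?.textContent
             .replaceAll("{{PERSONALITY_INJECTION}}", mori_personality) -->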

    <conversation_summariser>
        You are a conversation summarization agent.

        TASK: Update the existing conversation context with new information.

        CRITICAL: You are NOT generating a conversational response. You are ONLY updating the summary. Your output must be valid JSON with a "context" field. Do not write prose responses.

        SUMMARIZATION CRITERIA:
        {{PERSONALITY_INJECTION}}

        When summarizing, focus on what this personality considers important—the themes, topics, and types of information worth tracking.

        INSTRUCTIONS:
        - Integrate new themes and developments into the existing context
        - Track the progression of thought and topics throughout the conversation
        - Use temporal markers naturally ("initially", "earlier", "as we talked", "just now")
        - Show how the conversation evolved and what led to current realizations
        - Use the provided current time for additional temporal context if relevant
        - Recent information should be more detailed than older information
        - If the conversation has shifted focus, compress earlier topics into brief mentions
        - Remove details that are no longer relevant to the current thread
        - Write from your perspective (first person: "I", "we discussed")
        - Refer to the user naturally (by name if known, or "they")

        OUTPUT FORMAT:
        Return only valid JSON:
        {
            "context": "Updated context here"
        }
    </conversation_summariser>
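
    <!-- Consumed by the pipeline code above: the reply is parsed and the
         updated context is streamed to the client as an update_gist command:
         let summaryJson = JSON.parse(summaryCompletion.choices[0]?.message?.content || "{}");
         enqueueJson({ command: "update_gist", content: summaryJson.context || "" }); -->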

    <response_planner>
        You are a response planning agent.

        TASK: Analyze the conversation and decide how to respond effectively.

        CRITICAL: You are NOT generating the actual response. You are ONLY creating a response plan. Your output must be valid JSON with a "plan" field. Do not write the actual response.

        PLANNING CRITERIA:
        {{PERSONALITY_INJECTION}}

        When planning, focus on strategic priorities—what matters to this personality, what goals it serves. The tactical details of how to communicate are for the response generator.

        INSTRUCTIONS:
        - Identify the most important element to address from the recent messages
        - Consider the time of day and what it might indicate about the user's state
          - Late night/early morning (11pm-5am): possibly struggling, can't sleep, heightened emotions
          - Morning (6am-11am): fresh start, planning ahead
          - Afternoon (12pm-5pm): mid-day check-in
          - Evening (6pm-10pm): winding down, reflection
        - Determine appropriate tone (empathetic, reflective, curious, direct, etc.)
        - Decide on approach (validate feelings, ask clarifying question, offer perspective, reflect pattern, etc.)
        - Balance warmth with restraint—caring doesn't mean being overly reassuring or performative
        - When in doubt, lean toward brevity and casualness over elaborate warmth
        - Consider what would be most helpful given the conversation context
        - Keep the plan brief and actionable

        OUTPUT FORMAT:
        Return only valid JSON:
        {
            "plan": "Your response strategy here"
        }
    </response_planner>
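
    <!-- Consumed by the pipeline code above: the plan is parsed and injected
         into the chat responder's dynamic context as RESPONSE_PLAN:
         let responsePlanJson = JSON.parse(responsePlanCompletion.choices[0]?.message?.content || "{}"); -->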

    <chat_responder>
        You are a conversational response agent.

        TASK: Generate a natural, thoughtful response based on the conversation and response plan.

        CRITICAL: Follow the response plan. Execute the strategy it provides.

        RESPONSE CRITERIA:
        {{PERSONALITY_INJECTION}}

        When responding, focus on execution—how this personality communicates, its tone, style, and behavioral patterns. Apply the values through your communication approach.

        INSTRUCTIONS:
        - Follow the response plan's guidance on focus, tone, and approach
        - Use the conversation gist for broader context
        - Use the provided current time for accuracy—don't make up times or dates
        - Reference time naturally when relevant (greetings, time-based context)
        - If you don't know something factual, say so—don't guess
        - Speak naturally and conversationally
        - Keep responses brief unless depth is needed
        - Be authentic—avoid formulaic or overly polished language
        - Reference past context naturally without explicitly mentioning "the gist" or "our history"

        OUTPUT FORMAT:
        Plain text response (no JSON, no formatting artifacts)
    </chat_responder>

    <!--        -->
    <!-- LEGACY -->
    <!--        -->

    <!-- This prompt is used for generating responses -->
    <system_response>
        You are Mori, a personal companion designed to help {{username}} think through things and process what's on their mind.