/* This Source Code Form is subject to the terms of the Mozilla Public * License, v. 2.0. If a copy of the MPL was not distributed with this * file, You can obtain one at https://mozilla.org/MPL/2.0/. */ /** * This module defines functions to generate, deduplicate, and filter memories. * * The primary method in this module is `generateMemories`, which orchestrates the entire pipeline: * 1. Generates initial memories from a specified user data user * 2. Deduplicates the newly generated memories against all existing memories * 3. Filters out memories with sensitive content (i.e. financial, medical, etc.) * 4. Returns the final list of memories objects * * `generateMemories` requires 3 arguments: * 1. `engine`: an instance of `openAIEngine` to call the LLM API * 2. `sources`: an object mapping user data source types to aggregated records (i.e., {history: [domainItems, titleItems, searchItems]}) * 3. `existingMemoriesList`: an array of existing memory summary strings to deduplicate against * * Example Usage: * const engine = await openAIEngine.build(MODEL_FEATURES.MEMORIES, DEFAULT_ENGINE_ID, SERVICE_TYPES.MEMORIES); * const sources = {history: [domainItems, titleItems, searchItems]}; * const existingMemoriesList = [...]; // Array of existing memory summary strings; this should be fetched from memory storage * const newMemories = await generateMemories(engine, sources, existingMemoriesList); * */ import { renderPrompt, openAIEngine, MODEL_FEATURES } from "../Utils.sys.mjs"; import { HISTORY, CONVERSATION, CATEGORIES, CATEGORIES_LIST, INTENTS, INTENTS_LIST, } from "./MemoriesConstants.sys.mjs"; import { INITIAL_MEMORIES_SCHEMA, MEMORIES_DEDUPLICATION_SCHEMA, MEMORIES_NON_SENSITIVE_SCHEMA, } from "moz-src:///browser/components/aiwindow/models/memories/MemoriesSchemas.sys.mjs"; /** * Generates, deduplicates, and filters memories end-to-end * * This is the main pipeline function. * * @param {OpenAIEngine} engine openAIEngine instance to call LLM API * @param {object} sources User data source type to aggregrated records (i.e., {history: [domainItems, titleItems, searchItems]}) * @param {Array} existingMemoriesList List of existing memory summary strings to deduplicate against * @returns {Promise>>} Promise resolving the final list of generated, deduplicated, and filtered memory objects */ export async function generateMemories(engine, sources, existingMemoriesList) { // Step 1: Generate initial memories const initialMemories = await generateInitialMemoriesList(engine, sources); // If we don't generate any new memories, just return an empty list immediately instead of doing the rest of the steps if (!initialMemories || initialMemories.length === 0) { return []; } // Step 2: Deduplicate against existing memories const initialMemoriesSummaries = initialMemories.map( memory => memory.memory_summary ); const dedupedMemoriesSummaries = await deduplicateMemories( engine, existingMemoriesList, initialMemoriesSummaries ); // If we don't have any deduped memories, no new memories were generated or we ran into an unexpected JSON parse error, so return an empty list if (!dedupedMemoriesSummaries || dedupedMemoriesSummaries.length === 0) { return []; } // Step 3: Filter out sensitive memories const nonSensitiveMemoriesSummaries = await filterSensitiveMemories( engine, dedupedMemoriesSummaries ); // Step 4: Map back to full memory objects and return return await mapFilteredMemoriesToInitialList( initialMemories, nonSensitiveMemoriesSummaries ); } /** * Formats a list of strings into a prompt-friendly bullet list * * @param {List} list * @returns {string} */ export function formatListForPrompt(list) { return list.map(item => `- "${item}"`).join("\n"); } /** * Utility function to cleanly get bullet-formatted category and memory lists * * @param {string} attributeName "categories" or "intents" * @returns {string} Formatted list string */ export function getFormattedMemoryAttributeList(attributeName) { if (attributeName === CATEGORIES) { return formatListForPrompt(CATEGORIES_LIST); } else if (attributeName === INTENTS) { return formatListForPrompt(INTENTS_LIST); } throw new Error(`Unsupported memory attribute name: ${attributeName}`); } /** * Extracts a JSON as a map from an LLM response (handles markdown-formatted code blocks) * * @param {any} response LLM response * @param {any} fallback Fallback value if parsing fails to protect downstream code * @returns {Map} Parsed JSON object */ export function parseAndExtractJSON(response, fallback) { const rawContent = response?.finalOutput ?? ""; const markdownMatch = rawContent.match(/```(?:json)?\s*([\s\S]*?)\s*```/i); const payload = markdownMatch ? markdownMatch[1] : rawContent; try { return JSON.parse(payload); } catch (e) { // If we can't parse a JSON from the LLM response, return a tailored fallback value to prevent downstream code failures if (e instanceof SyntaxError) { console.warn( `Could not parse JSON from LLM response; using fallback (${fallback}): ${e.message}` ); return fallback; } throw new Error( `Unexpected error parsing JSON from LLM response: ${e.message}` ); } } /** * Renders recent history records into CSV tables for prompt input * * @param {Array>} domainItems List of aggregated domain items * @param {Array>} titleItems List of aggregated title items * @param {Array