From 0b9b9ab440cee0cd0e5413d28ea648cc1c7540cd Mon Sep 17 00:00:00 2001 From: Martin McKeaveney Date: Tue, 1 Oct 2024 14:56:16 +0100 Subject: [PATCH] AI functionality working E2E --- .../common/AIFieldConfiguration.svelte | 4 +- .../src/utilities/rowProcessor/utils.ts | 52 +++++++++++-------- 2 files changed, 31 insertions(+), 25 deletions(-) diff --git a/packages/builder/src/components/common/AIFieldConfiguration.svelte b/packages/builder/src/components/common/AIFieldConfiguration.svelte index 66af1266be..73e0562dbe 100644 --- a/packages/builder/src/components/common/AIFieldConfiguration.svelte +++ b/packages/builder/src/components/common/AIFieldConfiguration.svelte @@ -47,11 +47,11 @@ prompt: OperationFieldTypes.BINDABLE_TEXT, }, CLEAN_DATA: { - columns: OperationFieldTypes.MULTI_COLUMN, + column: OperationFieldTypes.COLUMN, prompt: OperationFieldTypes.BINDABLE_TEXT, }, TRANSLATE: { - columns: OperationFieldTypes.MULTI_COLUMN, + column: OperationFieldTypes.COLUMN, language: OperationFieldTypes.BINDABLE_TEXT, prompt: OperationFieldTypes.BINDABLE_TEXT, }, diff --git a/packages/server/src/utilities/rowProcessor/utils.ts b/packages/server/src/utilities/rowProcessor/utils.ts index 30942edc93..6055a2511c 100644 --- a/packages/server/src/utilities/rowProcessor/utils.ts +++ b/packages/server/src/utilities/rowProcessor/utils.ts @@ -102,8 +102,9 @@ export async function processAIColumns( ): Promise { return tracer.trace("processAIColumns", {}, async span => { const numRows = Array.isArray(inputRows) ? inputRows.length : 1 - span?.addTags({ table_id: table._id }) + span?.addTags({ table_id: table._id, numRows }) const rows = Array.isArray(inputRows) ? 
inputRows : [inputRows] + const llm = await pro.ai.LargeLanguageModel.forCurrentTenant("gpt-4o-mini") if (rows) { // Ensure we have snippet context await context.ensureSnippetContext() @@ -113,29 +114,34 @@ export async function processAIColumns( continue } - // const llm = pro.ai.LargeLanguageModel() - // if ( - // schema.formula == null || - // (dynamic && isStatic) || - // (!dynamic && !isStatic) - // ) { - // continue - // } - // iterate through rows and process formula - for (let i = 0; i < rows.length; i++) { - let row = rows[i] - // let context = contextRows ? contextRows[i] : row - // let formula = schema.prompt - rows[i] = { - ...row, - [column]: tracer.trace("processAIColumn", {}, span => { - span?.addTags({ table_id: table._id, column }) - // return processStringSync(formula, context) - // TODO: Add the AI stuff in to this - return "YEET AI" - }), + const rowUpdates = rows.map((row, i) => { + const contextRow = contextRows ? contextRows[i] : row + // TODO: Map the prompts with string-templates + // grab the operation based on the schema + // then check the types in the fields, and decide whether to pass them through string templates + // TODO: cleaner way to map to the schema, move things into BB types and check against the AI schema + for (const key in schema) { + if (["prompt", "categories"].includes(key)) { + schema[key] = processStringSync(schema[key], contextRow) + } } - } + + const prompt = llm.buildPromptFromAIOperation({ schema, row }) + + return tracer.trace("processAIColumn", {}, async span => { + span?.addTags({ table_id: table._id, column }) + const llmResponse = await llm.run(prompt) + return { + ...row, + [column]: llmResponse + } + }) + }) + + const processedRows = await Promise.all(rowUpdates) + + // Promise.all is deterministic so can rely on the indexing here + processedRows.forEach((processedRow, index) => rows[index] = processedRow) } } return Array.isArray(inputRows) ? rows : rows[0]