Added JSON / Summary LLM safeguard

2026-03-26 12:50:52 -04:00 · 2026-03-26 12:33:50 -04:00 · 2026-03-26 12:24:20 -04:00 · 2026-03-21 14:34:24 -04:00 · 2026-03-13 18:55:38 -04:00 · 2026-03-03 00:26:00 -05:00
4 changed files with 199 additions and 33 deletions
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@ztimson/ai-utils",
-	"version": "0.8.3",
+	"version": "0.8.14",
 	"description": "AI Utility library",
 	"author": "Zak Timson",
 	"license": "MIT",
--- a/src/llm.ts
+++ b/src/llm.ts
@@ -1,3 +1,4 @@
+import {sum} from '@tensorflow/tfjs';
 import {JSONAttemptParse} from '@ztimson/utils';
 import {AbortablePromise, Ai} from './ai.ts';
 import {Anthropic} from './antrhopic.ts';
@@ -117,12 +118,13 @@ class LLM {
 						const score = (o ? this.cosineSimilarity(m.embeddings[0], o[0].embedding) : 0)
 							+ (q ? this.cosineSimilarity(m.embeddings[1], q[0].embedding) : 0);
 						return {...m, score};
-					}).toSorted((a: any, b: any) => a.score - b.score).slice(0, limit);
+					}).toSorted((a: any, b: any) => a.score - b.score).slice(0, limit)
+						.map(m => `- ${m.owner}: ${m.fact}`).join('\n');
 				}

 				options.system += '\nYou have RAG memory and will be given the top_k closest memories regarding the users query. Save anything new you have learned worth remembering from the user message using the remember tool and feel free to recall memories manually.\n';
 				const relevant = await search(message);
-				if(relevant.length) options.history.push({role: 'tool', name: 'recall', id: 'auto_recall_' + Math.random().toString(), args: {}, content: 'Things I remembered:\n' + relevant.map(m => `${m.owner}: ${m.fact}`).join('\n')});
+				if(relevant.length) options.history.push({role: 'tool', name: 'recall', id: 'auto_recall_' + Math.random().toString(), args: {}, content: `Things I remembered:\n${relevant}`});
 				options.tools = [{
 					name: 'recall',
 					description: 'Recall the closest memories you have regarding a query using RAG',
@@ -151,7 +153,7 @@ class LLM {
 						const newMem = {owner: args.owner, fact: args.fact, embeddings: <any>[e[0][0].embedding, e[1][0].embedding]};
 						options.memory.splice(0, options.memory.length, ...[
 							...options.memory.filter(m => {
-								return this.cosineSimilarity(newMem.embeddings[0], m.embeddings[0]) < 0.9 && this.cosineSimilarity(newMem.embeddings[1], m.embeddings[1]) < 0.8;
+								return !(this.cosineSimilarity(newMem.embeddings[0], m.embeddings[0]) >= 0.9 && this.cosineSimilarity(newMem.embeddings[1], m.embeddings[1]) >= 0.8);
 							}),
 							newMem
 						]);
@@ -356,11 +358,30 @@ class LLM {
 	 * @returns {Promise<{} | {} | RegExpExecArray | null>}
 	 */
 	async json(text: string, schema: string, options?: LLMRequest): Promise<any> {
-		const code = await this.code(text, {...options, system: [
-			options?.system,
-			`Only respond using JSON matching this schema:\n\`\`\`json\n${schema}\n\`\`\``
-		].filter(t => !!t).join('\n')});
-		return code ? JSONAttemptParse(code, {}) : null;
+		let system =  `Your job is to convert input to JSON using tool calls. Call the \`submit\` tool at least once with JSON matching this schema:\n\`\`\`json\n${schema}\n\`\`\`\n\nResponses are ignored`;
+		if(options?.system) system += '\n\n' + options.system;
+		return new Promise(async (resolve, reject) => {
+			let done = false;
+			const resp = await this.ask(text, {
+				temperature: 0.3,
+				...options,
+				system,
+				tools: [{
+					name: 'submit',
+					description: 'Submit JSON',
+					args: {json: {type: 'string', description: 'Javascript parsable JSON string', required: true}},
+					fn: (args) => {
+						try {
+							const json = JSON.parse(args.json);
+							resolve(json);
+							done = true;
+						} catch { return 'Invalid JSON'; }
+						return 'Saved';
+					}
+				}, ...(options?.tools || [])],
+			});
+			if(!done) reject(`AI failed to create JSON:\n${resp}`);
+		});
 	}

 	/**
@@ -370,8 +391,31 @@ class LLM {
 	 * @param options LLM request options
 	 * @returns {Promise<string>} Summary
 	 */
-	summarize(text: string, tokens: number = 500, options?: LLMRequest): Promise<string | null> {
-		return this.ask(text, {system: `Generate the shortest summary possible <= ${tokens} tokens. Output nothing else`, temperature: 0.3, ...options});
+	async summarize(text: string, tokens: number = 500, options?: LLMRequest): Promise<string | null> {
+		let system =  `Your job is to summarize the users message using tool calls. Call the \`submit\` tool at least once with the shortest summary possible that's <= ${tokens} tokens. The tool call will respond with the token count. Responses are ignored`;
+		if(options?.system) system += '\n\n' + options.system;
+		return new Promise(async (resolve, reject) => {
+			let done = false;
+			const resp = await this.ask(text, {
+				temperature: 0.3,
+				...options,
+				system,
+				tools: [{
+					name: 'submit',
+					description: 'Submit summary',
+					args: {summary: {type: 'string', description: 'Text summarization', required: true}},
+					fn: (args) => {
+						if(!args.summary) return 'No summary provided';
+						const count = this.estimateTokens(args.summary);
+						if(count > tokens) return `Summary is too long (${count} tokens)`;
+						done = true;
+						resolve(args.summary || null);
+						return `Saved (${count} tokens)`;
+					}
+				}, ...(options?.tools || [])],
+			});
+			if(!done) reject(`AI failed to create summary:\n${resp}`);
+		});
 	}
 }

--- a/src/open-ai.ts
+++ b/src/open-ai.ts
@@ -103,15 +103,37 @@ export class OpenAi extends LLMProvider {
 				if(options.stream) {
 					if(!isFirstMessage) options.stream({text: '\n\n'});
 					else isFirstMessage = false;
-					resp.choices = [{message: {content: '', tool_calls: []}}];
+					resp.choices = [{message: {role: 'assistant', content: '', tool_calls: []}}];
 					for await (const chunk of resp) {
 						if(controller.signal.aborted) break;
 						if(chunk.choices[0].delta.content) {
 							resp.choices[0].message.content += chunk.choices[0].delta.content;
 							options.stream({text: chunk.choices[0].delta.content});
 						}
+
 						if(chunk.choices[0].delta.tool_calls) {
-							resp.choices[0].message.tool_calls = chunk.choices[0].delta.tool_calls;
+							for(const deltaTC of chunk.choices[0].delta.tool_calls) {
+								const existing = resp.choices[0].message.tool_calls.find(tc => tc.index === deltaTC.index);
+								if(existing) {
+									if(deltaTC.id) existing.id = deltaTC.id;
+									if(deltaTC.type) existing.type = deltaTC.type;
+									if(deltaTC.function) {
+										if(!existing.function) existing.function = {};
+										if(deltaTC.function.name) existing.function.name = deltaTC.function.name;
+										if(deltaTC.function.arguments) existing.function.arguments = (existing.function.arguments || '') + deltaTC.function.arguments;
+									}
+								} else {
+									resp.choices[0].message.tool_calls.push({
+										index: deltaTC.index,
+										id: deltaTC.id || '',
+										type: deltaTC.type || 'function',
+										function: {
+											name: deltaTC.function?.name || '',
+											arguments: deltaTC.function?.arguments || ''
+										}
+									});
+								}
+							}
 						}
 					}
 				}
--- a/src/tools.ts
+++ b/src/tools.ts
@@ -1,9 +1,15 @@
-import * as cheerio from 'cheerio';
-import {$, $Sync} from '@ztimson/node-utils';
+import  * as cheerio from 'cheerio';
+import {$Sync} from '@ztimson/node-utils';
 import {ASet, consoleInterceptor, Http, fn as Fn} from '@ztimson/utils';
+import * as os from 'node:os';
 import {Ai} from './ai.ts';
 import {LLMRequest} from './llm.ts';

+const getShell = () => {
+	if(os.platform() == 'win32') return 'cmd';
+	return $Sync`echo $SHELL`?.split('/').pop() || 'bash';
+}
+
 export type AiToolArg = {[key: string]: {
 	/** Argument type */
 	type: 'array' | 'boolean' | 'number' | 'object' | 'string',
@@ -40,11 +46,18 @@ export const CliTool: AiTool = {
 	name: 'cli',
 	description: 'Use the command line interface, returns any output',
 	args: {command: {type: 'string', description: 'Command to run', required: true}},
-	fn: (args: {command: string}) => $`${args.command}`
+	fn: (args: {command: string}) => $Sync`${args.command}`
 }

 export const DateTimeTool: AiTool = {
 	name: 'get_datetime',
+	description: 'Get local date / time',
+	args: {},
+	fn: async () => new Date().toString()
+}
+
+export const DateTimeUTCTool: AiTool = {
+	name: 'get_datetime_utc',
 	description: 'Get current UTC date / time',
 	args: {},
 	fn: async () => new Date().toUTCString()
@@ -54,19 +67,20 @@ export const ExecTool: AiTool = {
 	name: 'exec',
 	description: 'Run code/scripts',
 	args: {
-		language: {type: 'string', description: 'Execution language', enum: ['cli', 'node', 'python'], required: true},
+		language: {type: 'string', description: `Execution language (CLI: ${getShell()})`, enum: ['cli', 'node', 'python'], required: true},
 		code: {type: 'string', description: 'Code to execute', required: true}
 	},
 	fn: async (args, stream, ai) => {
 		try {
-			switch(args.type) {
-				case 'bash':
+			switch(args.language) {
+				case 'cli':
 					return await CliTool.fn({command: args.code}, stream, ai);
 				case 'node':
 					return await JSTool.fn({code: args.code}, stream, ai);
-				case 'python': {
+				case 'python':
 					return await PythonTool.fn({code: args.code}, stream, ai);
-				}
+				default:
+					throw new Error(`Unsupported language: ${args.language}`);
 			}
 		} catch(err: any) {
 			return {error: err?.message || err.toString()};
@@ -98,9 +112,9 @@ export const JSTool: AiTool = {
 		code: {type: 'string', description: 'CommonJS javascript', required: true}
 	},
 	fn: async (args: {code: string}) => {
-		const console = consoleInterceptor(null);
-		const resp = await Fn<any>({console}, args.code, true).catch((err: any) => console.output.error.push(err));
-		return {...console.output, return: resp, stdout: undefined, stderr: undefined};
+		const c = consoleInterceptor(null);
+		const resp = await Fn<any>({console: c}, args.code, true).catch((err: any) => c.output.error.push(err));
+		return {...c.output, return: resp, stdout: undefined, stderr: undefined};
 	}
 }

@@ -115,24 +129,82 @@ export const PythonTool: AiTool = {

 export const ReadWebpageTool: AiTool = {
 	name: 'read_webpage',
-	description: 'Extract clean, structured content from a webpage. Use after web_search to read specific URLs',
+	description: 'Extract clean, structured content from a webpage or convert media/documents to accessible formats',
 	args: {
 		url: {type: 'string', description: 'URL to extract content from', required: true},
-		focus: {type: 'string', description: 'Optional: What aspect to focus on (e.g., "pricing", "features", "contact info")'}
+		mimeRegex: {type: 'string', description: 'Optional: Regex pattern to filter MIME types (e.g., "^image/", "text/", "application/pdf")'},
+		maxSize: {type: 'number', description: 'Optional: Max file size in bytes for binary content (default: 10MB)'}
 	},
-	fn: async (args: {url: string; focus?: string}) => {
-		const html = await fetch(args.url, {headers: {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64)"}})
-			.then(r => r.text()).catch(err => {throw new Error(`Failed to fetch: ${err.message}`)});
+	fn: async (args: {url: string; mimeRegex?: string;}) => {
+		const maxSize = 10 * 1024 * 1024; // 10 MB

+		const response = await fetch(args.url, {
+			headers: {
+				"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36",
+				"Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
+				"Accept-Language": "en-US,en;q=0.5"
+			},
+			redirect: 'follow'
+		}).catch(err => {throw new Error(`Failed to fetch: ${err.message}`)});
+
+		const contentType = response.headers.get('content-type') || '';
+		const mimeType = contentType.split(';')[0].trim().toLowerCase();
+		const charset = contentType.match(/charset=([^;]+)/)?.[1] || 'utf-8';
+
+		// Filter by MIME type if specified
+		if (args.mimeRegex) {
+			const regex = new RegExp(args.mimeRegex, 'i');
+			if (!regex.test(mimeType)) {
+				return {url: args.url, error: 'MIME type rejected', mimeType, filter: args.mimeRegex};
+			}
+		}
+
+		// Handle images, audio, video -> data URL
+		if (mimeType.startsWith('image/') || mimeType.startsWith('audio/') || mimeType.startsWith('video/')) {
+			const buffer = await response.arrayBuffer();
+			if (buffer.byteLength > maxSize) {
+				return {url: args.url, type: 'media', mimeType, error: 'File too large', size: buffer.byteLength, maxSize};
+			}
+			const base64 = Buffer.from(buffer).toString('base64');
+			return {url: args.url, type: 'media', mimeType, dataUrl: `data:${mimeType};base64,${base64}`, size: buffer.byteLength};
+		}
+
+		// Handle plain text, json, xml, csv
+		if (mimeType.match(/^(text\/(plain|csv|xml)|application\/(json|xml|csv|x-yaml))/) ||
+			args.url.match(/\.(txt|json|xml|csv|yaml|yml|md)$/i)) {
+			const text = await response.text();
+			return {url: args.url, type: 'text', mimeType, content: text.slice(0, 100000)};
+		}
+
+		// Handle PDFs and other binaries -> data URL
+		if (mimeType === 'application/pdf' || mimeType.startsWith('application/') && !mimeType.includes('html')) {
+			const buffer = await response.arrayBuffer();
+			if (buffer.byteLength > maxSize) {
+				return {url: args.url, type: 'binary', mimeType, error: 'File too large', size: buffer.byteLength, maxSize};
+			}
+			const base64 = Buffer.from(buffer).toString('base64');
+			return {url: args.url, type: 'binary', mimeType, dataUrl: `data:${mimeType};base64,${base64}`, size: buffer.byteLength};
+		}
+
+		// Default HTML handling
+		const html = await response.text();
 		const $ = cheerio.load(html);
-		$('script, style, nav, footer, header, aside, iframe, noscript, [role="navigation"], [role="banner"], .ad, .ads, .cookie, .popup').remove();
+
+		// Remove noise
+		$('script, style, nav, footer, header, aside, iframe, noscript, svg, [role="navigation"], [role="banner"], [role="complementary"], .ad, .ads, .advertisement, .cookie, .popup, .modal, .sidebar, .related, .comments, .social-share').remove();
+
+		// Extract metadata
 		const metadata = {
 			title: $('meta[property="og:title"]').attr('content') || $('title').text() || '',
 			description: $('meta[name="description"]').attr('content') || $('meta[property="og:description"]').attr('content') || '',
+			author: $('meta[name="author"]').attr('content') || '',
+			published: $('meta[property="article:published_time"]').attr('content') || $('time').attr('datetime') || '',
+			image: $('meta[property="og:image"]').attr('content') || ''
 		};

+		// Extract structured content
 		let content = '';
-		const contentSelectors = ['article', 'main', '[role="main"]', '.content', '.post', '.entry', 'body'];
+		const contentSelectors = ['article', 'main', '[role="main"]', '.content', '.post-content', '.entry-content', '.article-content', 'body'];
 		for (const selector of contentSelectors) {
 			const el = $(selector).first();
 			if (el.length && el.text().trim().length > 200) {
@@ -141,9 +213,37 @@ export const ReadWebpageTool: AiTool = {
 			}
 		}
 		if (!content) content = $('body').text();
-		content = content.replace(/\s+/g, ' ').trim().slice(0, 8000);

-		return {url: args.url, title: metadata.title.trim(), description: metadata.description.trim(), content, focus: args.focus};
+		// Clean whitespace but preserve structure
+		content = content
+			.replace(/\n\s*\n\s*\n/g, '\n\n')
+			.replace(/[ \t]+/g, ' ')
+			.trim()
+			.slice(0, 50000);
+
+		// Extract links if minimal content
+		let links: any[] = [];
+		if (content.length < 500) {
+			$('a[href]').each((_, el) => {
+				const href = $(el).attr('href');
+				const text = $(el).text().trim();
+				if (href && text && !href.startsWith('#')) {
+					links.push({text, href});
+				}
+			});
+			links = links.slice(0, 50);
+		}
+
+		return {
+			url: args.url,
+			type: 'html',
+			title: metadata.title.trim(),
+			description: metadata.description.trim(),
+			author: metadata.author.trim(),
+			published: metadata.published,
+			content,
+			links: links.length ? links : undefined,
+		};
 	}
 }
Author	SHA1	Message	Date
ztimson	eda4eed87d	Added JSON / Summary LLM safeguard All checks were successful Publish Library / Build NPM Project (push) Successful in 41s Details Publish Library / Tag Version (push) Successful in 21s Details	2026-03-26 12:50:52 -04:00
ztimson	7f88c2d1d0	Added JSON / Summary LLM safeguard All checks were successful Publish Library / Build NPM Project (push) Successful in 1m17s Details Publish Library / Tag Version (push) Successful in 13s Details	2026-03-26 12:33:50 -04:00
ztimson	5eae84f6cf	Added JSON / Summary LLM safeguard All checks were successful Publish Library / Build NPM Project (push) Successful in 1m1s Details Publish Library / Tag Version (push) Successful in 14s Details	2026-03-26 12:24:20 -04:00
ztimson	52a3e73484	Improved read_webpage tool All checks were successful Publish Library / Build NPM Project (push) Successful in 57s Details Publish Library / Tag Version (push) Successful in 14s Details	2026-03-21 14:34:24 -04:00
ztimson	ccb1bdf043	Added Non-UTC version of date/time tool All checks were successful Publish Library / Build NPM Project (push) Successful in 54s Details Publish Library / Tag Version (push) Successful in 6s Details	2026-03-13 18:55:38 -04:00
ztimson	b814ea8b28	Improved memory recall results All checks were successful Publish Library / Build NPM Project (push) Successful in 42s Details Publish Library / Tag Version (push) Successful in 10s Details	2026-03-03 00:26:00 -05:00
ztimson	06dda88dbc	Removed log statements All checks were successful Publish Library / Build NPM Project (push) Successful in 36s Details Publish Library / Tag Version (push) Successful in 10s Details	2026-03-02 14:00:58 -05:00
ztimson	5d34652d46	Fixed CLI tool All checks were successful Publish Library / Build NPM Project (push) Successful in 39s Details Publish Library / Tag Version (push) Successful in 10s Details	2026-03-01 18:11:25 -05:00
ztimson	6454548364	Fixed CLI tool All checks were successful Publish Library / Build NPM Project (push) Successful in 41s Details Publish Library / Tag Version (push) Successful in 9s Details	2026-03-01 17:18:30 -05:00
ztimson	936317f2f2	Better memory de-duplication All checks were successful Publish Library / Build NPM Project (push) Successful in 37s Details Publish Library / Tag Version (push) Successful in 10s Details	2026-03-01 00:11:17 -05:00
ztimson	cfde2ac4d3	Fixed open AI tool call streaming! All checks were successful Publish Library / Build NPM Project (push) Successful in 42s Details Publish Library / Tag Version (push) Successful in 8s Details	2026-02-27 13:11:41 -05:00