5 Commits

Author SHA1 Message Date
a5ed4076b7 Handle anthropic multiple responses better.
All checks were successful
Publish Library / Build NPM Project (push) Successful in 34s
Publish Library / Tag Version (push) Successful in 8s
2025-12-16 12:22:14 -05:00
0112c92505 Removed log statements
All checks were successful
Publish Library / Build NPM Project (push) Successful in 20s
Publish Library / Tag Version (push) Successful in 5s
2025-12-14 21:16:39 -05:00
2351f590b5 Removed ASR file intermediary
All checks were successful
Publish Library / Build NPM Project (push) Successful in 37s
Publish Library / Tag Version (push) Successful in 8s
2025-12-14 09:27:07 -05:00
2c2acef84e ASR logging
All checks were successful
Publish Library / Build NPM Project (push) Successful in 37s
Publish Library / Tag Version (push) Successful in 8s
2025-12-14 08:49:02 -05:00
a6de121551 Fixed ASR command
All checks were successful
Publish Library / Build NPM Project (push) Successful in 26s
Publish Library / Tag Version (push) Successful in 7s
2025-12-13 23:19:30 -05:00
3 changed files with 51 additions and 40 deletions

View File

@@ -1,6 +1,6 @@
{ {
"name": "@ztimson/ai-utils", "name": "@ztimson/ai-utils",
"version": "0.1.11", "version": "0.1.16",
"description": "AI Utility library", "description": "AI Utility library",
"author": "Zak Timson", "author": "Zak Timson",
"license": "MIT", "license": "MIT",

View File

@@ -1,25 +1,21 @@
import {$} from '@ztimson/node-utils';
import {createWorker} from 'tesseract.js'; import {createWorker} from 'tesseract.js';
import {LLM, LLMOptions} from './llm'; import {LLM, LLMOptions} from './llm';
import fs from 'node:fs/promises'; import fs from 'node:fs/promises';
import Path from 'node:path'; import Path from 'node:path';
import * as tf from '@tensorflow/tfjs'; import * as tf from '@tensorflow/tfjs';
import {spawn} from 'node:child_process';
export type AiOptions = LLMOptions & { export type AiOptions = LLMOptions & {
whisper?: { whisper?: {
/** Whisper binary location */ /** Whisper binary location */
binary: string; binary: string;
/** Model */ /** Model: `ggml-base.en.bin` */
model: WhisperModel; model: string;
/** Path to models */ /** Path to models */
path: string; path: string;
/** Path to storage location for temporary files */
temp?: string;
} }
} }
export type WhisperModel = 'tiny' | 'base' | 'small' | 'medium' | 'large';
export class Ai { export class Ai {
private downloads: {[key: string]: Promise<string>} = {}; private downloads: {[key: string]: Promise<string>} = {};
private whisperModel!: string; private whisperModel!: string;
@@ -30,7 +26,7 @@ export class Ai {
constructor(public readonly options: AiOptions) { constructor(public readonly options: AiOptions) {
this.llm = new LLM(this, options); this.llm = new LLM(this, options);
if(this.options.whisper?.binary) { if(this.options.whisper?.binary) {
this.whisperModel = Path.join(<string>this.options.whisper?.path, this.options.whisper?.model + this.options.whisper?.model.endsWith('.bin') ? '' : '.bin'); this.whisperModel = this.options.whisper?.model.endsWith('.bin') ? this.options.whisper?.model : this.options.whisper?.model + '.bin';
this.downloadAsrModel(); this.downloadAsrModel();
} }
} }
@@ -41,16 +37,23 @@ export class Ai {
* @param model Whisper model * @param model Whisper model
* @returns {Promise<any>} Extracted text * @returns {Promise<any>} Extracted text
*/ */
async asr(path: string, model?: WhisperModel): Promise<string | null> { asr(path: string, model: string = this.whisperModel): {abort: () => void, response: Promise<string | null>} {
if(!this.options.whisper?.binary) throw new Error('Whisper not configured'); if(!this.options.whisper?.binary) throw new Error('Whisper not configured');
const m = await this.downloadAsrModel(model); let abort: any = () => {};
const name = Math.random().toString(36).substring(2, 10) + '-' + path.split('/').pop() + '.txt'; const response = new Promise<string | null>((resolve, reject) => {
const output = Path.join(this.options.whisper.temp || '/tmp', name); this.downloadAsrModel(model).then(m => {
console.log(this.options.whisper?.model + ' -> ' + this.whisperModel); let output = '';
console.log(`rm -f ${output} && ${this.options.whisper.binary} -nt -np -m ${m} -f ${path} -otxt -of ${output}`); const proc = spawn(<string>this.options.whisper?.binary, ['-nt', '-np', '-m', m, '-f', path], {stdio: ['ignore', 'pipe', 'ignore']});
await $`rm -f ${output} && ${this.options.whisper.binary} -nt -np -m ${m} -f ${path} -otxt -of ${output}`; abort = () => proc.kill('SIGTERM');
return fs.readFile(output, 'utf-8').then(text => text?.trim() || null) proc.on('error', (err: Error) => reject(err));
.finally(() => fs.rm(output, {force: true}).catch(() => {})); proc.stdout.on('data', (data: Buffer) => output += data.toString());
proc.on('close', (code: number) => {
if(code === 0) resolve(output.trim() || null);
else reject(new Error(`Exit code ${code}`));
});
});
});
return {response, abort};
} }
/** /**
@@ -59,20 +62,20 @@ export class Ai {
* @param {string} model Whisper model that will be downloaded * @param {string} model Whisper model that will be downloaded
* @return {Promise<string>} Absolute path to model file, resolves once downloaded * @return {Promise<string>} Absolute path to model file, resolves once downloaded
*/ */
async downloadAsrModel(model?: string): Promise<string> { async downloadAsrModel(model: string = this.whisperModel): Promise<string> {
if(!this.options.whisper?.binary) throw new Error('Whisper not configured'); if(!this.options.whisper?.binary) throw new Error('Whisper not configured');
const m = model ? (model.endsWith('.bin') ? model : model + '.bin') : this.whisperModel.split('/').pop()!; if(!model.endsWith('.bin')) model += '.bin';
const p = Path.join(this.options.whisper.path, m); const p = Path.join(this.options.whisper.path, model);
if(await fs.stat(p).then(() => true).catch(() => false)) return p; if(await fs.stat(p).then(() => true).catch(() => false)) return p;
if(!!this.downloads[m]) return this.downloads[m]; if(!!this.downloads[model]) return this.downloads[model];
this.downloads[m] = fetch(`https://huggingface.co/ggerganov/whisper.cpp/resolve/main/${m}`) this.downloads[model] = fetch(`https://huggingface.co/ggerganov/whisper.cpp/resolve/main/${model}`)
.then(resp => resp.arrayBuffer()) .then(resp => resp.arrayBuffer())
.then(arr => Buffer.from(arr)).then(async buffer => { .then(arr => Buffer.from(arr)).then(async buffer => {
await fs.writeFile(p, buffer); await fs.writeFile(p, buffer);
delete this.downloads[m]; delete this.downloads[model];
return p; return p;
}); });
return this.downloads[m]; return this.downloads[model];
} }
/** /**

View File

@@ -13,24 +13,29 @@ export class Anthropic extends LLMProvider {
} }
private toStandard(history: any[]): LLMMessage[] { private toStandard(history: any[]): LLMMessage[] {
const merged: any[] = [];
for(let i = 0; i < history.length; i++) { for(let i = 0; i < history.length; i++) {
const orgI = i; const msg = history[i];
if(typeof history[orgI].content != 'string') { if(typeof msg.content != 'string') {
if(history[orgI].role == 'assistant') { if(msg.role == 'assistant') {
history[orgI].content.filter((c: any) => c.type =='tool_use').forEach((c: any) => { msg.content.filter((c: any) => c.type == 'tool_use').forEach((c: any) => {
i++; merged.push({role: 'tool', id: c.id, name: c.name, args: c.input});
history.splice(i, 0, {role: 'tool', id: c.id, name: c.name, args: c.input});
}); });
} else if(history[orgI].role == 'user') { } else if(msg.role == 'user') {
history[orgI].content.filter((c: any) => c.type =='tool_result').forEach((c: any) => { msg.content.filter((c: any) => c.type == 'tool_result').forEach((c: any) => {
const h = history.find((h: any) => h.id == c.tool_use_id); const h = merged.find((h: any) => h.id == c.tool_use_id);
h[c.is_error ? 'error' : 'content'] = c.content; if(h) h[c.is_error ? 'error' : 'content'] = c.content;
}); });
} }
history[orgI].content = history[orgI].content.filter((c: any) => c.type == 'text').map((c: any) => c.text).join('\n\n'); msg.content = msg.content.filter((c: any) => c.type == 'text').map((c: any) => c.text).join('\n\n');
}
if(msg.content) {
const last = merged.at(-1);
if(last && last.role == 'assistant' && msg.role == 'assistant') last.content += '\n\n' + msg.content;
else merged.push({role: msg.role, content: msg.content});
} }
} }
return history.filter(h => !!h.content); return merged;
} }
private fromStandard(history: LLMMessage[]): any[] { private fromStandard(history: LLMMessage[]): any[] {
@@ -71,13 +76,15 @@ export class Anthropic extends LLMProvider {
stream: !!options.stream, stream: !!options.stream,
}; };
// Run tool changes
let resp: any; let resp: any;
let isFirstMessage = true;
do { do {
resp = await this.client.messages.create(requestParams); resp = await this.client.messages.create(requestParams);
// Streaming mode
if(options.stream) { if(options.stream) {
if(!isFirstMessage) options.stream({text: '\n\n'});
isFirstMessage = false;
resp.content = []; resp.content = [];
for await (const chunk of resp) { for await (const chunk of resp) {
if(controller.signal.aborted) break; if(controller.signal.aborted) break;
@@ -104,7 +111,6 @@ export class Anthropic extends LLMProvider {
} }
} }
// Run tools
const toolCalls = resp.content.filter((c: any) => c.type === 'tool_use'); const toolCalls = resp.content.filter((c: any) => c.type === 'tool_use');
if(toolCalls.length && !controller.signal.aborted) { if(toolCalls.length && !controller.signal.aborted) {
history.push({role: 'assistant', content: resp.content}); history.push({role: 'assistant', content: resp.content});
@@ -122,12 +128,14 @@ export class Anthropic extends LLMProvider {
requestParams.messages = history; requestParams.messages = history;
} }
} while (!controller.signal.aborted && resp.content.some((c: any) => c.type === 'tool_use')); } while (!controller.signal.aborted && resp.content.some((c: any) => c.type === 'tool_use'));
if(options.stream) options.stream({done: true}); if(options.stream) options.stream({done: true});
res(this.toStandard([...history, { res(this.toStandard([...history, {
role: 'assistant', role: 'assistant',
content: resp.content.filter((c: any) => c.type == 'text').map((c: any) => c.text).join('\n\n') content: resp.content.filter((c: any) => c.type == 'text').map((c: any) => c.text).join('\n\n')
}])); }]));
}); });
return Object.assign(response, {abort: () => controller.abort()}); return Object.assign(response, {abort: () => controller.abort()});
} }
} }