Compare commits

...

4 Commits

Author SHA1 Message Date
0360f2493d Added hugging face token
All checks were successful
Publish Library / Build NPM Project (push) Successful in 31s
Publish Library / Tag Version (push) Successful in 5s
2026-02-12 22:15:57 -05:00
0172887877 audio worker fix
All checks were successful
Publish Library / Build NPM Project (push) Successful in 28s
Publish Library / Tag Version (push) Successful in 5s
2026-02-12 20:24:12 -05:00
8f89f5e3cf embedding worker fix
All checks were successful
Publish Library / Build NPM Project (push) Successful in 28s
Publish Library / Tag Version (push) Successful in 5s
2026-02-12 20:18:56 -05:00
5bd41f8c6a worker fix?
All checks were successful
Publish Library / Build NPM Project (push) Successful in 29s
Publish Library / Tag Version (push) Successful in 5s
2026-02-12 20:17:31 -05:00
6 changed files with 17 additions and 12 deletions

View File

@@ -1,6 +1,6 @@
{
"name": "@ztimson/ai-utils",
"version": "0.6.7",
"version": "0.6.10",
"description": "AI Utility library",
"author": "Zak Timson",
"license": "MIT",

View File

@@ -8,6 +8,8 @@ export type AbortablePromise<T> = Promise<T> & {
};
export type AiOptions = {
/** Token to pull models from hugging face */
hfToken?: string;
/** Path to models */
path?: string;
/** ASR model: whisper-tiny, whisper-base */

View File

@@ -14,14 +14,15 @@ export async function canDiarization(): Promise<boolean> {
});
}
async function runDiarization(audioPath: string, torchHome: string): Promise<any[]> {
async function runDiarization(audioPath: string, dir: string, token: string): Promise<any[]> {
const script = `
import sys
import json
import os
from pyannote.audio import Pipeline
os.environ['TORCH_HOME'] = "${torchHome}"
os.environ['TORCH_HOME'] = "${dir}"
os.environ['HF_TOKEN'] = "${token}"
pipeline = Pipeline.from_pretrained("pyannote/speaker-diarization-3.1")
diarization = pipeline(sys.argv[1])
@@ -82,8 +83,9 @@ function combineSpeakerTranscript(chunks: any[], speakers: any[]): string {
return lines.join('\n');
}
parentPort?.on('message', async ({ file, speaker, model, modelDir }) => {
parentPort?.on('message', async ({ file, speaker, model, modelDir, token }) => {
try {
console.log('worker', file);
if(!whisperPipeline) whisperPipeline = await pipeline('automatic-speech-recognition', `Xenova/${model}`, {cache_dir: modelDir, quantized: true});
// Prepare audio file (convert to mono channel wave)
@@ -110,12 +112,12 @@ parentPort?.on('message', async ({ file, speaker, model, modelDir }) => {
// Speaker Diarization
const hasDiarization = await canDiarization();
if(!hasDiarization) {
if(!token || !hasDiarization) {
parentPort?.postMessage({ text: transcriptResult.text?.trim() || null, error: 'Speaker diarization unavailable' });
return;
}
const speakers = await runDiarization(file, modelDir);
const speakers = await runDiarization(file, modelDir, token);
const combined = combineSpeakerTranscript(transcriptResult.chunks || [], speakers);
parentPort?.postMessage({ text: combined });
} catch (err) {

View File

@@ -1,7 +1,8 @@
import {fileURLToPath} from 'url';
import {Worker} from 'worker_threads';
import Path from 'node:path';
import {AbortablePromise, Ai} from './ai.ts';
import {canDiarization} from './asr.ts';
import {dirname, join} from 'path';
export class Audio {
constructor(private ai: Ai) {}
@@ -12,7 +13,7 @@ export class Audio {
const abort = () => { aborted = true; };
const p = new Promise<string | null>((resolve, reject) => {
const worker = new Worker(Path.join(import.meta.dirname, 'asr.js'));
const worker = new Worker(join(dirname(fileURLToPath(import.meta.url)), 'asr.js'));
const handleMessage = ({ text, warning, error }: any) => {
worker.terminate();
if(aborted) return;
@@ -31,7 +32,7 @@ export class Audio {
worker.on('exit', (code) => {
if(code !== 0 && !aborted) reject(new Error(`Worker exited with code ${code}`));
});
worker.postMessage({file, model, speaker, modelDir: this.ai.options.path});
worker.postMessage({file, model, speaker, modelDir: this.ai.options.path, token: this.ai.options.hfToken});
});
return Object.assign(p, { abort });
}

View File

@@ -3,9 +3,9 @@ import { parentPort } from 'worker_threads';
let embedder: any;
parentPort?.on('message', async ({ id, text, model, modelDir }) => {
parentPort?.on('message', async ({text, model, modelDir }) => {
if(!embedder) embedder = await pipeline('feature-extraction', 'Xenova/' + model, {quantized: true, cache_dir: modelDir});
const output = await embedder(text, { pooling: 'mean', normalize: true });
const embedding = Array.from(output.data);
parentPort?.postMessage({ id, embedding });
parentPort?.postMessage({embedding});
});

View File

@@ -271,7 +271,7 @@ class LLM {
worker.on('exit', (code) => {
if(code !== 0) reject(new Error(`Worker exited with code ${code}`));
});
worker.postMessage({text, model: this.ai.options?.embedder || 'bge-small-en-v1.5', path: this.ai.options.path});
worker.postMessage({text, model: this.ai.options?.embedder || 'bge-small-en-v1.5', modelDir: this.ai.options.path});
});
};
const chunks = this.chunk(target, maxTokens, overlapTokens);