Enable quantized embedder for speed boost

2026-02-11 20:28:14 -05:00
parent f2c66b0cb8
commit c8d5660b1a
2 changed files with 2 additions and 2 deletions
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
 	"name": "@ztimson/ai-utils",
-	"version": "0.5.2",
+	"version": "0.5.3",
 	"description": "AI Utility library",
 	"author": "Zak Timson",
 	"license": "MIT",
--- a/src/embedder.ts
+++ b/src/embedder.ts
@@ -4,7 +4,7 @@ import { parentPort } from 'worker_threads';
 let embedder: any;
 parentPort?.on('message', async ({ id, text, model }) => {
-	if(!embedder) embedder = await pipeline('feature-extraction', 'Xenova/' + model);
+	if(!embedder) embedder = await pipeline('feature-extraction', 'Xenova/' + model, {quantized: true});
 	const output = await embedder(text, { pooling: 'mean', normalize: true });
 	const embedding = Array.from(output.data);
 	parentPort?.postMessage({ id, embedding });