/** * example_embeddings.js * * Drop-in ES module for browser use. Exports: * loadModelCached(url?) — load and cache model in IndexedDB * embed(session, source) — get 768-dim Float32Array from any image source * cosineSimilarity(a, b) — similarity score in [-1, 1] * l2Normalize(v) — normalize so dot product equals cosine similarity * findMostSimilar(q, list) — nearest-neighbor in an embedding array * * Requirements: onnxruntime-web (npm install onnxruntime-web) * * Usage: * import { loadModelCached, embed, cosineSimilarity } from "./example_embeddings.js"; * const session = await loadModelCached(); * const emb = await embed(session, document.getElementById("myImage")); */ import * as ort from "onnxruntime-web"; // ── Config ───────────────────────────────────────────────────────────────── ort.env.wasm.wasmPaths = "https://cdn.jsdelivr.net/npm/onnxruntime-web/dist/"; const MODEL_URL = "https://huggingface.co/barakplasma/sapiens2-onnx/resolve/main/sapiens2_0.1b_int8.onnx"; const H = 1024; const W = 768; const MEAN = [0.485, 0.456, 0.406]; const STD = [0.229, 0.224, 0.225]; const DB_NAME = "sapiens2-onnx"; const DB_STORE = "models"; // ── IndexedDB helpers ────────────────────────────────────────────────────── function openDB() { return new Promise((resolve, reject) => { const req = indexedDB.open(DB_NAME, 1); req.onupgradeneeded = () => req.result.createObjectStore(DB_STORE); req.onsuccess = () => resolve(req.result); req.onerror = () => reject(req.error); }); } function idbGet(db, key) { return new Promise(resolve => { const req = db.transaction(DB_STORE).objectStore(DB_STORE).get(key); req.onsuccess = () => resolve(req.result ?? null); req.onerror = () => resolve(null); }); } function idbPut(db, key, value) { return new Promise((resolve, reject) => { const req = db.transaction(DB_STORE, "readwrite").objectStore(DB_STORE).put(value, key); req.onsuccess = () => resolve(); req.onerror = () => reject(req.error); }); } // ── Public API ───────────────────────────────────────────────────────────── /** * Load the ONNX model. On first call, fetches from HuggingFace and stores the * ArrayBuffer in IndexedDB. Subsequent calls load from cache instantly. * * @param {string} [url] Override the default model URL. * @returns {Promise} */ export async function loadModelCached(url = MODEL_URL) { const db = await openDB(); const cached = await idbGet(db, url); const buf = cached ?? await fetch(url) .then(r => { if (!r.ok) throw new Error(`Failed to fetch model: ${r.status} ${r.statusText}`); return r.arrayBuffer(); }) .then(async buf => { await idbPut(db, url, buf); return buf; }); return ort.InferenceSession.create(buf, { executionProviders: ["webgpu", "wasm"], graphOptimizationLevel: "all", }); } /** * Convert an image source to a float32 NCHW tensor with ImageNet normalization. * Accepts anything drawImage() accepts: ,