Spaces:

darkfire514
/

OpenClawBot

Paused

App Files Files Community

OpenClawBot / test /media-understanding.auto.e2e.test.ts

darkfire514

Upload 321 files

9f069df verified 3 months ago

raw

history blame contribute delete

5.29 kB

	import fs from "node:fs/promises";
	import os from "node:os";
	import path from "node:path";
	import { afterEach, describe, expect, it, vi } from "vitest";
	import type { MsgContext } from "../src/auto-reply/templating.js";
	import type { OpenClawConfig } from "../src/config/config.js";

	const makeTempDir = async (prefix: string) => await fs.mkdtemp(path.join(os.tmpdir(), prefix));

	const writeExecutable = async (dir: string, name: string, content: string) => {
	const filePath = path.join(dir, name);
	await fs.writeFile(filePath, content, { mode: 0o755 });
	return filePath;
	};

	const makeTempMedia = async (ext: string) => {
	const dir = await makeTempDir("openclaw-media-e2e-");
	const filePath = path.join(dir, `sample${ext}`);
	await fs.writeFile(filePath, "audio");
	return { dir, filePath };
	};

	const loadApply = async () => {
	vi.resetModules();
	return await import("../src/media-understanding/apply.js");
	};

	const envSnapshot = () => ({
	PATH: process.env.PATH,
	SHERPA_ONNX_MODEL_DIR: process.env.SHERPA_ONNX_MODEL_DIR,
	WHISPER_CPP_MODEL: process.env.WHISPER_CPP_MODEL,
	});

	const restoreEnv = (snapshot: ReturnType<typeof envSnapshot>) => {
	process.env.PATH = snapshot.PATH;
	process.env.SHERPA_ONNX_MODEL_DIR = snapshot.SHERPA_ONNX_MODEL_DIR;
	process.env.WHISPER_CPP_MODEL = snapshot.WHISPER_CPP_MODEL;
	};

	describe("media understanding auto-detect (e2e)", () => {
	let tempPaths: string[] = [];

	afterEach(async () => {
	for (const p of tempPaths) {
	await fs.rm(p, { recursive: true, force: true }).catch(() => {});
	}
	tempPaths = [];
	});

	it("uses sherpa-onnx-offline when available", async () => {
	const snapshot = envSnapshot();
	try {
	const binDir = await makeTempDir("openclaw-bin-sherpa-");
	const modelDir = await makeTempDir("openclaw-sherpa-model-");
	tempPaths.push(binDir, modelDir);

	await fs.writeFile(path.join(modelDir, "tokens.txt"), "a");
	await fs.writeFile(path.join(modelDir, "encoder.onnx"), "a");
	await fs.writeFile(path.join(modelDir, "decoder.onnx"), "a");
	await fs.writeFile(path.join(modelDir, "joiner.onnx"), "a");

	await writeExecutable(
	binDir,
	"sherpa-onnx-offline",
	`#!/usr/bin/env bash\necho "{\\"text\\":\\"sherpa ok\\"}"\n`,
	);

	process.env.PATH = `${binDir}:/usr/bin:/bin`;
	process.env.SHERPA_ONNX_MODEL_DIR = modelDir;

	const { filePath } = await makeTempMedia(".wav");
	tempPaths.push(path.dirname(filePath));

	const { applyMediaUnderstanding } = await loadApply();
	const ctx: MsgContext = {
	Body: "<media:audio>",
	MediaPath: filePath,
	MediaType: "audio/wav",
	};
	const cfg: OpenClawConfig = { tools: { media: { audio: {} } } };

	await applyMediaUnderstanding({ ctx, cfg });

	expect(ctx.Transcript).toBe("sherpa ok");
	} finally {
	restoreEnv(snapshot);
	}
	});

	it("uses whisper-cli when sherpa is missing", async () => {
	const snapshot = envSnapshot();
	try {
	const binDir = await makeTempDir("openclaw-bin-whispercpp-");
	const modelDir = await makeTempDir("openclaw-whispercpp-model-");
	tempPaths.push(binDir, modelDir);

	const modelPath = path.join(modelDir, "tiny.bin");
	await fs.writeFile(modelPath, "model");

	await writeExecutable(
	binDir,
	"whisper-cli",
	"#!/usr/bin/env bash\n" +
	'out=""\n' +
	'prev=""\n' +
	'for arg in "$@"; do\n' +
	' if [ "$prev" = "-of" ]; then out="$arg"; break; fi\n' +
	' prev="$arg"\n' +
	"done\n" +
	'if [ -n "$out" ]; then echo \'whisper cpp ok\' > "${out}.txt"; fi\n',
	);

	process.env.PATH = `${binDir}:/usr/bin:/bin`;
	process.env.WHISPER_CPP_MODEL = modelPath;

	const { filePath } = await makeTempMedia(".wav");
	tempPaths.push(path.dirname(filePath));

	const { applyMediaUnderstanding } = await loadApply();
	const ctx: MsgContext = {
	Body: "<media:audio>",
	MediaPath: filePath,
	MediaType: "audio/wav",
	};
	const cfg: OpenClawConfig = { tools: { media: { audio: {} } } };

	await applyMediaUnderstanding({ ctx, cfg });

	expect(ctx.Transcript).toBe("whisper cpp ok");
	} finally {
	restoreEnv(snapshot);
	}
	});

	it("uses gemini CLI for images when available", async () => {
	const snapshot = envSnapshot();
	try {
	const binDir = await makeTempDir("openclaw-bin-gemini-");
	tempPaths.push(binDir);

	await writeExecutable(
	binDir,
	"gemini",
	`#!/usr/bin/env bash\necho '{\\"response\\":\\"gemini ok\\"' + "}'\n`,
	);

	process.env.PATH = `${binDir}:/usr/bin:/bin`;

	const { filePath } = await makeTempMedia(".png");
	tempPaths.push(path.dirname(filePath));

	const { applyMediaUnderstanding } = await loadApply();
	const ctx: MsgContext = {
	Body: "<media:image>",
	MediaPath: filePath,
	MediaType: "image/png",
	};
	const cfg: OpenClawConfig = { tools: { media: { image: {} } } };

	await applyMediaUnderstanding({ ctx, cfg });

	expect(ctx.Body).toContain("gemini ok");
	} finally {
	restoreEnv(snapshot);
	}
	});
	});