mirror of
https://github.com/openclaw/openclaw.git
synced 2026-03-13 19:10:39 +00:00
180 lines
6.0 KiB
TypeScript
180 lines
6.0 KiB
TypeScript
import { describe, expect, it } from "vitest";
|
|
import { buildInboundMediaNote } from "./media-note.js";
|
|
import { createSuccessfulImageMediaDecision } from "./media-understanding.test-fixtures.js";
|
|
|
|
describe("buildInboundMediaNote", () => {
|
|
it("formats single MediaPath as a media note", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPath: "/tmp/a.png",
|
|
MediaType: "image/png",
|
|
MediaUrl: "/tmp/a.png",
|
|
});
|
|
expect(note).toBe("[media attached: /tmp/a.png (image/png) | /tmp/a.png]");
|
|
});
|
|
|
|
it("formats multiple MediaPaths as numbered media notes", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/a.png", "/tmp/b.png", "/tmp/c.png"],
|
|
MediaUrls: ["/tmp/a.png", "/tmp/b.png", "/tmp/c.png"],
|
|
});
|
|
expect(note).toBe(
|
|
[
|
|
"[media attached: 3 files]",
|
|
"[media attached 1/3: /tmp/a.png | /tmp/a.png]",
|
|
"[media attached 2/3: /tmp/b.png | /tmp/b.png]",
|
|
"[media attached 3/3: /tmp/c.png | /tmp/c.png]",
|
|
].join("\n"),
|
|
);
|
|
});
|
|
|
|
it("skips media notes for attachments with understanding output", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/a.png", "/tmp/b.png"],
|
|
MediaUrls: ["https://example.com/a.png", "https://example.com/b.png"],
|
|
MediaUnderstanding: [
|
|
{
|
|
kind: "audio.transcription",
|
|
attachmentIndex: 0,
|
|
text: "hello",
|
|
provider: "groq",
|
|
},
|
|
],
|
|
});
|
|
expect(note).toBe("[media attached: /tmp/b.png | https://example.com/b.png]");
|
|
});
|
|
|
|
it("only suppresses attachments when media understanding succeeded", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/a.png", "/tmp/b.png"],
|
|
MediaUrls: ["https://example.com/a.png", "https://example.com/b.png"],
|
|
MediaUnderstandingDecisions: [
|
|
{
|
|
capability: "image",
|
|
outcome: "skipped",
|
|
attachments: [
|
|
{
|
|
attachmentIndex: 0,
|
|
attempts: [
|
|
{
|
|
type: "provider",
|
|
outcome: "skipped",
|
|
reason: "maxBytes: too large",
|
|
},
|
|
],
|
|
},
|
|
],
|
|
},
|
|
],
|
|
});
|
|
expect(note).toBe(
|
|
[
|
|
"[media attached: 2 files]",
|
|
"[media attached 1/2: /tmp/a.png | https://example.com/a.png]",
|
|
"[media attached 2/2: /tmp/b.png | https://example.com/b.png]",
|
|
].join("\n"),
|
|
);
|
|
});
|
|
|
|
it("suppresses attachments when media understanding succeeds via decisions", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/a.png", "/tmp/b.png"],
|
|
MediaUrls: ["https://example.com/a.png", "https://example.com/b.png"],
|
|
MediaUnderstandingDecisions: [
|
|
createSuccessfulImageMediaDecision() as unknown as NonNullable<
|
|
Parameters<typeof buildInboundMediaNote>[0]["MediaUnderstandingDecisions"]
|
|
>[number],
|
|
],
|
|
});
|
|
expect(note).toBe("[media attached: /tmp/b.png | https://example.com/b.png]");
|
|
});
|
|
|
|
it("strips audio attachments when transcription succeeded via MediaUnderstanding (issue #4197)", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/voice.ogg", "/tmp/image.png"],
|
|
MediaUrls: ["https://example.com/voice.ogg", "https://example.com/image.png"],
|
|
MediaTypes: ["audio/ogg", "image/png"],
|
|
MediaUnderstanding: [
|
|
{
|
|
kind: "audio.transcription",
|
|
attachmentIndex: 0,
|
|
text: "Hello world",
|
|
provider: "whisper",
|
|
},
|
|
],
|
|
});
|
|
// Audio attachment should be stripped (already transcribed), image should remain
|
|
expect(note).toBe(
|
|
"[media attached: /tmp/image.png (image/png) | https://example.com/image.png]",
|
|
);
|
|
});
|
|
|
|
it("only strips audio attachments that were transcribed", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/voice-1.ogg", "/tmp/voice-2.ogg"],
|
|
MediaUrls: ["https://example.com/voice-1.ogg", "https://example.com/voice-2.ogg"],
|
|
MediaTypes: ["audio/ogg", "audio/ogg"],
|
|
MediaUnderstanding: [
|
|
{
|
|
kind: "audio.transcription",
|
|
attachmentIndex: 0,
|
|
text: "First transcript",
|
|
provider: "whisper",
|
|
},
|
|
],
|
|
});
|
|
expect(note).toBe(
|
|
"[media attached: /tmp/voice-2.ogg (audio/ogg) | https://example.com/voice-2.ogg]",
|
|
);
|
|
});
|
|
|
|
it("strips audio attachments when Transcript is present (issue #4197)", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/voice.opus"],
|
|
MediaTypes: ["audio/opus"],
|
|
Transcript: "Hello world from Whisper",
|
|
});
|
|
// Audio should be stripped when transcript is available
|
|
expect(note).toBeUndefined();
|
|
});
|
|
|
|
it("does not strip multiple audio attachments using transcript-only fallback", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/voice-1.ogg", "/tmp/voice-2.ogg"],
|
|
MediaTypes: ["audio/ogg", "audio/ogg"],
|
|
Transcript: "Transcript text without per-attachment mapping",
|
|
});
|
|
expect(note).toBe(
|
|
[
|
|
"[media attached: 2 files]",
|
|
"[media attached 1/2: /tmp/voice-1.ogg (audio/ogg)]",
|
|
"[media attached 2/2: /tmp/voice-2.ogg (audio/ogg)]",
|
|
].join("\n"),
|
|
);
|
|
});
|
|
|
|
it("strips audio by extension even without mime type (issue #4197)", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/voice_message.ogg", "/tmp/document.pdf"],
|
|
MediaUnderstanding: [
|
|
{
|
|
kind: "audio.transcription",
|
|
attachmentIndex: 0,
|
|
text: "Transcribed audio content",
|
|
provider: "whisper",
|
|
},
|
|
],
|
|
});
|
|
// Only PDF should remain, audio stripped by extension
|
|
expect(note).toBe("[media attached: /tmp/document.pdf]");
|
|
});
|
|
|
|
it("keeps audio attachments when no transcription available", () => {
|
|
const note = buildInboundMediaNote({
|
|
MediaPaths: ["/tmp/voice.ogg"],
|
|
MediaTypes: ["audio/ogg"],
|
|
});
|
|
// No transcription = keep audio attachment as fallback
|
|
expect(note).toBe("[media attached: /tmp/voice.ogg (audio/ogg)]");
|
|
});
|
|
});
|