Spaces:
Paused
Paused
| import { describe, expect, it } from "vitest"; | |
| import { buildInboundMediaNote } from "./media-note.js"; | |
| describe("buildInboundMediaNote", () => { | |
| it("formats single MediaPath as a media note", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPath: "/tmp/a.png", | |
| MediaType: "image/png", | |
| MediaUrl: "/tmp/a.png", | |
| }); | |
| expect(note).toBe("[media attached: /tmp/a.png (image/png) | /tmp/a.png]"); | |
| }); | |
| it("formats multiple MediaPaths as numbered media notes", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/a.png", "/tmp/b.png", "/tmp/c.png"], | |
| MediaUrls: ["/tmp/a.png", "/tmp/b.png", "/tmp/c.png"], | |
| }); | |
| expect(note).toBe( | |
| [ | |
| "[media attached: 3 files]", | |
| "[media attached 1/3: /tmp/a.png | /tmp/a.png]", | |
| "[media attached 2/3: /tmp/b.png | /tmp/b.png]", | |
| "[media attached 3/3: /tmp/c.png | /tmp/c.png]", | |
| ].join("\n"), | |
| ); | |
| }); | |
| it("skips media notes for attachments with understanding output", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/a.png", "/tmp/b.png"], | |
| MediaUrls: ["https://example.com/a.png", "https://example.com/b.png"], | |
| MediaUnderstanding: [ | |
| { | |
| kind: "audio.transcription", | |
| attachmentIndex: 0, | |
| text: "hello", | |
| provider: "groq", | |
| }, | |
| ], | |
| }); | |
| expect(note).toBe("[media attached: /tmp/b.png | https://example.com/b.png]"); | |
| }); | |
| it("only suppresses attachments when media understanding succeeded", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/a.png", "/tmp/b.png"], | |
| MediaUrls: ["https://example.com/a.png", "https://example.com/b.png"], | |
| MediaUnderstandingDecisions: [ | |
| { | |
| capability: "image", | |
| outcome: "skipped", | |
| attachments: [ | |
| { | |
| attachmentIndex: 0, | |
| attempts: [ | |
| { | |
| type: "provider", | |
| outcome: "skipped", | |
| reason: "maxBytes: too large", | |
| }, | |
| ], | |
| }, | |
| ], | |
| }, | |
| ], | |
| }); | |
| expect(note).toBe( | |
| [ | |
| "[media attached: 2 files]", | |
| "[media attached 1/2: /tmp/a.png | https://example.com/a.png]", | |
| "[media attached 2/2: /tmp/b.png | https://example.com/b.png]", | |
| ].join("\n"), | |
| ); | |
| }); | |
| it("suppresses attachments when media understanding succeeds via decisions", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/a.png", "/tmp/b.png"], | |
| MediaUrls: ["https://example.com/a.png", "https://example.com/b.png"], | |
| MediaUnderstandingDecisions: [ | |
| { | |
| capability: "image", | |
| outcome: "success", | |
| attachments: [ | |
| { | |
| attachmentIndex: 0, | |
| attempts: [ | |
| { | |
| type: "provider", | |
| outcome: "success", | |
| provider: "openai", | |
| model: "gpt-5.2", | |
| }, | |
| ], | |
| chosen: { | |
| type: "provider", | |
| outcome: "success", | |
| provider: "openai", | |
| model: "gpt-5.2", | |
| }, | |
| }, | |
| ], | |
| }, | |
| ], | |
| }); | |
| expect(note).toBe("[media attached: /tmp/b.png | https://example.com/b.png]"); | |
| }); | |
| it("strips audio attachments when transcription succeeded via MediaUnderstanding (issue #4197)", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/voice.ogg", "/tmp/image.png"], | |
| MediaUrls: ["https://example.com/voice.ogg", "https://example.com/image.png"], | |
| MediaTypes: ["audio/ogg", "image/png"], | |
| MediaUnderstanding: [ | |
| { | |
| kind: "audio.transcription", | |
| attachmentIndex: 0, | |
| text: "Hello world", | |
| provider: "whisper", | |
| }, | |
| ], | |
| }); | |
| // Audio attachment should be stripped (already transcribed), image should remain | |
| expect(note).toBe( | |
| "[media attached: /tmp/image.png (image/png) | https://example.com/image.png]", | |
| ); | |
| }); | |
| it("only strips audio attachments that were transcribed", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/voice-1.ogg", "/tmp/voice-2.ogg"], | |
| MediaUrls: ["https://example.com/voice-1.ogg", "https://example.com/voice-2.ogg"], | |
| MediaTypes: ["audio/ogg", "audio/ogg"], | |
| MediaUnderstanding: [ | |
| { | |
| kind: "audio.transcription", | |
| attachmentIndex: 0, | |
| text: "First transcript", | |
| provider: "whisper", | |
| }, | |
| ], | |
| }); | |
| expect(note).toBe( | |
| "[media attached: /tmp/voice-2.ogg (audio/ogg) | https://example.com/voice-2.ogg]", | |
| ); | |
| }); | |
| it("strips audio attachments when Transcript is present (issue #4197)", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/voice.opus"], | |
| MediaTypes: ["audio/opus"], | |
| Transcript: "Hello world from Whisper", | |
| }); | |
| // Audio should be stripped when transcript is available | |
| expect(note).toBeUndefined(); | |
| }); | |
| it("does not strip multiple audio attachments using transcript-only fallback", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/voice-1.ogg", "/tmp/voice-2.ogg"], | |
| MediaTypes: ["audio/ogg", "audio/ogg"], | |
| Transcript: "Transcript text without per-attachment mapping", | |
| }); | |
| expect(note).toBe( | |
| [ | |
| "[media attached: 2 files]", | |
| "[media attached 1/2: /tmp/voice-1.ogg (audio/ogg)]", | |
| "[media attached 2/2: /tmp/voice-2.ogg (audio/ogg)]", | |
| ].join("\n"), | |
| ); | |
| }); | |
| it("strips audio by extension even without mime type (issue #4197)", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/voice_message.ogg", "/tmp/document.pdf"], | |
| MediaUnderstanding: [ | |
| { | |
| kind: "audio.transcription", | |
| attachmentIndex: 0, | |
| text: "Transcribed audio content", | |
| provider: "whisper", | |
| }, | |
| ], | |
| }); | |
| // Only PDF should remain, audio stripped by extension | |
| expect(note).toBe("[media attached: /tmp/document.pdf]"); | |
| }); | |
| it("keeps audio attachments when no transcription available", () => { | |
| const note = buildInboundMediaNote({ | |
| MediaPaths: ["/tmp/voice.ogg"], | |
| MediaTypes: ["audio/ogg"], | |
| }); | |
| // No transcription = keep audio attachment as fallback | |
| expect(note).toBe("[media attached: /tmp/voice.ogg (audio/ogg)]"); | |
| }); | |
| }); | |