refactor(media): centralize voice compatibility policy

2026-02-14 03:17:02 +01:00
parent 03fee3c605
commit 6ebf503fa8
6 changed files with 62 additions and 40 deletions
--- a/extensions/matrix/src/matrix/send/formatting.ts
+++ b/extensions/matrix/src/matrix/send/formatting.ts
@@ -77,13 +77,17 @@ export function resolveMatrixVoiceDecision(opts: {
  if (!opts.wantsVoice) {
    return { useVoice: false };
  }
-  if (
-    getCore().media.isVoiceCompatibleAudio({
-      contentType: opts.contentType,
-      fileName: opts.fileName,
-    })
-  ) {
+  if (isMatrixVoiceCompatibleAudio(opts)) {
    return { useVoice: true };
  }
  return { useVoice: false };
 }
+
+function isMatrixVoiceCompatibleAudio(opts: { contentType?: string; fileName?: string }): boolean {
+  // Matrix currently shares the core voice compatibility policy.
+  // Keep this wrapper as the seam if Matrix policy diverges later.
+  return getCore().media.isVoiceCompatibleAudio({
+    contentType: opts.contentType,
+    fileName: opts.fileName,
+  });
+}
--- a/src/media/audio.test.ts
+++ b/src/media/audio.test.ts
@@ -1,22 +1,20 @@
 import { describe, expect, it } from "vitest";
-import { isVoiceCompatibleAudio } from "./audio.js";
+import {
+  isVoiceCompatibleAudio,
+  TELEGRAM_VOICE_AUDIO_EXTENSIONS,
+  TELEGRAM_VOICE_MIME_TYPES,
+} from "./audio.js";

 describe("isVoiceCompatibleAudio", () => {
  it.each([
-    { contentType: "audio/ogg", fileName: null },
-    { contentType: "audio/opus", fileName: null },
+    ...Array.from(TELEGRAM_VOICE_MIME_TYPES, (contentType) => ({ contentType, fileName: null })),
    { contentType: "audio/ogg; codecs=opus", fileName: null },
-    { contentType: "audio/mpeg", fileName: null },
-    { contentType: "audio/mp3", fileName: null },
-    { contentType: "audio/mp4", fileName: null },
    { contentType: "audio/mp4; codecs=mp4a.40.2", fileName: null },
-    { contentType: "audio/x-m4a", fileName: null },
-    { contentType: "audio/m4a", fileName: null },
  ])("returns true for MIME type $contentType", (opts) => {
    expect(isVoiceCompatibleAudio(opts)).toBe(true);
  });

-  it.each([".ogg", ".oga", ".opus", ".mp3", ".m4a"])("returns true for extension %s", (ext) => {
+  it.each(Array.from(TELEGRAM_VOICE_AUDIO_EXTENSIONS))("returns true for extension %s", (ext) => {
    expect(isVoiceCompatibleAudio({ fileName: `voice${ext}` })).toBe(true);
  });

--- a/src/media/audio.ts
+++ b/src/media/audio.ts
@@ -1,13 +1,13 @@
-import { getFileExtension } from "./mime.js";
+import { getFileExtension, normalizeMimeType } from "./mime.js";

-const VOICE_AUDIO_EXTENSIONS = new Set([".oga", ".ogg", ".opus", ".mp3", ".m4a"]);
+export const TELEGRAM_VOICE_AUDIO_EXTENSIONS = new Set([".oga", ".ogg", ".opus", ".mp3", ".m4a"]);

 /**
 * MIME types compatible with voice messages.
 * Telegram sendVoice supports OGG/Opus, MP3, and M4A.
 * https://core.telegram.org/bots/api#sendvoice
 */
-const VOICE_MIME_TYPES = new Set([
+export const TELEGRAM_VOICE_MIME_TYPES = new Set([
  "audio/ogg",
  "audio/opus",
  "audio/mpeg",
@@ -17,16 +17,13 @@ const VOICE_MIME_TYPES = new Set([
  "audio/m4a",
 ]);

-export function isVoiceCompatibleAudio(opts: {
+export function isTelegramVoiceCompatibleAudio(opts: {
  contentType?: string | null;
  fileName?: string | null;
 }): boolean {
-  const mime = opts.contentType?.toLowerCase().trim();
-  if (mime) {
-    const baseMime = mime.split(";")[0].trim();
-    if (VOICE_MIME_TYPES.has(baseMime)) {
-      return true;
-    }
+  const mime = normalizeMimeType(opts.contentType);
+  if (mime && TELEGRAM_VOICE_MIME_TYPES.has(mime)) {
+    return true;
  }
  const fileName = opts.fileName?.trim();
  if (!fileName) {
@@ -36,5 +33,16 @@ export function isVoiceCompatibleAudio(opts: {
  if (!ext) {
    return false;
  }
-  return VOICE_AUDIO_EXTENSIONS.has(ext);
+  return TELEGRAM_VOICE_AUDIO_EXTENSIONS.has(ext);
+}
+
+/**
+ * Backward-compatible alias used across plugin/runtime call sites.
+ * Keeps existing behavior while making Telegram-specific policy explicit.
+ */
+export function isVoiceCompatibleAudio(opts: {
+  contentType?: string | null;
+  fileName?: string | null;
+}): boolean {
+  return isTelegramVoiceCompatibleAudio(opts);
 }
--- a/src/media/mime.test.ts
+++ b/src/media/mime.test.ts
@@ -1,6 +1,12 @@
 import JSZip from "jszip";
 import { describe, expect, it } from "vitest";
-import { detectMime, extensionForMime, imageMimeFromFormat, isAudioFileName } from "./mime.js";
+import {
+  detectMime,
+  extensionForMime,
+  imageMimeFromFormat,
+  isAudioFileName,
+  normalizeMimeType,
+} from "./mime.js";

 async function makeOoxmlZip(opts: { mainMime: string; partPath: string }): Promise<Buffer> {
  const zip = new JSZip();
@@ -110,3 +116,15 @@ describe("isAudioFileName", () => {
    }
  });
 });
+
+describe("normalizeMimeType", () => {
+  it("normalizes case and strips parameters", () => {
+    expect(normalizeMimeType("Audio/MP4; codecs=mp4a.40.2")).toBe("audio/mp4");
+  });
+
+  it("returns undefined for empty input", () => {
+    expect(normalizeMimeType("   ")).toBeUndefined();
+    expect(normalizeMimeType(null)).toBeUndefined();
+    expect(normalizeMimeType(undefined)).toBeUndefined();
+  });
+});
--- a/src/media/mime.ts
+++ b/src/media/mime.ts
@@ -52,7 +52,7 @@ const AUDIO_FILE_EXTENSIONS = new Set([
  ".wav",
 ]);

-function normalizeHeaderMime(mime?: string | null): string | undefined {
+export function normalizeMimeType(mime?: string | null): string | undefined {
  if (!mime) {
    return undefined;
  }
@@ -120,7 +120,7 @@ async function detectMimeImpl(opts: {
  const ext = getFileExtension(opts.filePath);
  const extMime = ext ? MIME_BY_EXT[ext] : undefined;

-  const headerMime = normalizeHeaderMime(opts.headerMime);
+  const headerMime = normalizeMimeType(opts.headerMime);
  const sniffed = await sniffMime(opts.buffer);

  // Prefer sniffed types, but don't let generic container types override a more
@@ -145,10 +145,11 @@ async function detectMimeImpl(opts: {
 }

 export function extensionForMime(mime?: string | null): string | undefined {
-  if (!mime) {
+  const normalized = normalizeMimeType(mime);
+  if (!normalized) {
    return undefined;
  }
-  return EXT_BY_MIME[mime.toLowerCase()];
+  return EXT_BY_MIME[normalized];
 }

 export function isGifMedia(opts: {
--- a/src/telegram/voice.ts
+++ b/src/telegram/voice.ts
@@ -1,11 +1,4 @@
-import { isVoiceCompatibleAudio } from "../media/audio.js";
-
-export function isTelegramVoiceCompatible(opts: {
-  contentType?: string | null;
-  fileName?: string | null;
-}): boolean {
-  return isVoiceCompatibleAudio(opts);
-}
+import { isTelegramVoiceCompatibleAudio } from "../media/audio.js";

 export function resolveTelegramVoiceDecision(opts: {
  wantsVoice: boolean;
@@ -15,7 +8,7 @@ export function resolveTelegramVoiceDecision(opts: {
  if (!opts.wantsVoice) {
    return { useVoice: false };
  }
-  if (isTelegramVoiceCompatible(opts)) {
+  if (isTelegramVoiceCompatibleAudio(opts)) {
    return { useVoice: true };
  }
  const contentType = opts.contentType ?? "unknown";