feat(telegram-tts): add /tts_limit command and auto-summarization

- Add /tts_limit command to configure max text length (default 1500) - Auto-summarize long texts with gpt-4o-mini before TTS conversion - Add truncation safeguard if summary exceeds hard limit - Validate targetLength parameter (100-10000) - Use conservative max_tokens for multilingual text - Add prompt injection defense with XML delimiters Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
2026-01-24 00:49:14 +00:00
parent df09e583aa
commit 4b24753be7
1 changed files with 153 additions and 2 deletions
--- a/extensions/telegram-tts/index.ts
+++ b/extensions/telegram-tts/index.ts
@@ -48,9 +48,12 @@ interface UserPreferences {
  tts?: {
    enabled?: boolean;
    provider?: "openai" | "elevenlabs";
+    maxLength?: number; // Max chars before summarizing (default 1500)
  };
 }

+const DEFAULT_TTS_MAX_LENGTH = 1500;
+
 interface TtsResult {
  success: boolean;
  audioPath?: string;
@@ -151,6 +154,91 @@ function setTtsProvider(prefsPath: string, provider: "openai" | "elevenlabs"): v
  writeFileSync(prefsPath, JSON.stringify(prefs, null, 2));
 }

+function getTtsMaxLength(prefsPath: string): number {
+  try {
+    if (!existsSync(prefsPath)) return DEFAULT_TTS_MAX_LENGTH;
+    const prefs: UserPreferences = JSON.parse(readFileSync(prefsPath, "utf8"));
+    return prefs?.tts?.maxLength ?? DEFAULT_TTS_MAX_LENGTH;
+  } catch {
+    return DEFAULT_TTS_MAX_LENGTH;
+  }
+}
+
+function setTtsMaxLength(prefsPath: string, maxLength: number): void {
+  let prefs: UserPreferences = {};
+  try {
+    if (existsSync(prefsPath)) {
+      prefs = JSON.parse(readFileSync(prefsPath, "utf8"));
+    }
+  } catch {
+    // ignore
+  }
+  prefs.tts = { ...prefs.tts, maxLength };
+  writeFileSync(prefsPath, JSON.stringify(prefs, null, 2));
+}
+
+// =============================================================================
+// Text Summarization (for long texts)
+// =============================================================================
+
+async function summarizeText(
+  text: string,
+  targetLength: number,
+  apiKey: string,
+  timeoutMs: number = 30000
+): Promise<string> {
+  // Validate targetLength
+  if (targetLength < 100 || targetLength > 10000) {
+    throw new Error(`Invalid targetLength: ${targetLength}`);
+  }
+
+  const controller = new AbortController();
+  const timeout = setTimeout(() => controller.abort(), timeoutMs);
+
+  try {
+    const response = await fetch("https://api.openai.com/v1/chat/completions", {
+      method: "POST",
+      headers: {
+        Authorization: `Bearer ${apiKey}`,
+        "Content-Type": "application/json",
+      },
+      body: JSON.stringify({
+        model: "gpt-4o-mini",
+        messages: [
+          {
+            role: "system",
+            content: `Você é um assistente que resume textos de forma concisa mantendo as informações mais importantes. Resuma o texto para aproximadamente ${targetLength} caracteres. Mantenha o tom e estilo original. Responda apenas com o resumo, sem explicações adicionais.`,
+          },
+          {
+            role: "user",
+            content: `<text_to_summarize>\n${text}\n</text_to_summarize>`,
+          },
+        ],
+        max_tokens: Math.ceil(targetLength / 2), // Conservative estimate for multilingual text
+        temperature: 0.3,
+      }),
+      signal: controller.signal,
+    });
+
+    if (!response.ok) {
+      throw new Error("Summarization service unavailable");
+    }
+
+    const data = await response.json() as {
+      choices?: Array<{ message?: { content?: string } }>;
+    };
+    const summary = data.choices?.[0]?.message?.content?.trim();
+
+    if (!summary) {
+      throw new Error("No summary returned");
+    }
+
+    return summary;
+  } finally {
+    clearTimeout(timeout);
+  }
+}
+
 function getApiKey(config: TtsConfig, provider: string): string | undefined {
  if (provider === "elevenlabs") {
    return (
@@ -614,6 +702,39 @@ Do NOT add extra text around the MEDIA directive.`,
    },
  });

+  // /tts_limit [number] - Set or show max text length before summarizing
+  api.registerCommand({
+    name: "tts_limit",
+    description: "Set or show max text length for TTS (longer texts are summarized)",
+    acceptsArgs: true,
+    handler: (ctx) => {
+      const arg = ctx.args?.trim();
+      const currentLimit = getTtsMaxLength(prefsPath);
+
+      if (!arg) {
+        // Show current limit
+        return {
+          text: `📏 **Limite TTS**\n\n` +
+            `Limite atual: **${currentLimit}** caracteres\n\n` +
+            `Textos maiores que ${currentLimit} chars serão resumidos automaticamente com gpt-4o-mini antes de converter em áudio.\n\n` +
+            `Uso: /tts_limit 2000 (define novo limite)`,
+        };
+      }
+
+      const newLimit = parseInt(arg, 10);
+      if (isNaN(newLimit) || newLimit < 100 || newLimit > 10000) {
+        return { text: "❌ Limite inválido. Use um número entre 100 e 10000." };
+      }
+
+      setTtsMaxLength(prefsPath, newLimit);
+      log.info(`[${PLUGIN_ID}] Max length set to ${newLimit} via /tts_limit command`);
+      return {
+        text: `✅ Limite TTS alterado para **${newLimit}** caracteres!\n\n` +
+          `Textos maiores serão resumidos automaticamente antes de virar áudio.`,
+      };
+    },
+  });
+
  // ===========================================================================
  // Auto-TTS Hook (message_sending)
  // ===========================================================================
@@ -640,10 +761,40 @@ Do NOT add extra text around the MEDIA directive.`,
      return;
    }

-    log.info(`[${PLUGIN_ID}] Auto-TTS: Converting ${content.length} chars`);
+    const maxLength = getTtsMaxLength(prefsPath);
+    let textForAudio = content;
+
+    // If text exceeds limit, summarize it first
+    if (content.length > maxLength) {
+      log.info(`[${PLUGIN_ID}] Auto-TTS: Text too long (${content.length} > ${maxLength}), summarizing...`);
+
+      const openaiKey = getApiKey(config, "openai");
+      if (!openaiKey) {
+        log.warn(`[${PLUGIN_ID}] Auto-TTS: No OpenAI key for summarization, skipping audio`);
+        return; // Can't summarize without OpenAI key
+      }
+
+      try {
+        textForAudio = await summarizeText(content, maxLength, openaiKey, config.timeoutMs);
+        log.info(`[${PLUGIN_ID}] Auto-TTS: Summarized to ${textForAudio.length} chars`);
+
+        // Safeguard: if summary still exceeds hard limit, truncate
+        const hardLimit = config.maxTextLength || 4000;
+        if (textForAudio.length > hardLimit) {
+          log.warn(`[${PLUGIN_ID}] Auto-TTS: Summary exceeded hard limit (${textForAudio.length} > ${hardLimit}), truncating`);
+          textForAudio = textForAudio.slice(0, hardLimit - 3) + "...";
+        }
+      } catch (err) {
+        const error = err as Error;
+        log.error(`[${PLUGIN_ID}] Auto-TTS: Summarization failed: ${error.message}`);
+        return; // On summarization failure, skip audio
+      }
+    } else {
+      log.info(`[${PLUGIN_ID}] Auto-TTS: Converting ${content.length} chars`);
+    }

    try {
-      const result = await textToSpeech(content, config, prefsPath);
+      const result = await textToSpeech(textForAudio, config, prefsPath);

      if (result.success && result.audioPath) {
        log.info(`[${PLUGIN_ID}] Auto-TTS: Audio generated: ${result.audioPath}`);