feat: support Podcast generation

2026-04-21 05:14:45 +08:00 · 2025-04-19 17:37:40 +08:00
parent 6556056df2
commit be5f823395
9 changed files with 255 additions and 6 deletions
--- a/src/podcast/graph/tts_node.py
+++ b/src/podcast/graph/tts_node.py
@@ -0,0 +1,44 @@
+import base64
+import logging
+import os
+
+from src.podcast.graph.state import PodcastState
+from src.tools.tts import VolcengineTTS
+
+logger = logging.getLogger(__name__)
+
+
+def tts_node(state: PodcastState):
+    """Synthesize audio for every line of the podcast script.
+
+    Each line of ``state["script"].lines`` is sent to the TTS client with the
+    voice "BV002_streaming" when ``line.speaker == "male"`` and
+    "BV001_streaming" otherwise. Successful results are base64-decoded and
+    collected; failed results are logged and skipped.
+
+    Args:
+        state: Graph state; ``state["script"]`` and ``state["audio_chunks"]``
+            are read. The state itself is not modified.
+
+    Returns:
+        A dict whose "audio_chunks" entry holds the chunks already present in
+        the state followed by the newly decoded ones, in script order.
+
+    Raises:
+        Exception: Propagated from ``_create_tts_client`` when the TTS
+            credentials are not configured.
+    """
+    logger.info("Generating audio chunks for podcast...")
+    tts_client = _create_tts_client()
+    # Work on a copy: appending to the list held by the incoming state would
+    # mutate the caller's object and leak chunks into anything sharing it.
+    audio_chunks = list(state["audio_chunks"])
+    for line in state["script"].lines:
+        # The client is reused across lines; only the voice is switched.
+        tts_client.voice_type = (
+            "BV002_streaming" if line.speaker == "male" else "BV001_streaming"
+        )
+        result = tts_client.text_to_speech(line.text, speed_ratio=1.1)
+        if not result["success"]:
+            # Best effort: report the failure and continue with the next line.
+            logger.error(result["error"])
+            continue
+        audio_chunks.append(base64.b64decode(result["audio_data"]))
+    return {
+        "audio_chunks": audio_chunks,
+    }
+
+
+def _create_tts_client():
+    """Build a VolcengineTTS client configured from environment variables.
+
+    Reads VOLCENGINE_TTS_APPID and VOLCENGINE_TTS_ACCESS_TOKEN (both
+    required) and VOLCENGINE_TTS_CLUSTER (optional, "volcano_tts" when unset
+    or empty). The client is created with voice type "BV001_streaming".
+
+    Returns:
+        A VolcengineTTS instance.
+
+    Raises:
+        ValueError: If a required variable is unset or empty. ValueError is
+            an Exception subclass, so handlers written for Exception still
+            catch it.
+    """
+    app_id = os.getenv("VOLCENGINE_TTS_APPID", "")
+    if not app_id:
+        raise ValueError("VOLCENGINE_TTS_APPID is not set")
+    access_token = os.getenv("VOLCENGINE_TTS_ACCESS_TOKEN", "")
+    if not access_token:
+        raise ValueError("VOLCENGINE_TTS_ACCESS_TOKEN is not set")
+    # Treat an empty value like an unset one, matching the checks above, so a
+    # blank entry in an env file does not produce an empty cluster name.
+    cluster = os.getenv("VOLCENGINE_TTS_CLUSTER") or "volcano_tts"
+    voice_type = "BV001_streaming"
+    return VolcengineTTS(
+        appid=app_id,
+        access_token=access_token,
+        cluster=cluster,
+        voice_type=voice_type,
+    )