Add option to configure SentenceBoundary (#348)

* Create FUNDING.yml * add setence boundary which is more friendly to Chinese users --------- Co-authored-by: Rany <ranygh@riseup.net>
2025-08-05 18:06:03 +08:00
parent ffe009af9a
commit f78c8ece0a
10 changed files with 90 additions and 18 deletions
--- a/examples/async_audio_streaming_with_predefined_voice_and_subtitles.py
+++ b/examples/async_audio_streaming_with_predefined_voice_and_subtitles.py
@@ -21,7 +21,7 @@ async def amain() -> None:
        async for chunk in communicate.stream():
            if chunk["type"] == "audio":
                file.write(chunk["data"])
-            elif chunk["type"] == "WordBoundary":
+            elif chunk["type"] in ("WordBoundary", "SentenceBoundary"):
                submaker.feed(chunk)

    with open(SRT_FILE, "w", encoding="utf-8") as file:
--- a/examples/sync_audio_streaming_with_predefined_voice_subtitles.py
+++ b/examples/sync_audio_streaming_with_predefined_voice_subtitles.py
@@ -20,7 +20,7 @@ def main() -> None:
        for chunk in communicate.stream_sync():
            if chunk["type"] == "audio":
                file.write(chunk["data"])
-            elif chunk["type"] == "WordBoundary":
+            elif chunk["type"] in ("WordBoundary", "SentenceBoundary"):
                submaker.feed(chunk)

    with open(SRT_FILE, "w", encoding="utf-8") as file:
--- a/examples/sync_audio_streaming_with_predefined_voice_subtitles_print2stdout.py
+++ b/examples/sync_audio_streaming_with_predefined_voice_subtitles_print2stdout.py
@@ -0,0 +1,42 @@
+#!/usr/bin/env python3
+
+"""Sync variant of the async .stream() method to
+get audio chunks and feed them to SubMaker to
+generate subtitles"""
+import sys
+
+import edge_tts
+
+TEXT = """君不见，黄河之水天上来，奔流到海不复回。
+君不见，高堂明镜悲白发，朝如青丝暮成雪。
+人生得意须尽欢，莫使金樽空对月。
+天生我材必有用，千金散尽还复来。
+烹羊宰牛且为乐，会须一饮三百杯。
+岑夫子，丹丘生，将进酒，杯莫停。
+与君歌一曲，请君为我倾耳听。
+钟鼓馔玉不足贵，但愿长醉不复醒。
+古来圣贤皆寂寞，惟有饮者留其名。
+陈王昔时宴平乐，斗酒十千恣欢谑。
+主人何为言少钱，径须沽取对君酌。
+五花马，千金裘，呼儿将出换美酒，与尔同销万古愁。"""
+VOICE = "zh-CN-YunjianNeural"
+
+
+def main() -> None:
+    """Main function"""
+    communicate = edge_tts.Communicate(TEXT, VOICE, Boundary="SentenceBoundary")
+    submaker = edge_tts.SubMaker()
+    stdout = sys.stdout
+    audio_bytes = []
+    for chunk in communicate.stream_sync():
+        if chunk["type"] == "audio":
+            audio_bytes.append(chunk["data"])
+        elif chunk["type"] in ("WordBoundary", "SentenceBoundary"):
+            submaker.feed(chunk)
+
+    stdout.write(f"audio file length: {len(audio_bytes)}")
+    stdout.write(submaker.get_srt())
+
+
+if __name__ == "__main__":
+    main()