feat: add edge-tts as zero-cost voice output provider
Some checks failed
CI / test (pull_request) Failing after 33s
CI / validate (pull_request) Failing after 26s
Review Approval Gate / verify-review (pull_request) Failing after 5s

- Add EdgeTTSAdapter to bin/deepdive_tts.py (provider key: "edge-tts")
  default voice: en-US-GuyNeural, no API key required
- Add EdgeTTS class to intelligence/deepdive/tts_engine.py
- Update HybridTTS to try edge-tts as fallback between piper and elevenlabs
- Add --voice-memo flag to bin/night_watch.py for spoken nightly reports
- Add edge-tts>=6.1.9 to requirements.txt
- Create docs/voice-output.md documenting all providers and fallback chain
- Add tests/test_edge_tts.py with 17 unit tests (all mocked, no network)

Fixes #1126

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
Alexander Whitestone
2026-04-08 06:29:26 -04:00
parent a1c153c095
commit ef74536e33
6 changed files with 694 additions and 7 deletions

View File

@@ -157,14 +157,45 @@ class ElevenLabsTTS:
return output_path
class EdgeTTS:
"""Zero-cost TTS using Microsoft Edge neural voices (no API key required).
Requires: pip install edge-tts>=6.1.9
"""
DEFAULT_VOICE = "en-US-GuyNeural"
def __init__(self, voice: str = None):
self.voice = voice or self.DEFAULT_VOICE
def synthesize(self, text: str, output_path: str) -> str:
"""Convert text to MP3 via Edge TTS."""
try:
import edge_tts
except ImportError:
raise RuntimeError("edge-tts not installed. Run: pip install edge-tts")
import asyncio
from pathlib import Path
mp3_path = str(Path(output_path).with_suffix(".mp3"))
async def _run():
communicate = edge_tts.Communicate(text, self.voice)
await communicate.save(mp3_path)
asyncio.run(_run())
return mp3_path
class HybridTTS:
"""TTS with sovereign primary, cloud fallback."""
def __init__(self, prefer_cloud: bool = False):
self.primary = None
self.fallback = None
self.prefer_cloud = prefer_cloud
# Try preferred engine
if prefer_cloud:
self._init_elevenlabs()
@@ -172,21 +203,29 @@ class HybridTTS:
self._init_piper()
else:
self._init_piper()
if not self.primary:
self._init_edge_tts()
if not self.primary:
self._init_elevenlabs()
def _init_piper(self):
try:
self.primary = PiperTTS()
except Exception as e:
print(f"Piper init failed: {e}")
def _init_edge_tts(self):
try:
self.primary = EdgeTTS()
except Exception as e:
print(f"EdgeTTS init failed: {e}")
def _init_elevenlabs(self):
try:
self.primary = ElevenLabsTTS()
except Exception as e:
print(f"ElevenLabs init failed: {e}")
def synthesize(self, text: str, output_path: str) -> str:
"""Synthesize with fallback."""
if self.primary:
@@ -194,7 +233,7 @@ class HybridTTS:
return self.primary.synthesize(text, output_path)
except Exception as e:
print(f"Primary failed: {e}")
raise RuntimeError("No TTS engine available")