feat: add call history API endpoints and TTS service client

Adds read-only access to persisted call records for the dashboard
and implements a client for the Rhema text-to-speech service.

- api/call_history.py: New router providing paged call lists
  and detailed call records with transcript metadata.
- services/tts.py: Async client for OpenAI-compatible TTS
  endpoints (Rhema/Kokoro) used for call-flow steps.
This commit is contained in:
2026-05-22 06:28:33 -04:00
parent dbdb03beb9
commit 63f1a270bb
28 changed files with 2275 additions and 11 deletions

90
services/tts.py Normal file
View File

@@ -0,0 +1,90 @@
"""
TTS Service — Rhema (OpenAI-compatible) text-to-speech client.
Synthesizes speech for the SPEAK call-flow step and the AI Receptionist.
Rhema exposes POST /v1/audio/speech (OpenAI-compatible) with Kokoro voices.
"""
import logging
from pathlib import Path
from typing import Optional
import httpx
from config import TTSSettings
logger = logging.getLogger(__name__)
class TTSService:
"""Client for Rhema TTS service."""
def __init__(self, settings: TTSSettings):
self.settings = settings
self._client: Optional[httpx.AsyncClient] = None
async def _get_client(self) -> httpx.AsyncClient:
if self._client is None or self._client.is_closed:
headers = {}
if self.settings.api_key:
headers["Authorization"] = f"Bearer {self.settings.api_key}"
self._client = httpx.AsyncClient(
base_url=self.settings.base_url,
timeout=httpx.Timeout(self.settings.timeout, connect=5.0),
headers=headers,
)
return self._client
async def synthesize(
self,
text: str,
voice: Optional[str] = None,
response_format: str = "wav",
) -> bytes:
"""Synthesize speech and return audio bytes."""
if not text or not text.strip():
return b""
client = await self._get_client()
body = {
"model": self.settings.model,
"input": text,
"voice": voice or self.settings.voice,
"response_format": response_format,
"sample_rate": self.settings.sample_rate,
}
try:
response = await client.post("/v1/audio/speech", json=body)
response.raise_for_status()
return response.content
except httpx.HTTPStatusError as e:
logger.error(f"Rhema TTS error: {e.response.status_code} {e.response.text}")
return b""
except httpx.ConnectError:
logger.error(f"Cannot connect to Rhema at {self.settings.base_url}")
return b""
except Exception as e:
logger.error(f"TTS synthesis failed: {e}")
return b""
async def synthesize_to_file(
self,
text: str,
filepath: str | Path,
voice: Optional[str] = None,
) -> bool:
"""Synthesize to a WAV file. Returns True on success."""
audio = await self.synthesize(text, voice=voice, response_format="wav")
if not audio:
return False
path = Path(filepath)
path.parent.mkdir(parents=True, exist_ok=True)
path.write_bytes(audio)
logger.debug(f"TTS wrote {len(audio)} bytes to {path}")
return True
async def close(self) -> None:
if self._client and not self._client.is_closed:
await self._client.aclose()
self._client = None