summaryrefslogtreecommitdiff
path: root/makima/src/server/handlers
diff options
context:
space:
mode:
author soryu <soryu@soryu.co> 2026-02-01 03:04:36 +0000
committer soryu <soryu@soryu.co> 2026-02-01 03:04:36 +0000
commit a2c147ddd59f55a07b5be0c8970169726b55c876 (patch)
tree e41a80f2dfdd8fcaf6b6e91c899392f4e619ca3e /makima/src/server/handlers
parent 65eebd078af712d004a5a9e28863a16df30792a6 (diff)
download soryu-a2c147ddd59f55a07b5be0c8970169726b55c876.tar.gz
soryu-a2c147ddd59f55a07b5be0c8970169726b55c876.zip
Use chatterbox TTS
Diffstat (limited to 'makima/src/server/handlers')
-rw-r--r-- makima/src/server/handlers/speak.rs 5
1 files changed, 2 insertions, 3 deletions
diff --git a/makima/src/server/handlers/speak.rs b/makima/src/server/handlers/speak.rs
index 3ed2620..b235c65 100644
--- a/makima/src/server/handlers/speak.rs
+++ b/makima/src/server/handlers/speak.rs
@@ -1,19 +1,18 @@
//! WebSocket handler for TTS streaming (direct in-process inference).
//!
//! This module implements the `/api/v1/speak` endpoint which performs
-//! text-to-speech synthesis directly using the candle-based TTS engine.
+//! text-to-speech synthesis directly using the Chatterbox ONNX TTS engine.
//! No external Python service or proxy — the model runs in-process.
//!
//! ## Architecture
//!
//! The speak handler will:
//! 1. Accept a WebSocket connection from the client
-//! 2. Lazily load the TTS model (candle) on first request
+//! 2. Lazily load the TTS model (Chatterbox ONNX) on first request
//! 3. Parse JSON control messages (start, speak, stop, cancel)
//! 4. Run inference directly and stream audio chunks back
//!
//! See `makima/src/tts/` for the TTS engine implementation.
-//! See `docs/specs/qwen3-tts-spec.md` for the full protocol specification.
use std::sync::atomic::{AtomicBool, Ordering};
use std::sync::Arc;