From d0436686f047f1d82c30da26cf83f9eca6727292 Mon Sep 17 00:00:00 2001
From: soryu <soryu@soryu.co>
Date: Wed, 28 Jan 2026 03:49:13 +0000
Subject: feat: add inference cancellation support for TTS generation

Add cooperative cancellation via Arc<AtomicBool> cancel flag that
threads through TtsEngine::generate -> Qwen3Tts -> GenerationContext.
The autoregressive loop and streaming decoder check the flag each
iteration and break early when set. The speak WebSocket handler
creates a per-session flag, passes it to generate, and sets it on
Cancel/Stop/Close messages.

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 makima/src/tts/mod.rs | 8 ++++++++
 1 file changed, 8 insertions(+)

(limited to 'makima/src/tts/mod.rs')
diff --git a/makima/src/tts/mod.rs b/makima/src/tts/mod.rs
index 2cd0412..b66f4a5 100644
--- a/makima/src/tts/mod.rs
+++ b/makima/src/tts/mod.rs
@@ -5,6 +5,8 @@
 //! - **Qwen3**: Pure Rust candle-based Qwen3-TTS-12Hz-0.6B
 
 use std::path::Path;
+use std::sync::atomic::AtomicBool;
+use std::sync::Arc;
 
 pub mod chatterbox;
 pub mod qwen3;
@@ -109,11 +111,17 @@ pub enum TtsBackend {
 #[async_trait::async_trait]
 pub trait TtsEngine: Send + Sync {
     /// Generate complete audio from text with a voice reference.
+    ///
+    /// The optional `cancel_flag` can be set to `true` by another thread/task
+    /// to request early termination of the generation loop. Engines that
+    /// support cancellation will check this flag periodically and return
+    /// whatever audio has been produced so far.
     async fn generate(
         &self,
         text: &str,
         reference_audio: Option<&[f32]>,
         reference_sample_rate: Option<u32>,
+        cancel_flag: Option<Arc<AtomicBool>>,
     ) -> Result<Vec<AudioChunk>, TtsError>;
 
     /// Check if the engine is loaded and ready.
-- 
cgit v1.2.3