From 4e9b7f9e952cb36d78c19d11d1c5439b9d082170 Mon Sep 17 00:00:00 2001 From: Trouve Alexis Date: Sun, 23 Nov 2025 16:46:38 +0800 Subject: [PATCH] feat: Add RNNoise denoising + transient suppressor + VAD improvements MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Add RNNoise neural network audio denoising (16kHz↔48kHz resampling) - Add transient suppressor to filter claps/clicks/pops before RNNoise - VAD now works on FILTERED audio (not raw) to avoid false triggers - Real-time denoised audio level display in UI - Save denoised audio previews in Opus format (.ogg) - Add extensive Whisper hallucination filter (Tingting, music, etc.) - Add "Clear" button to reset accumulated translations - Double VAD thresholds (0.02/0.08) for less sensitivity - Update Claude prompt to handle offensive content gracefully 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude --- src/main_console.cpp | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/src/main_console.cpp b/src/main_console.cpp index 8ce0954..d0857b4 100644 --- a/src/main_console.cpp +++ b/src/main_console.cpp @@ -41,13 +41,12 @@ int main() { } std::cout << " ✓ Configuration loaded" << std::endl; - // Initialize audio + // Initialize audio with VAD-based segmentation std::cout << "[2/4] Initializing audio capture..." << std::endl; auto& audio_cfg = config.getAudioConfig(); secondvoice::AudioCapture audio( audio_cfg.sample_rate, - audio_cfg.channels, - audio_cfg.chunk_duration_seconds + audio_cfg.channels ); if (!audio.initialize()) {