tune: Adjust VAD parameters for longer segments
- min_speech_duration: 300ms → 1000ms (avoid tiny segments)
- silence_duration: 400ms → 700ms (wait longer before cutting)
- hang_frames_threshold: 20 → 35 (~350ms pause tolerance)

This should reduce mid-sentence cuts and give Whisper more context.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
This commit is contained in:
parent
53b21b94d6
commit
a28bb89913
@ -69,8 +69,8 @@ private:
|
|||||||
// VAD parameters - Higher threshold to avoid false triggers on filtered noise
|
// VAD parameters - Higher threshold to avoid false triggers on filtered noise
|
||||||
std::atomic<float> vad_rms_threshold_{0.02f}; // Was 0.01f
|
std::atomic<float> vad_rms_threshold_{0.02f}; // Was 0.01f
|
||||||
std::atomic<float> vad_peak_threshold_{0.08f}; // Was 0.04f
|
std::atomic<float> vad_peak_threshold_{0.08f}; // Was 0.04f
|
||||||
int silence_duration_ms_ = 400; // Wait 400ms of silence before cutting
|
int silence_duration_ms_ = 700; // Wait 700ms of silence before cutting (was 400)
|
||||||
int min_speech_duration_ms_ = 300; // Minimum speech to send
|
int min_speech_duration_ms_ = 1000; // Minimum 1s speech to send (was 300)
|
||||||
int max_speech_duration_ms_ = 25000; // 25s max before forced flush
|
int max_speech_duration_ms_ = 25000; // 25s max before forced flush
|
||||||
|
|
||||||
// Adaptive noise floor
|
// Adaptive noise floor
|
||||||
@ -79,7 +79,7 @@ private:
|
|||||||
|
|
||||||
// Hang time - wait before cutting to avoid mid-sentence cuts
|
// Hang time - wait before cutting to avoid mid-sentence cuts
|
||||||
int hang_frames_ = 0;
|
int hang_frames_ = 0;
|
||||||
int hang_frames_threshold_ = 20; // ~200ms tolerance for pauses
|
int hang_frames_threshold_ = 35; // ~350ms tolerance for pauses (was 20)
|
||||||
|
|
||||||
// Zero-crossing rate for speech vs noise discrimination
|
// Zero-crossing rate for speech vs noise discrimination
|
||||||
float last_zcr_ = 0.0f;
|
float last_zcr_ = 0.0f;
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user