Add a comment with the different time horizons.

This commit is contained in:
laurent 2025-06-19 15:34:49 +02:00
parent d473deddaf
commit d7642ff1e9

View File

@@ -172,8 +172,9 @@ impl Model {
for asr_msg in asr_msgs.iter() { for asr_msg in asr_msgs.iter() {
match asr_msg { match asr_msg {
moshi::asr::AsrMsg::Step { prs, .. } => { moshi::asr::AsrMsg::Step { prs, .. } => {
// prs is the probability of voice activity for different time horizons. // prs is the probability of having no voice activity for different time
// The first element is the most recent time horizon. // horizons.
// In kyutai/stt-1b-en_fr-candle, these horizons are 0.5s, 1s, 2s, and 3s.
if self.vad && prs[2][0] > 0.5 && !printed_eot { if self.vad && prs[2][0] > 0.5 && !printed_eot {
printed_eot = true; printed_eot = true;
if !self.timestamps { if !self.timestamps {