mirror of
https://github.com/kyutai-labs/delayed-streams-modeling.git
synced 2025-12-23 03:19:57 +00:00
Add a comment with the different time horizons.
This commit is contained in:
@@ -172,8 +172,9 @@ impl Model {
|
|||||||
for asr_msg in asr_msgs.iter() {
|
for asr_msg in asr_msgs.iter() {
|
||||||
match asr_msg {
|
match asr_msg {
|
||||||
moshi::asr::AsrMsg::Step { prs, .. } => {
|
moshi::asr::AsrMsg::Step { prs, .. } => {
|
||||||
// prs is the probability of voice activity for different time horizons.
|
// prs is the probability of having no voice activity for different time
|
||||||
// The first element is the most recent time horizon.
|
// horizons.
|
||||||
|
// In kyutai/stt-1b-en_fr-candle, these horizons are 0.5s, 1s, 2s, and 3s.
|
||||||
if self.vad && prs[2][0] > 0.5 && !printed_eot {
|
if self.vad && prs[2][0] > 0.5 && !printed_eot {
|
||||||
printed_eot = true;
|
printed_eot = true;
|
||||||
if !self.timestamps {
|
if !self.timestamps {
|
||||||
|
|||||||
Reference in New Issue
Block a user