/**
 * Tunable settings for voice activity detection (VAD).
 *
 * All durations are expressed in milliseconds; both thresholds are
 * sigmoid probabilities.
 */
interface VADOptions {
  /** Sigmoid probability threshold for activation. */
  activationThreshold: number;

  /**
   * Sigmoid probability threshold for deactivation.
   * Defaults to `max(activationThreshold - 0.15, 0.01)`.
   */
  deactivationThreshold: number;

  /** Upper bound (ms) on the speech buffered for a single utterance. */
  maxBufferedSpeech: number;

  /** Trailing silence (ms) required before END_OF_SPEECH is reported. */
  minSilenceDuration: number;

  /** Minimum speech duration (ms) required before START_OF_SPEECH is reported. */
  minSpeechDuration: number;

  /** Pre-roll (ms) included in the speech buffer ahead of START_OF_SPEECH. */
  prefixPaddingDuration: number;
}

Properties

activationThreshold: number

Sigmoid probability threshold for activation.

deactivationThreshold: number

Sigmoid probability threshold for deactivation (defaults to max(activationThreshold - 0.15, 0.01)).

maxBufferedSpeech: number

Maximum duration (ms) of buffered speech per utterance.

minSilenceDuration: number

Trailing silence (ms) before reporting END_OF_SPEECH.

minSpeechDuration: number

Minimum speech duration (ms) before reporting START_OF_SPEECH.

prefixPaddingDuration: number

Pre-roll (ms) included in the speech buffer ahead of START_OF_SPEECH.