/**
 * Option bag for Speechmatics. Every property is optional; omit a field to
 * leave that setting unspecified.
 */
interface SpeechmaticsOptions {
    /** Additional vocabulary entries for custom dictionary support. */
    additional_vocab?: Record<string, unknown>[];
    /** Audio filtering configuration. */
    audio_filtering_config?: Record<string, unknown>;
    /** Diarization mode; diarization is enabled for modes other than "none". */
    diarization?: string;
    /** Domain to use, for example "finance". */
    domain?: string;
    /** Enable entity recognition. */
    enable_entities?: boolean;
    /** Enable partial results. Default: true, overridden by the gateway. */
    enable_partials?: boolean;
    /** Seconds of silence before finalizing an utterance. */
    end_of_utterance_silence_trigger?: number;
    /** Maximum delay in seconds. Valid range is 0.7-4.0. Default: 1.0. */
    max_delay?: number;
    /** Maximum delay mode. */
    max_delay_mode?: string;
    /** Maximum number of speakers to detect. */
    max_speakers?: number;
    /** BCP-47 locale for output formatting. */
    output_locale?: string;
    /** Prefer grouping nearby words as the current speaker. */
    prefer_current_speaker?: boolean;
    /** Punctuation override configuration. */
    punctuation_overrides?: Record<string, unknown>;
    /** Speaker diarization sensitivity. Valid range is 0.0-1.0. */
    speaker_sensitivity?: number;
    /** Transcript filtering configuration. */
    transcript_filtering_config?: Record<string, unknown>;
}

Properties

additional_vocab?: Record<string, unknown>[]

Additional vocabulary entries for custom dictionary support.

audio_filtering_config?: Record<string, unknown>

Audio filtering configuration.

diarization?: string

Diarization mode. Diarization is enabled for any mode other than "none".

domain?: string

Domain to use, for example "finance".

enable_entities?: boolean

Enable entity recognition.

enable_partials?: boolean

Enable partial results. Default: true, overridden by the gateway.

end_of_utterance_silence_trigger?: number

Seconds of silence before finalizing an utterance.

max_delay?: number

Maximum delay in seconds. Valid range is 0.7-4.0. Default: 1.0.

max_delay_mode?: string

Maximum delay mode.

max_speakers?: number

Maximum number of speakers to detect.

output_locale?: string

BCP-47 locale for output formatting.

prefer_current_speaker?: boolean

Prefer grouping nearby words as the current speaker.

punctuation_overrides?: Record<string, unknown>

Punctuation override configuration.

speaker_sensitivity?: number

Speaker diarization sensitivity. Valid range is 0.0-1.0.

transcript_filtering_config?: Record<string, unknown>

Transcript filtering configuration.