Interface TranscribeParams<Format, TokenTimestamp>

/**
 * Flat set of options describing a transcription request.
 *
 * NOTE(review): the field names (and the `WhisperSamplingStrategy` type used by
 * `strategy`) suggest these mirror Whisper's full-params options — confirm
 * against the code that consumes this interface before relying on that.
 *
 * Every property is required; none is declared optional.
 *
 * @typeParam Format - Type of the `format` property.
 * @typeParam TokenTimestamp - Type of the `token_timestamps` property.
 */
interface TranscribeParams<Format, TokenTimestamp> {
    audio_ctx: number;
    beam_size: number;
    best_of: number;
    debug_mode: boolean;
    // presumably a duration in milliseconds, per the `_ms` suffix — TODO confirm
    duration_ms: number;
    entropy_thold: number;
    // Typed by the `Format` type parameter.
    format: Format;
    initial_prompt: string;
    /**
     * Language code, e.g. "en", "de", "fr", "es", "it", "nl", "pt", "ru", "tr",
     * "uk", "pl", "sv", "cs", "zh", "ja", "ko"
     */
    language: string;
    length_penalty: number;
    logprob_thold: number;
    max_initial_ts: number;
    max_len: number;
    max_tokens: number;
    n_max_text_ctx: number;
    n_threads: number;
    no_context: boolean;
    no_speech_thold: number;
    no_timestamps: boolean;
    // presumably an offset in milliseconds, per the `_ms` suffix — TODO confirm
    offset_ms: number;
    print_progress: boolean;
    print_realtime: boolean;
    print_special: boolean;
    print_timestamps: boolean;
    single_segment: boolean;
    speed_up: boolean;
    split_on_word: boolean;
    // `WhisperSamplingStrategy` is declared elsewhere; not visible in this file.
    strategy: WhisperSamplingStrategy;
    suppress_blank: boolean;
    suppress_non_speech_tokens: boolean;
    tdrz_enable: boolean;
    temperature: number;
    temperature_inc: number;
    thold_pt: number;
    thold_ptsum: number;
    // Typed by the `TokenTimestamp` type parameter.
    token_timestamps: TokenTimestamp;
    translate: boolean;
}

Type Parameters

Format
TokenTimestamp

Properties

audio_ctx: number
beam_size: number
best_of: number
debug_mode: boolean
duration_ms: number
entropy_thold: number
format: Format
initial_prompt: string
language: string

Language code, e.g. "en", "de", "fr", "es", "it", "nl", "pt", "ru", "tr", "uk", "pl", "sv", "cs", "zh", "ja", "ko"

length_penalty: number
logprob_thold: number
max_initial_ts: number
max_len: number
max_tokens: number
n_max_text_ctx: number
n_threads: number
no_context: boolean
no_speech_thold: number
no_timestamps: boolean
offset_ms: number
print_progress: boolean
print_realtime: boolean
print_special: boolean
print_timestamps: boolean
single_segment: boolean
speed_up: boolean
split_on_word: boolean
strategy: WhisperSamplingStrategy
suppress_blank: boolean
suppress_non_speech_tokens: boolean
tdrz_enable: boolean
temperature: number
temperature_inc: number
thold_pt: number
thold_ptsum: number
token_timestamps: TokenTimestamp
translate: boolean