RubyGems - whispercpp - Versions diffs - 1.2.0.2 → 1.3.1 - Mend

whispercpp 1.2.0.2 → 1.3.1

Files changed (135) hide show

checksums.yaml +4 -4
data/.gitignore +5 -0
data/LICENSE +1 -1
data/README.md +165 -434
data/Rakefile +46 -86
data/ext/.gitignore +13 -0
data/ext/cpu.mk +9 -0
data/ext/{dr_wav.h → examples/dr_wav.h} +3560 -1179
data/ext/extconf.rb +185 -7
data/ext/ggml/include/ggml-alloc.h +76 -0
data/ext/ggml/include/ggml-backend.h +352 -0
data/ext/ggml/include/ggml-blas.h +25 -0
data/ext/ggml/include/ggml-cann.h +123 -0
data/ext/ggml/include/ggml-cpp.h +38 -0
data/ext/ggml/include/ggml-cpu.h +135 -0
data/ext/ggml/include/ggml-cuda.h +47 -0
data/ext/ggml/include/ggml-kompute.h +50 -0
data/ext/ggml/include/ggml-metal.h +66 -0
data/ext/ggml/include/ggml-opencl.h +26 -0
data/ext/ggml/include/ggml-opt.h +216 -0
data/ext/ggml/include/ggml-rpc.h +28 -0
data/ext/ggml/include/ggml-sycl.h +49 -0
data/ext/ggml/include/ggml-vulkan.h +31 -0
data/ext/ggml/include/ggml.h +2285 -0
data/ext/ggml/src/ggml-alloc.c +1037 -0
data/ext/ggml/src/ggml-amx/common.h +94 -0
data/ext/ggml/src/ggml-amx/ggml-amx.cpp +446 -0
data/ext/ggml/src/ggml-amx/mmq.cpp +2510 -0
data/ext/ggml/src/ggml-amx/mmq.h +17 -0
data/ext/ggml/src/ggml-backend-impl.h +256 -0
data/ext/ggml/src/ggml-backend-reg.cpp +552 -0
data/ext/ggml/src/ggml-backend.cpp +1999 -0
data/ext/ggml/src/ggml-blas/ggml-blas.cpp +517 -0
data/ext/ggml/src/ggml-cann/acl_tensor.cpp +175 -0
data/ext/ggml/src/ggml-cann/acl_tensor.h +258 -0
data/ext/ggml/src/ggml-cann/aclnn_ops.cpp +3427 -0
data/ext/ggml/src/ggml-cann/aclnn_ops.h +592 -0
data/ext/ggml/src/ggml-cann/common.h +286 -0
data/ext/ggml/src/ggml-cann/ggml-cann.cpp +2188 -0
data/ext/ggml/src/ggml-cann/kernels/ascendc_kernels.h +19 -0
data/ext/ggml/src/ggml-cann/kernels/dup.cpp +236 -0
data/ext/ggml/src/ggml-cann/kernels/get_row_f16.cpp +197 -0
data/ext/ggml/src/ggml-cann/kernels/get_row_f32.cpp +190 -0
data/ext/ggml/src/ggml-cann/kernels/get_row_q4_0.cpp +204 -0
data/ext/ggml/src/ggml-cann/kernels/get_row_q8_0.cpp +191 -0
data/ext/ggml/src/ggml-cann/kernels/quantize_f16_q8_0.cpp +218 -0
data/ext/ggml/src/ggml-cann/kernels/quantize_f32_q8_0.cpp +216 -0
data/ext/ggml/src/ggml-cann/kernels/quantize_float_to_q4_0.cpp +295 -0
data/ext/ggml/src/ggml-common.h +1853 -0
data/ext/ggml/src/ggml-cpu/amx/amx.cpp +220 -0
data/ext/ggml/src/ggml-cpu/amx/amx.h +8 -0
data/ext/ggml/src/ggml-cpu/amx/common.h +91 -0
data/ext/ggml/src/ggml-cpu/amx/mmq.cpp +2511 -0
data/ext/ggml/src/ggml-cpu/amx/mmq.h +10 -0
data/ext/ggml/src/ggml-cpu/cpu-feats-x86.cpp +323 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-aarch64.cpp +4262 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-aarch64.h +8 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-hbm.cpp +55 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-hbm.h +8 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-impl.h +386 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-quants.c +10835 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-quants.h +63 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-traits.cpp +36 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu-traits.h +38 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu.c +14123 -0
data/ext/ggml/src/ggml-cpu/ggml-cpu.cpp +622 -0
data/ext/ggml/src/ggml-cpu/llamafile/sgemm.cpp +1884 -0
data/ext/ggml/src/ggml-cpu/llamafile/sgemm.h +14 -0
data/ext/ggml/src/ggml-cuda/vendors/cuda.h +14 -0
data/ext/ggml/src/ggml-cuda/vendors/hip.h +186 -0
data/ext/ggml/src/ggml-cuda/vendors/musa.h +134 -0
data/ext/ggml/src/ggml-impl.h +556 -0
data/ext/ggml/src/ggml-kompute/ggml-kompute.cpp +2251 -0
data/ext/ggml/src/ggml-metal/ggml-metal-impl.h +288 -0
data/ext/ggml/src/ggml-metal/ggml-metal.m +4884 -0
data/ext/ggml/src/ggml-metal/ggml-metal.metal +6732 -0
data/ext/ggml/src/ggml-opt.cpp +854 -0
data/ext/ggml/src/ggml-quants.c +5238 -0
data/ext/ggml/src/ggml-quants.h +100 -0
data/ext/ggml/src/ggml-rpc/ggml-rpc.cpp +1406 -0
data/ext/ggml/src/ggml-sycl/common.cpp +95 -0
data/ext/ggml/src/ggml-sycl/concat.cpp +196 -0
data/ext/ggml/src/ggml-sycl/conv.cpp +99 -0
data/ext/ggml/src/ggml-sycl/convert.cpp +547 -0
data/ext/ggml/src/ggml-sycl/dmmv.cpp +1023 -0
data/ext/ggml/src/ggml-sycl/element_wise.cpp +1030 -0
data/ext/ggml/src/ggml-sycl/ggml-sycl.cpp +4729 -0
data/ext/ggml/src/ggml-sycl/im2col.cpp +126 -0
data/ext/ggml/src/ggml-sycl/mmq.cpp +3031 -0
data/ext/ggml/src/ggml-sycl/mmvq.cpp +1015 -0
data/ext/ggml/src/ggml-sycl/norm.cpp +378 -0
data/ext/ggml/src/ggml-sycl/outprod.cpp +56 -0
data/ext/ggml/src/ggml-sycl/rope.cpp +276 -0
data/ext/ggml/src/ggml-sycl/softmax.cpp +251 -0
data/ext/ggml/src/ggml-sycl/tsembd.cpp +72 -0
data/ext/ggml/src/ggml-sycl/wkv6.cpp +141 -0
data/ext/ggml/src/ggml-threading.cpp +12 -0
data/ext/ggml/src/ggml-threading.h +14 -0
data/ext/ggml/src/ggml-vulkan/ggml-vulkan.cpp +8657 -0
data/ext/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp +593 -0
data/ext/ggml/src/ggml.c +7694 -0
data/ext/include/whisper.h +672 -0
data/ext/metal-embed.mk +17 -0
data/ext/metal.mk +6 -0
data/ext/ruby_whisper.cpp +1608 -159
data/ext/ruby_whisper.h +10 -0
data/ext/scripts/get-flags.mk +38 -0
data/ext/src/coreml/whisper-decoder-impl.h +146 -0
data/ext/src/coreml/whisper-decoder-impl.m +201 -0
data/ext/src/coreml/whisper-encoder-impl.h +142 -0
data/ext/src/coreml/whisper-encoder-impl.m +197 -0
data/ext/src/coreml/whisper-encoder.h +26 -0
data/ext/src/openvino/whisper-openvino-encoder.cpp +108 -0
data/ext/src/openvino/whisper-openvino-encoder.h +31 -0
data/ext/src/whisper.cpp +7393 -0
data/extsources.rb +6 -0
data/lib/whisper/model/uri.rb +157 -0
data/lib/whisper.rb +2 -0
data/tests/helper.rb +7 -0
data/tests/jfk_reader/.gitignore +5 -0
data/tests/jfk_reader/extconf.rb +3 -0
data/tests/jfk_reader/jfk_reader.c +68 -0
data/tests/test_callback.rb +160 -0
data/tests/test_error.rb +20 -0
data/tests/test_model.rb +71 -0
data/tests/test_package.rb +31 -0
data/tests/test_params.rb +160 -0
data/tests/test_segment.rb +83 -0
data/tests/test_whisper.rb +211 -123
data/whispercpp.gemspec +36 -0
metadata +137 -11
data/ext/ggml.c +0 -8616
data/ext/ggml.h +0 -748
data/ext/whisper.cpp +0 -4829
data/ext/whisper.h +0 -402

data/ext/whisper.h DELETED Viewed

@@ -1,402 +0,0 @@
-#ifndef WHISPER_H
-#define WHISPER_H
-#include <stddef.h>
-#include <stdint.h>
-#include <stdbool.h>
-#ifdef WHISPER_SHARED
-#    ifdef _WIN32
-#        ifdef WHISPER_BUILD
-#            define WHISPER_API __declspec(dllexport)
-#        else
-#            define WHISPER_API __declspec(dllimport)
-#        endif
-#    else
-#        define WHISPER_API __attribute__ ((visibility ("default")))
-#    endif
-#else
-#    define WHISPER_API
-#endif
-#define WHISPER_SAMPLE_RATE 16000
-#define WHISPER_N_FFT       400
-#define WHISPER_N_MEL       80
-#define WHISPER_HOP_LENGTH  160
-#define WHISPER_CHUNK_SIZE  30
-#ifdef __cplusplus
-extern "C" {
-#endif
-    //
-    // C interface
-    //
-    // The following interface is thread-safe as long as the same whisper_context is not used by multiple threads
-    // concurrently.
-    //
-    // Basic usage:
-    //
-    //     #include "whisper.h"
-    //
-    //     ...
-    //
-    //     struct whisper_context * ctx = whisper_init_from_file("/path/to/ggml-base.en.bin");
-    //
-    //     if (whisper_full(ctx, wparams, pcmf32.data(), pcmf32.size()) != 0) {
-    //         fprintf(stderr, "failed to process audio\n");
-    //         return 7;
-    //     }
-    //
-    //     const int n_segments = whisper_full_n_segments(ctx);
-    //     for (int i = 0; i < n_segments; ++i) {
-    //         const char * text = whisper_full_get_segment_text(ctx, i);
-    //         printf("%s", text);
-    //     }
-    //
-    //     whisper_free(ctx);
-    //
-    //     ...
-    //
-    // This is a demonstration of the most straightforward usage of the library.
-    // "pcmf32" contains the RAW audio data in 32-bit floating point format.
-    //
-    // The interface also allows for more fine-grained control over the computation, but it requires a deeper
-    // understanding of how the model works.
-    //
-    struct whisper_context;
-    typedef int whisper_token;
-    typedef struct whisper_token_data {
-        whisper_token id;  // token id
-        whisper_token tid; // forced timestamp token id
-        float p;           // probability of the token
-        float plog;        // log probability of the token
-        float pt;          // probability of the timestamp token
-        float ptsum;       // sum of probabilities of all timestamp tokens
-        // token-level timestamp data
-        // do not use if you haven't computed token-level timestamps
-        int64_t t0;        // start time of the token
-        int64_t t1;        //   end time of the token
-        float vlen;        // voice length of the token
-    } whisper_token_data;
-    typedef struct whisper_model_loader {
-        void * context;
-        size_t (*read)(void * ctx, void * output, size_t read_size);
-        bool    (*eof)(void * ctx);
-        void  (*close)(void * ctx);
-    } whisper_model_loader;
-    // Various functions for loading a ggml whisper model.
-    // Allocate (almost) all memory needed for the model.
-    // Return NULL on failure
-    WHISPER_API struct whisper_context * whisper_init_from_file(const char * path_model);
-    WHISPER_API struct whisper_context * whisper_init_from_buffer(void * buffer, size_t buffer_size);
-    WHISPER_API struct whisper_context * whisper_init(struct whisper_model_loader * loader);
-    // Frees all memory allocated by the model.
-    WHISPER_API void whisper_free(struct whisper_context * ctx);
-    // Convert RAW PCM audio to log mel spectrogram.
-    // The resulting spectrogram is stored inside the provided whisper context.
-    // Returns 0 on success
-    WHISPER_API int whisper_pcm_to_mel(
-            struct whisper_context * ctx,
-                       const float * samples,
-                               int   n_samples,
-                               int   n_threads);
-    // Convert RAW PCM audio to log mel spectrogram but applies a Phase Vocoder to speed up the audio x2.
-    // The resulting spectrogram is stored inside the provided whisper context.
-    // Returns 0 on success
-    WHISPER_API int whisper_pcm_to_mel_phase_vocoder(
-        struct whisper_context* ctx,
-        const float* samples,
-        int   n_samples,
-        int   n_threads);
-    // This can be used to set a custom log mel spectrogram inside the provided whisper context.
-    // Use this instead of whisper_pcm_to_mel() if you want to provide your own log mel spectrogram.
-    // n_mel must be 80
-    // Returns 0 on success
-    WHISPER_API int whisper_set_mel(
-            struct whisper_context * ctx,
-                       const float * data,
-                               int   n_len,
-                               int   n_mel);
-    // Run the Whisper encoder on the log mel spectrogram stored inside the provided whisper context.
-    // Make sure to call whisper_pcm_to_mel() or whisper_set_mel() first.
-    // offset can be used to specify the offset of the first frame in the spectrogram.
-    // Returns 0 on success
-    WHISPER_API int whisper_encode(
-            struct whisper_context * ctx,
-                               int   offset,
-                               int   n_threads);
-    // Run the Whisper decoder to obtain the logits and probabilities for the next token.
-    // Make sure to call whisper_encode() first.
-    // tokens + n_tokens is the provided context for the decoder.
-    // n_past is the number of tokens to use from previous decoder calls.
-    // Returns 0 on success
-    // TODO: add support for multiple decoders
-    WHISPER_API int whisper_decode(
-            struct whisper_context * ctx,
-               const whisper_token * tokens,
-                               int   n_tokens,
-                               int   n_past,
-                               int   n_threads);
-    // Convert the provided text into tokens.
-    // The tokens pointer must be large enough to hold the resulting tokens.
-    // Returns the number of tokens on success, no more than n_max_tokens
-    // Returns -1 on failure
-    // TODO: not sure if correct
-    WHISPER_API int whisper_tokenize(
-            struct whisper_context * ctx,
-                        const char * text,
-                     whisper_token * tokens,
-                               int   n_max_tokens);
-    // Largest language id (i.e. number of available languages - 1)
-    WHISPER_API int whisper_lang_max_id();
-    // Return the id of the specified language, returns -1 if not found
-    // Examples:
-    //   "de" -> 2
-    //   "german" -> 2
-    WHISPER_API int whisper_lang_id(const char * lang);
-    // Return the short string of the specified language id (e.g. 2 -> "de"), returns nullptr if not found
-    WHISPER_API const char * whisper_lang_str(int id);
-    // Use mel data at offset_ms to try and auto-detect the spoken language
-    // Make sure to call whisper_pcm_to_mel() or whisper_set_mel() first
-    // Returns the top language id or negative on failure
-    // If not null, fills the lang_probs array with the probabilities of all languages
-    // The array must be whisper_lang_max_id() + 1 in size
-    // ref: https://github.com/openai/whisper/blob/main/whisper/decoding.py#L18-L69
-    WHISPER_API int whisper_lang_auto_detect(
-            struct whisper_context * ctx,
-                               int   offset_ms,
-                               int   n_threads,
-                             float * lang_probs);
-    WHISPER_API int whisper_n_len          (struct whisper_context * ctx); // mel length
-    WHISPER_API int whisper_n_vocab        (struct whisper_context * ctx);
-    WHISPER_API int whisper_n_text_ctx     (struct whisper_context * ctx);
-    WHISPER_API int whisper_n_audio_ctx    (struct whisper_context * ctx);
-    WHISPER_API int whisper_is_multilingual(struct whisper_context * ctx);
-    // Token logits obtained from the last call to whisper_decode()
-    // The logits for the last token are stored in the last row
-    // Rows: n_tokens
-    // Cols: n_vocab
-    WHISPER_API float * whisper_get_logits(struct whisper_context * ctx);
-    // Token Id -> String. Uses the vocabulary in the provided context
-    WHISPER_API const char * whisper_token_to_str(struct whisper_context * ctx, whisper_token token);
-    // Special tokens
-    WHISPER_API whisper_token whisper_token_eot (struct whisper_context * ctx);
-    WHISPER_API whisper_token whisper_token_sot (struct whisper_context * ctx);
-    WHISPER_API whisper_token whisper_token_prev(struct whisper_context * ctx);
-    WHISPER_API whisper_token whisper_token_solm(struct whisper_context * ctx);
-    WHISPER_API whisper_token whisper_token_not (struct whisper_context * ctx);
-    WHISPER_API whisper_token whisper_token_beg (struct whisper_context * ctx);
-    WHISPER_API whisper_token whisper_token_lang(struct whisper_context * ctx, int lang_id);
-    // Task tokens
-    WHISPER_API whisper_token whisper_token_translate (void);
-    WHISPER_API whisper_token whisper_token_transcribe(void);
-    // Performance information
-    WHISPER_API void whisper_print_timings(struct whisper_context * ctx);
-    WHISPER_API void whisper_reset_timings(struct whisper_context * ctx);
-    // Print system information
-    WHISPER_API const char * whisper_print_system_info(void);
-    // Abort a running whisper_full_parallel or whisper_full
-    WHISPER_API void whisper_running_abort(struct whisper_context * ctx);
-    // Resume whisper context from an aborted state, allowing it to run again
-    WHISPER_API void whisper_running_restore(struct whisper_context * ctx);
-    // Check the whisper context state: if true, it can run; if false, it cannot
-    WHISPER_API bool whisper_running_state(struct whisper_context * ctx);
-    ////////////////////////////////////////////////////////////////////////////
-    // Available sampling strategies
-    enum whisper_sampling_strategy {
-        WHISPER_SAMPLING_GREEDY,      // similar to OpenAI's GreedyDecoder
-        WHISPER_SAMPLING_BEAM_SEARCH, // similar to OpenAI's BeamSearchDecoder
-    };
-    // Text segment callback
-    // Called on every newly generated text segment
-    // Use the whisper_full_...() functions to obtain the text segments
-    typedef void (*whisper_new_segment_callback)(struct whisper_context * ctx, int n_new, void * user_data);
-    // Encoder begin callback
-    // If not NULL, called before the encoder starts
-    // If it returns false, the computation is aborted
-    typedef bool (*whisper_encoder_begin_callback)(struct whisper_context * ctx, void * user_data);
-    // Logits filter callback
-    // Can be used to modify the logits before sampling
-    // If not NULL, called after applying temperature to logits
-    typedef void (*whisper_logits_filter_callback)(
-            struct whisper_context * ctx,
-          const whisper_token_data * tokens,
-                               int   n_tokens,
-                             float * logits,
-                              void * user_data);
-    // Parameters for the whisper_full() function
-    // If you change the order or add new parameters, make sure to update the default values in whisper.cpp:
-    // whisper_full_default_params()
-    struct whisper_full_params {
-        enum whisper_sampling_strategy strategy;
-        int n_threads;
-        int n_max_text_ctx;     // max tokens to use from past text as prompt for the decoder
-        int offset_ms;          // start offset in ms
-        int duration_ms;        // audio duration to process in ms
-        bool translate;
-        bool no_context;        // do not use past transcription (if any) as initial prompt for the decoder
-        bool single_segment;    // force single segment output (useful for streaming)
-        bool print_special;     // print special tokens (e.g. <SOT>, <EOT>, <BEG>, etc.)
-        bool print_progress;    // print progress information
-        bool print_realtime;    // print results from within whisper.cpp (avoid it, use callback instead)
-        bool print_timestamps;  // print timestamps for each text segment when printing realtime
-        // [EXPERIMENTAL] token-level timestamps
-        bool  token_timestamps; // enable token-level timestamps
-        float thold_pt;         // timestamp token probability threshold (~0.01)
-        float thold_ptsum;      // timestamp token sum probability threshold (~0.01)
-        int   max_len;          // max segment length in characters
-        bool  split_on_word;    // split on word rather than on token (when used with max_len)
-        int   max_tokens;       // max tokens per segment (0 = no limit)
-        // [EXPERIMENTAL] speed-up techniques
-        // note: these can significantly reduce the quality of the output
-        bool speed_up;          // speed-up the audio by 2x using Phase Vocoder
-        int  audio_ctx;         // overwrite the audio context size (0 = use default)
-        // tokens to provide to the whisper decoder as initial prompt
-        // these are prepended to any existing text context from a previous call
-        const whisper_token * prompt_tokens;
-        int prompt_n_tokens;
-        // for auto-detection, set to nullptr, "" or "auto"
-        const char * language;
-        // common decoding parameters:
-        bool suppress_blank;    // ref: https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/decoding.py#L89
-        bool suppress_non_speech_tokens; // ref: https://github.com/openai/whisper/blob/7858aa9c08d98f75575035ecd6481f462d66ca27/whisper/tokenizer.py#L224-L253
-        float temperature;      // initial decoding temperature, ref: https://ai.stackexchange.com/a/32478
-        float max_initial_ts;   // ref: https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/decoding.py#L97
-        float length_penalty;   // ref: https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/transcribe.py#L267
-        // fallback parameters
-        // ref: https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/transcribe.py#L274-L278
-        float temperature_inc;
-        float entropy_thold;    // similar to OpenAI's "compression_ratio_threshold"
-        float logprob_thold;
-        float no_speech_thold;  // TODO: not implemented
-        struct {
-            int best_of;    // ref: https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/transcribe.py#L264
-        } greedy;
-        struct {
-            int beam_size;  // ref: https://github.com/openai/whisper/blob/f82bc59f5ea234d4b97fb2860842ed38519f7e65/whisper/transcribe.py#L265
-            float patience; // TODO: not implemented, ref: https://arxiv.org/pdf/2204.05424.pdf
-        } beam_search;
-        // called for every newly generated text segment
-        whisper_new_segment_callback new_segment_callback;
-        void * new_segment_callback_user_data;
-        // called each time before the encoder starts
-        whisper_encoder_begin_callback encoder_begin_callback;
-        void * encoder_begin_callback_user_data;
-        // called by each decoder to filter obtained logits
-        whisper_logits_filter_callback logits_filter_callback;
-        void * logits_filter_callback_user_data;
-    };
-    WHISPER_API struct whisper_full_params whisper_full_default_params(enum whisper_sampling_strategy strategy);
-    // Run the entire model: PCM -> log mel spectrogram -> encoder -> decoder -> text
-    // Uses the specified decoding strategy to obtain the text.
-    WHISPER_API int whisper_full(
-                struct whisper_context * ctx,
-            struct whisper_full_params   params,
-                           const float * samples,
-                                   int   n_samples);
-    // Split the input audio in chunks and process each chunk separately using whisper_full()
-    // It seems this approach can offer some speedup in some cases.
-    // However, the transcription accuracy can be worse at the beginning and end of each chunk.
-    WHISPER_API int whisper_full_parallel(
-                struct whisper_context * ctx,
-            struct whisper_full_params   params,
-                           const float * samples,
-                                   int   n_samples,
-                                   int   n_processors);
-    // Number of generated text segments.
-    // A segment can be a few words, a sentence, or even a paragraph.
-    WHISPER_API int whisper_full_n_segments(struct whisper_context * ctx);
-    // Language id associated with the current context
-    WHISPER_API int whisper_full_lang_id(struct whisper_context * ctx);
-    // Get the start and end time of the specified segment.
-    WHISPER_API int64_t whisper_full_get_segment_t0(struct whisper_context * ctx, int i_segment);
-    WHISPER_API int64_t whisper_full_get_segment_t1(struct whisper_context * ctx, int i_segment);
-    // Get the text of the specified segment.
-    WHISPER_API const char * whisper_full_get_segment_text(struct whisper_context * ctx, int i_segment);
-    // Get number of tokens in the specified segment.
-    WHISPER_API int whisper_full_n_tokens(struct whisper_context * ctx, int i_segment);
-    // Get the token text of the specified token in the specified segment.
-    WHISPER_API const char * whisper_full_get_token_text(struct whisper_context * ctx, int i_segment, int i_token);
-    WHISPER_API whisper_token whisper_full_get_token_id (struct whisper_context * ctx, int i_segment, int i_token);
-    // Get token data for the specified token in the specified segment.
-    // This contains probabilities, timestamps, etc.
-    WHISPER_API whisper_token_data whisper_full_get_token_data(struct whisper_context * ctx, int i_segment, int i_token);
-    // Get the probability of the specified token in the specified segment.
-    WHISPER_API float whisper_full_get_token_p(struct whisper_context * ctx, int i_segment, int i_token);
-    ////////////////////////////////////////////////////////////////////////////
-    // Temporary helpers needed for exposing ggml interface
-    WHISPER_API int whisper_bench_memcpy(int n_threads);
-    WHISPER_API int whisper_bench_ggml_mul_mat(int n_threads);
-#ifdef __cplusplus
-}
-#endif
-#endif