danbev commited on
Commit
0cae2d6
·
unverified ·
1 Parent(s): 1ee7297

whisper : remove whisper_load_backends function (#3196)

Browse files

* whisper : remove whisper_load_backends function

This commit removes the `whisper_load_backends` function, which was used
to load all GGML backends.

The motivation for this change is to push the responsibility of loading
backends to user applications, giving them more control over which
backends to load and when. See the references below for more context.

Resolves: https://github.com/ggml-org/whisper.cpp/issues/3182
Refs: https://github.com/ggml-org/whisper.cpp/pull/3042#issuecomment-2801778733
Refs: https://github.com/ggml-org/whisper.cpp/pull/3042#issuecomment-2801928990

* ruby : add check for rwc is NULL

This commit adds a check to ensure that the `rwc` pointer is not NULL
before attempting to mark its members in the garbage collector.

The motivation for this is an attempt to see if this fixes the CI build,
as I'm not able to reproduce the issue locally.

Refs: https://github.com/ggml-org/whisper.cpp/actions/runs/15299612277/job/43036694928?pr=3196

bindings/ruby/ext/ruby_whisper_params.c CHANGED
@@ -77,6 +77,8 @@ static ID id_vad_params;
77
  static void
78
  rb_whisper_callbcack_container_mark(ruby_whisper_callback_container *rwc)
79
  {
 
 
80
  rb_gc_mark(rwc->user_data);
81
  rb_gc_mark(rwc->callback);
82
  rb_gc_mark(rwc->callbacks);
 
77
  static void
78
  rb_whisper_callbcack_container_mark(ruby_whisper_callback_container *rwc)
79
  {
80
+ if (rwc == NULL) return;
81
+
82
  rb_gc_mark(rwc->user_data);
83
  rb_gc_mark(rwc->callback);
84
  rb_gc_mark(rwc->callbacks);
examples/bench/bench.cpp CHANGED
@@ -156,6 +156,8 @@ static int whisper_bench_full(const whisper_params & params) {
156
  }
157
 
158
  int main(int argc, char ** argv) {
 
 
159
  whisper_params params;
160
 
161
  if (whisper_params_parse(argc, argv, params) == false) {
 
156
  }
157
 
158
  int main(int argc, char ** argv) {
159
+ ggml_backend_load_all();
160
+
161
  whisper_params params;
162
 
163
  if (whisper_params_parse(argc, argv, params) == false) {
examples/cli/cli.cpp CHANGED
@@ -909,6 +909,8 @@ static void output_lrc(struct whisper_context * ctx, std::ofstream & fout, const
909
  static void cb_log_disable(enum ggml_log_level , const char * , void * ) { }
910
 
911
  int main(int argc, char ** argv) {
 
 
912
  #if defined(_WIN32)
913
  // Set the console output code page to UTF-8, while command line arguments
914
  // are still encoded in the system's code page. In this way, we can print
@@ -988,7 +990,6 @@ int main(int argc, char ** argv) {
988
  }
989
 
990
  // whisper init
991
-
992
  struct whisper_context_params cparams = whisper_context_default_params();
993
 
994
  cparams.use_gpu = params.use_gpu;
 
909
  static void cb_log_disable(enum ggml_log_level , const char * , void * ) { }
910
 
911
  int main(int argc, char ** argv) {
912
+ ggml_backend_load_all();
913
+
914
  #if defined(_WIN32)
915
  // Set the console output code page to UTF-8, while command line arguments
916
  // are still encoded in the system's code page. In this way, we can print
 
990
  }
991
 
992
  // whisper init
 
993
  struct whisper_context_params cparams = whisper_context_default_params();
994
 
995
  cparams.use_gpu = params.use_gpu;
examples/command/command.cpp CHANGED
@@ -678,6 +678,8 @@ static int process_general_transcription(struct whisper_context * ctx, audio_asy
678
  }
679
 
680
  int main(int argc, char ** argv) {
 
 
681
  whisper_params params;
682
 
683
  if (whisper_params_parse(argc, argv, params) == false) {
 
678
  }
679
 
680
  int main(int argc, char ** argv) {
681
+ ggml_backend_load_all();
682
+
683
  whisper_params params;
684
 
685
  if (whisper_params_parse(argc, argv, params) == false) {
examples/lsp/lsp.cpp CHANGED
@@ -424,6 +424,8 @@ static void process_loop(struct whisper_context * ctx, audio_async &audio, const
424
  }
425
 
426
  int main(int argc, char ** argv) {
 
 
427
  whisper_params params;
428
  if (whisper_params_parse(argc, argv, params) == false) {
429
  return 1;
 
424
  }
425
 
426
  int main(int argc, char ** argv) {
427
+ ggml_backend_load_all();
428
+
429
  whisper_params params;
430
  if (whisper_params_parse(argc, argv, params) == false) {
431
  return 1;
examples/quantize/quantize.cpp CHANGED
@@ -1,4 +1,5 @@
1
  #include "ggml.h"
 
2
 
3
  #include "common.h"
4
  #include "common-ggml.h"
@@ -176,6 +177,8 @@ static bool whisper_model_quantize(const std::string & fname_inp, const std::str
176
  }
177
 
178
  int main(int argc, char ** argv) {
 
 
179
  if (argc != 4) {
180
  fprintf(stderr, "usage: %s model-f32.bin model-quant.bin type\n", argv[0]);
181
  ggml_print_ftypes(stderr);
 
1
  #include "ggml.h"
2
+ #include "ggml-backend.h"
3
 
4
  #include "common.h"
5
  #include "common-ggml.h"
 
177
  }
178
 
179
  int main(int argc, char ** argv) {
180
+ ggml_backend_load_all();
181
+
182
  if (argc != 4) {
183
  fprintf(stderr, "usage: %s model-f32.bin model-quant.bin type\n", argv[0]);
184
  ggml_print_ftypes(stderr);
examples/server/server.cpp CHANGED
@@ -516,6 +516,8 @@ void get_req_parameters(const Request & req, whisper_params & params)
516
  } // namespace
517
 
518
  int main(int argc, char ** argv) {
 
 
519
  whisper_params params;
520
  server_params sparams;
521
 
 
516
  } // namespace
517
 
518
  int main(int argc, char ** argv) {
519
+ ggml_backend_load_all();
520
+
521
  whisper_params params;
522
  server_params sparams;
523
 
examples/stream/stream.cpp CHANGED
@@ -116,6 +116,8 @@ void whisper_print_usage(int /*argc*/, char ** argv, const whisper_params & para
116
  }
117
 
118
  int main(int argc, char ** argv) {
 
 
119
  whisper_params params;
120
 
121
  if (whisper_params_parse(argc, argv, params) == false) {
 
116
  }
117
 
118
  int main(int argc, char ** argv) {
119
+ ggml_backend_load_all();
120
+
121
  whisper_params params;
122
 
123
  if (whisper_params_parse(argc, argv, params) == false) {
examples/talk-llama/talk-llama.cpp CHANGED
@@ -291,6 +291,8 @@ The transcript only includes text, it does not include markup like HTML and Mark
291
  {0}{4})";
292
 
293
  int main(int argc, char ** argv) {
 
 
294
  whisper_params params;
295
 
296
  if (whisper_params_parse(argc, argv, params) == false) {
 
291
  {0}{4})";
292
 
293
  int main(int argc, char ** argv) {
294
+ ggml_backend_load_all();
295
+
296
  whisper_params params;
297
 
298
  if (whisper_params_parse(argc, argv, params) == false) {
examples/vad-speech-segments/speech.cpp CHANGED
@@ -83,6 +83,8 @@ static bool vad_params_parse(int argc, char ** argv, cli_params & params) {
83
  static void cb_log_disable(enum ggml_log_level , const char * , void * ) { }
84
 
85
  int main(int argc, char ** argv) {
 
 
86
  cli_params cli_params;
87
 
88
  if (!vad_params_parse(argc, argv, cli_params)) {
 
83
  static void cb_log_disable(enum ggml_log_level , const char * , void * ) { }
84
 
85
  int main(int argc, char ** argv) {
86
+ ggml_backend_load_all();
87
+
88
  cli_params cli_params;
89
 
90
  if (!vad_params_parse(argc, argv, cli_params)) {
examples/wchess/wchess.cmd/wchess.cmd.cpp CHANGED
@@ -168,6 +168,8 @@ bool get_audio(std::vector<float> & pcmf32_cur) {
168
  }
169
 
170
  int main(int argc, char ** argv) {
 
 
171
  whisper_params params;
172
 
173
  if (whisper_params_parse(argc, argv, params) == false) {
 
168
  }
169
 
170
  int main(int argc, char ** argv) {
171
+ ggml_backend_load_all();
172
+
173
  whisper_params params;
174
 
175
  if (whisper_params_parse(argc, argv, params) == false) {
src/whisper.cpp CHANGED
@@ -206,15 +206,6 @@ static bool ggml_graph_compute_helper(
206
  return t;
207
  }
208
 
209
- static void whisper_load_backends() {
210
- #ifdef GGML_BACKEND_DL
211
- static std::once_flag flag;
212
- std::call_once(flag, []() {
213
- ggml_backend_load_all();
214
- });
215
- #endif
216
- }
217
-
218
  // TODO: move these functions to ggml-base with support for ggml-backend?
219
 
220
  static ggml_tensor * whisper_set_f32(struct ggml_tensor * t, float v) {
@@ -1322,8 +1313,6 @@ static size_t aheads_masks_nbytes(struct whisper_aheads_masks & aheads_masks) {
1322
  static ggml_backend_t whisper_backend_init_gpu(const whisper_context_params & params) {
1323
  ggml_log_set(g_state.log_callback, g_state.log_callback_user_data);
1324
 
1325
- whisper_load_backends();
1326
-
1327
  ggml_backend_dev_t dev = nullptr;
1328
 
1329
  int cnt = 0;
@@ -4335,8 +4324,6 @@ static int whisper_has_openvino(void) {
4335
  const char * whisper_print_system_info(void) {
4336
  static std::string s;
4337
 
4338
- whisper_load_backends();
4339
-
4340
  s = "";
4341
  s += "WHISPER : ";
4342
  s += "COREML = " + std::to_string(whisper_has_coreml()) + " | ";
@@ -8154,8 +8141,6 @@ WHISPER_API int whisper_bench_ggml_mul_mat(int n_threads) {
8154
  }
8155
 
8156
  WHISPER_API const char * whisper_bench_ggml_mul_mat_str(int n_threads) {
8157
- whisper_load_backends();
8158
-
8159
  static std::string s;
8160
  s = "";
8161
  char strbuf[256];
 
206
  return t;
207
  }
208
 
 
 
 
 
 
 
 
 
 
209
  // TODO: move these functions to ggml-base with support for ggml-backend?
210
 
211
  static ggml_tensor * whisper_set_f32(struct ggml_tensor * t, float v) {
 
1313
  static ggml_backend_t whisper_backend_init_gpu(const whisper_context_params & params) {
1314
  ggml_log_set(g_state.log_callback, g_state.log_callback_user_data);
1315
 
 
 
1316
  ggml_backend_dev_t dev = nullptr;
1317
 
1318
  int cnt = 0;
 
4324
  const char * whisper_print_system_info(void) {
4325
  static std::string s;
4326
 
 
 
4327
  s = "";
4328
  s += "WHISPER : ";
4329
  s += "COREML = " + std::to_string(whisper_has_coreml()) + " | ";
 
8141
  }
8142
 
8143
  WHISPER_API const char * whisper_bench_ggml_mul_mat_str(int n_threads) {
 
 
8144
  static std::string s;
8145
  s = "";
8146
  char strbuf[256];