@@ -122,7 +122,7 @@ static uint64_t wait_for_vad(audio_async & audio, json jparams, const whisper_pa
         std::this_thread::sleep_for(milliseconds(500 - (time_now - start_time)));
         time_now = time_point_cast<milliseconds>(system_clock::now()).time_since_epoch().count();
     } else if (time_now - start_time > 1000) {
-        audio.get(time_now-start_time, pcmf32);
+        audio.get((int)(time_now-start_time), pcmf32);
         size_t max_offset = pcmf32.size() - WHISPER_SAMPLE_RATE;
         for (size_t offset = 0; offset < max_offset; offset += WHISPER_SAMPLE_RATE/10) {
             std::vector<float> audio_chunk(&pcmf32[offset], &pcmf32[offset+WHISPER_SAMPLE_RATE]);
@@ -138,17 +138,17 @@ static uint64_t wait_for_vad(audio_async & audio, json jparams, const whisper_pa
         }
     }
     size_t window_duration = std::max((uint64_t)1000, time_now-start_time);
-    audio.get(window_duration, pcmf32);
+    audio.get((int)window_duration, pcmf32);
     while (!::vad_simple(pcmf32, WHISPER_SAMPLE_RATE, 1000, params.vad_thold, params.freq_thold, params.print_energy)) {
         std::this_thread::sleep_for(milliseconds(100));
         time_now = time_point_cast<milliseconds>(system_clock::now()).time_since_epoch().count();
         window_duration = std::max((uint64_t)1000, time_now-start_time);
-        audio.get(window_duration, pcmf32);
+        audio.get((int)window_duration, pcmf32);
     }
     if (time_now - start_time > maxlength_ms) {
-        audio.get(maxlength_ms, pcmf32);
+        audio.get((int)maxlength_ms, pcmf32);
     } else {
-        audio.get(time_now - start_time, pcmf32);
+        audio.get((int)(time_now - start_time), pcmf32);
     }
 
     return time_now;
@@ -168,7 +168,7 @@ static json unguided_transcription(struct whisper_context * ctx, audio_async &au
         prompt_tokens.resize(n);
 
         wparams.prompt_tokens = prompt_tokens.data();
-        wparams.prompt_n_tokens = prompt_tokens.size();
+        wparams.prompt_n_tokens = (int)prompt_tokens.size();
     }
     wparams.print_progress = false;
     wparams.print_special = params.print_special;
@@ -184,7 +184,7 @@ static json unguided_transcription(struct whisper_context * ctx, audio_async &au
     wparams.audio_ctx = params.audio_ctx;
     wparams.suppress_nst = true;
     // run the transformer and a single decoding pass
-    if (whisper_full(ctx, wparams, pcmf32.data(), pcmf32.size()) != 0) {
+    if (whisper_full(ctx, wparams, pcmf32.data(), (int)pcmf32.size()) != 0) {
         fprintf(stderr, "%s: ERROR: whisper_full() failed\n", __func__);
         throw json{
             {"code", -32803},
@@ -224,12 +224,12 @@ static json guided_transcription(struct whisper_context * ctx, audio_async &audi
     // TODO: Do some time testing. Does an overly long prompt slow down processing?
     // Set up command sets/precompute prompts
     wparams.prompt_tokens = cs.prompt_tokens.data();
-    wparams.prompt_n_tokens = cs.prompt_tokens.size();
+    wparams.prompt_n_tokens = (int)cs.prompt_tokens.size();
     // TODO: properly expose as option
     wparams.suppress_nst = true;
 
     // run the transformer and a single decoding pass
-    if (whisper_full(ctx, wparams, pcmf32.data(), pcmf32.size()) != 0) {
+    if (whisper_full(ctx, wparams, pcmf32.data(), (int)pcmf32.size()) != 0) {
         fprintf(stderr, "%s: ERROR: whisper_full() failed\n", __func__);
         throw json{
             {"code", -32803},
@@ -322,7 +322,7 @@ static json register_commandset(struct whisper_context * ctx, json jparams, std:
     int n = whisper_tokenize(ctx, k_prompt.c_str(), cs.prompt_tokens.data(), 1024);
     cs.prompt_tokens.resize(n);
     // prepare response
-    int index = commandset_list.size();
+    int index = (int)commandset_list.size();
     commandset_list.push_back(cs);
     return json{{"index", index}};
 }
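
Note on the pattern used throughout this patch: each hunk inserts an explicit (int) cast where a uint64_t or size_t value is handed to a parameter declared as int (the duration argument of audio_async::get, the sample count of whisper_full, prompt_n_tokens), so that implicit-narrowing warnings such as -Wconversion or MSVC C4244/C4267 do not fire. The sketch below illustrates that pattern only; audio_async_get is a hypothetical stand-in, not the real whisper.cpp signature.

// Minimal, self-contained illustration of silencing a uint64_t -> int
// narrowing warning with an explicit cast (assumed names, not whisper.cpp API).
#include <cstdint>
#include <cstdio>
#include <vector>

static void audio_async_get(int ms, std::vector<float> & out) {
    // pretend to fill `out` with `ms` milliseconds of audio
    out.assign((size_t)ms * 16, 0.0f);
}

int main() {
    uint64_t start_time = 0;
    uint64_t time_now   = 1500;
    std::vector<float> pcmf32;

    // audio_async_get(time_now - start_time, pcmf32);       // warns: uint64_t -> int narrowing
    audio_async_get((int)(time_now - start_time), pcmf32);   // same value, cast makes the narrowing explicit

    printf("%zu samples\n", pcmf32.size());
    return 0;
}

The cast does not change behaviour as long as the value fits in int, which holds here because the durations are bounded by maxlength_ms and the token counts stay well below INT_MAX.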