Bump tqdm from 4.66.2 to 4.66.3 #21

Closed · wants to merge 35 commits

Changes from 1 commit

Commits (35)
506d2fe
llama : expose llama_load_model_from_file_gpt4all
cebtenzzre Nov 24, 2023
88289b5
kompute : fix ggml_vk_device leaks
cebtenzzre Jan 31, 2024
3f7c4b9
kompute : fix c++11 compatibility
cebtenzzre Jan 31, 2024
9d5207b
kompute : enable Pascal GPUs
cebtenzzre Jan 31, 2024
b6891bc
llama : wrap llama_new_context_with_model in try/catch
cebtenzzre Feb 1, 2024
b80287e
kompute : add missing call to ggml_backend_kompute_device_unref
cebtenzzre Feb 1, 2024
dc7a50b
kompute : fix ggml_vk_allocate failure control flow
cebtenzzre Feb 1, 2024
c5014f6
kompute : disable GPU offload for Mixtral
cebtenzzre Feb 5, 2024
c76f5c3
kompute : do not list Intel GPUs as they are unsupported (#14)
cebtenzzre Feb 12, 2024
6ff4387
kompute : make partial tensor copies faster by syncing less data (#15)
cebtenzzre Feb 13, 2024
12dcddc
kompute : disable LLAMA_SPLIT_LAYER after ggerganov/llama.cpp#5321
cebtenzzre Feb 21, 2024
82b50e5
kompute : add gemma, phi-2, qwen2, and stablelm to whitelist
cebtenzzre Feb 21, 2024
a76f5f4
kompute : enable GPU support for 10 more model architectures
cebtenzzre Feb 22, 2024
877851b
llama : fix -Wunused-const-variable warning for non-Kompute build
cebtenzzre Feb 22, 2024
729d661
llama : expose model name and architecture via API
cebtenzzre Mar 5, 2024
2b8cb26
kompute : put device with most VRAM first, not least
cebtenzzre May 1, 2024
6e0b5d9
vulkan : make ggml_vk_instance_init static
cebtenzzre Apr 30, 2024
aea0abe
vulkan : don't filter devices by default, don't abort if none
cebtenzzre Apr 30, 2024
535c7b1
vulkan : implement ggml_vk_available_devices
cebtenzzre Apr 30, 2024
2a91dbf
vulkan : guard against multiple initialization
cebtenzzre May 1, 2024
ad1ab57
rocm : symlink source files so CUDA can be built in the same project
cebtenzzre May 2, 2024
09058b1
cuda : implement ggml_cuda_available_devices
cebtenzzre May 6, 2024
b0ccbe1
kompute : update submodule for install fix
cebtenzzre May 8, 2024
74a41c6
kompute : fix leaks in ggml_vk_current_device
cebtenzzre May 13, 2024
f10326c
kompute : fix use-after-free in ggml_vk_get_device
cebtenzzre May 20, 2024
e5c0df7
llama : replace ngl=0 hack with llama_model_using_gpu
cebtenzzre Jun 4, 2024
159235e
llama : use the correct buffer type when we choose not to load on GPU
cebtenzzre Jul 10, 2024
c301b42
kompute : update for leak fixes, cleanup changes, shaderFloat16
cebtenzzre Jul 18, 2024
7d402b3
kompute : plug a few memory leaks
cebtenzzre Jul 18, 2024
48a830c
common : Kompute supports --main-gpu, do not warn
cebtenzzre Jul 18, 2024
6e0ad3c
kompute : fix dangling references in ggml_vk_graph_kompute
cebtenzzre Jul 18, 2024
c3d5264
kompute : avoid freeing device/instance until absolutely necessary
cebtenzzre Jul 18, 2024
561d0ce
kompute : update ggml_vk_supports_op to fix false pos/neg
cebtenzzre Jul 18, 2024
cd13f44
kompute : fix missing unref on allocation failure
cebtenzzre Jul 18, 2024
3d4c558
Bump tqdm from 4.66.2 to 4.66.3
dependabot[bot] Jul 18, 2024
llama : wrap llama_new_context_with_model in try/catch
This fixes a crash where ggml_vk_allocate fails in llama_kv_cache_init,
but the exception is never caught.
cebtenzzre committed Jul 18, 2024
commit b6891bc9b3298cc53f879aa606a0e9bd96135a9c
14 changes: 13 additions & 1 deletion src/llama.cpp
@@ -18993,7 +18993,7 @@ void llama_free_model(struct llama_model * model) {
     delete model;
 }

-struct llama_context * llama_new_context_with_model(
+static struct llama_context * llama_new_context_with_model_internal(
         struct llama_model * model,
         struct llama_context_params params) {

@@ -19394,6 +19394,18 @@ struct llama_context * llama_new_context_with_model(
     return ctx;
 }

+struct llama_context * llama_new_context_with_model(
+        struct llama_model * model,
+        struct llama_context_params params
+) {
+    try {
+        return llama_new_context_with_model_internal(model, params);
+    } catch (const std::exception & err) {
+        LLAMA_LOG_ERROR("%s: failed to init context: %s\n", __func__, err.what());
+        return nullptr;
+    }
+}
+
 void llama_free(struct llama_context * ctx) {
     delete ctx;
 }
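
For context, a minimal caller-side sketch of how this change is meant to be consumed (this is not code from the PR; the model-path handling and the omission of backend setup are illustrative assumptions): after this commit, a failure inside context creation, such as ggml_vk_allocate throwing during llama_kv_cache_init, surfaces as a logged error and a nullptr return instead of an uncaught exception, so the caller checks the return value and cleans up.

// Hypothetical caller sketch (not part of this diff): checks the nullptr
// return that llama_new_context_with_model now produces on failure.
#include "llama.h"
#include <cstdio>

int main(int argc, char ** argv) {
    if (argc < 2) {
        fprintf(stderr, "usage: %s <model.gguf>\n", argv[0]);
        return 1;
    }

    // backend initialization and parameter tuning omitted for brevity
    llama_model_params mparams = llama_model_default_params();
    llama_model * model = llama_load_model_from_file(argv[1], mparams);
    if (model == nullptr) {
        fprintf(stderr, "failed to load model\n");
        return 1;
    }

    llama_context_params cparams = llama_context_default_params();
    llama_context * ctx = llama_new_context_with_model(model, cparams);
    if (ctx == nullptr) {
        // before this commit, an allocation failure here could terminate the
        // process via an uncaught exception; now it is logged by llama.cpp
        // and the caller can fail gracefully
        fprintf(stderr, "failed to create context\n");
        llama_free_model(model);
        return 1;
    }

    // ... use the context ...

    llama_free(ctx);
    llama_free_model(model);
    return 0;
}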