Fix crash for 65B model with pre-allocated memory (#485)

2024-11-14 00:59:43 +00:00 · 2023-03-24 23:38:14 -05:00 · 2023-03-24 23:38:14 -05:00 · 6f1ee4b640
commit 6f1ee4b640
parent 8520fc310e
1 changed file with 1 addition and 1 deletion
--- a/llama.cpp
+++ b/llama.cpp
@@ -239,7 +239,7 @@ static bool kv_cache_init(
    const int n_mem      = n_layer*n_ctx;
    const int n_elements = n_embd*n_mem;

-    cache.buf.resize(2*n_elements*ggml_type_size(wtype) + 2u*MB);
+    cache.buf.resize(2u*n_elements*ggml_type_size(wtype) + 2u*MB);

    struct ggml_init_params params;
    params.mem_size   = cache.buf.size();