llama : use aligned memory during ggml_init call from loading saved sessions (#1934)

* Fixed issue: memory is not guaranteed to be properly aligned during the ggml_init call when loading saved sessions.
* Removed the commented-out old code from the fix.
* Updated another instance of the same issue below the original.
2024-11-09 15:29:43 +00:00 · 2023-06-19 23:20:06 +08:00 · 2023-06-19 23:20:06 +08:00 · ba4e85a833
commit ba4e85a833
parent 23fc5c219a
1 changed files with 2 additions and 6 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -3126,9 +3126,7 @@ size_t llama_copy_state_data(struct llama_context * ctx, uint8_t * dst) {
        if (kv_size) {
            const size_t elt_size = ggml_element_size(kv_self.k);

-            char buffer[4096];
-
-            ggml_context * cpy_ctx = ggml_init({ sizeof(buffer), buffer, /* no_alloc */ true });
+            ggml_context * cpy_ctx = ggml_init({ 4096, NULL, /* no_alloc */ true });
            ggml_cgraph gf{};
            gf.n_threads = 1;

@@ -3234,9 +3232,7 @@ size_t llama_set_state_data(struct llama_context * ctx, uint8_t * src) {

            const size_t elt_size = ggml_element_size(kv_self.k);

-            char buffer[4096];
-
-            ggml_context * cpy_ctx = ggml_init({ sizeof(buffer), buffer, /* no_alloc */ true });
+            ggml_context * cpy_ctx = ggml_init({ 4096, NULL, /* no_alloc */ true });
            ggml_cgraph gf{};
            gf.n_threads = 1;