From f3648fd20607f92f5fcf65ef7d7b52d919ae4909 Mon Sep 17 00:00:00 2001 From: Bruce MacDonald Date: Tue, 17 Oct 2023 16:55:16 -0400 Subject: [PATCH] Update llama.cpp gguf to latest (#710) --- llm/llama.cpp/gguf | 2 +- .../patches/0001-remove-warm-up-logging.patch | 18 +++++++++--------- 2 files changed, 10 insertions(+), 10 deletions(-) diff --git a/llm/llama.cpp/gguf b/llm/llama.cpp/gguf index bc9d3e39..40e5ce05 160000 --- a/llm/llama.cpp/gguf +++ b/llm/llama.cpp/gguf @@ -1 +1 @@ -Subproject commit bc9d3e3971e5607a10ff4c24e39568ce1ac87271 +Subproject commit 40e5ce054f4c4fa555e4510ea5f760bb29185332 diff --git a/llm/llama.cpp/patches/0001-remove-warm-up-logging.patch b/llm/llama.cpp/patches/0001-remove-warm-up-logging.patch index 04aa4802..662b651e 100644 --- a/llm/llama.cpp/patches/0001-remove-warm-up-logging.patch +++ b/llm/llama.cpp/patches/0001-remove-warm-up-logging.patch @@ -1,6 +1,6 @@ -From 07993bdc35345b67b27aa649a7c099ad42d80c4c Mon Sep 17 00:00:00 2001 -From: Michael Yang -Date: Thu, 21 Sep 2023 14:43:21 -0700 +From 8dbb5449db259a9c24796e7927d89bee98b6c8f5 Mon Sep 17 00:00:00 2001 +From: Bruce MacDonald +Date: Thu, 5 Oct 2023 11:21:12 -0400 Subject: [PATCH] remove warm up logging --- @@ -8,18 +8,18 @@ Subject: [PATCH] remove warm up logging 1 file changed, 2 deletions(-) diff --git a/common/common.cpp b/common/common.cpp -index 2597ba0..b56549b 100644 +index 7370017..c4433fe 100644 --- a/common/common.cpp +++ b/common/common.cpp -@@ -780,8 +780,6 @@ std::tuple llama_init_from_gpt_par +@@ -839,8 +839,6 @@ std::tuple llama_init_from_gpt_par } { - LOG("warming up the model with an empty run\n"); - - const std::vector tmp = { llama_token_bos(lctx), llama_token_eos(lctx), }; - llama_eval(lctx, tmp.data(), std::min(tmp.size(), (size_t) params.n_batch), 0, params.n_threads); - llama_reset_timings(lctx); + std::vector tmp = { llama_token_bos(lctx), llama_token_eos(lctx), }; + llama_decode(lctx, llama_batch_get_one(tmp.data(), std::min(tmp.size(), (size_t) params.n_batch), 0, 0)); + llama_kv_cache_tokens_rm(lctx, -1, -1); -- -2.42.0 +2.39.2 (Apple Git-143)