From 5220a991a5e92bddad9542267ab445a2c033681c Mon Sep 17 00:00:00 2001
From: Henri Vasserman
Date: Mon, 5 Jun 2023 13:43:08 +0300
Subject: Increase 3B scratch buffers. (#1698)

The 128 MB was too optimistic.
Too bad it is not dynamically computed.
---
 llama.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama.cpp b/llama.cpp
index 69bfdc1..a164501 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -63,7 +63,7 @@ static const size_t MB = 1024*1024;
 static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0()
 {
     static std::map<e_model, size_t> k_sizes = {
-        { MODEL_3B, 128ull * MB },
+        { MODEL_3B, 256ull * MB },
         { MODEL_7B, 512ull * MB },
         { MODEL_13B, 512ull * MB },
         { MODEL_30B, 512ull * MB },
@@ -75,7 +75,7 @@ static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0()
 static const std::map<e_model, size_t> & MEM_REQ_SCRATCH1()
 {
     static std::map<e_model, size_t> k_sizes = {
-        { MODEL_3B, 128ull * MB },
+        { MODEL_3B, 256ull * MB },
         { MODEL_7B, 512ull * MB },
         { MODEL_13B, 512ull * MB },
         { MODEL_30B, 512ull * MB },
-- 
cgit v1.2.3