From dffd2a710def22009cedbea2dc07e6a40dad1021 Mon Sep 17 00:00:00 2001
From: Henri Vasserman
Date: Mon, 5 Jun 2023 12:08:04 +0300
Subject: [PATCH] Increase 3B scratch buffers.

The 128 MB was too optimistic.
Too bad it is not dynamically computed.
---
 llama.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama.cpp b/llama.cpp
index 69bfdc1a107b5..a16450173453a 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -63,7 +63,7 @@ static const size_t MB = 1024*1024;
 static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0()
 {
     static std::map<e_model, size_t> k_sizes = {
-        { MODEL_3B, 128ull * MB },
+        { MODEL_3B, 256ull * MB },
         { MODEL_7B, 512ull * MB },
         { MODEL_13B, 512ull * MB },
         { MODEL_30B, 512ull * MB },
@@ -75,7 +75,7 @@ static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0()
 static const std::map<e_model, size_t> & MEM_REQ_SCRATCH1()
 {
     static std::map<e_model, size_t> k_sizes = {
-        { MODEL_3B, 128ull * MB },
+        { MODEL_3B, 256ull * MB },
         { MODEL_7B, 512ull * MB },
         { MODEL_13B, 512ull * MB },
         { MODEL_30B, 512ull * MB },