From 957c8ae21d1e7052ea45a40ee8c0407b909e90cc Mon Sep 17 00:00:00 2001
From: Georgi Gerganov
Date: Mon, 24 Apr 2023 18:47:03 +0300
Subject: [PATCH] llama : increase scratch buffer size for 65B (ref #1152)

Temporary solution
---
 llama.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama.cpp b/llama.cpp
index bc0ef12..28d2791 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -54,7 +54,7 @@ static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0()
         { MODEL_7B, 512ull * MB },
         { MODEL_13B, 512ull * MB },
         { MODEL_30B, 512ull * MB },
-        { MODEL_65B, 512ull * MB },
+        { MODEL_65B, 1024ull * MB },
     };
     return _MEM_REQ_SCRATCH0;
 }
@@ -65,7 +65,7 @@ static const std::map<e_model, size_t> & MEM_REQ_SCRATCH1()
         { MODEL_7B, 512ull * MB },
         { MODEL_13B, 512ull * MB },
         { MODEL_30B, 512ull * MB },
-        { MODEL_65B, 512ull * MB },
+        { MODEL_65B, 1024ull * MB },
     };
     return _MEM_REQ_SCRATCH1;
 }