diff --git a/llama.cpp b/llama.cpp index fde4d25..7de3c19 100644 --- a/llama.cpp +++ b/llama.cpp @@ -9,6 +9,7 @@ #include #include #include +#include // determine number of model parts based on the dimension static const std::unordered_map LLAMA_N_PARTS = {