From 9e4f8b4acc387f3c0f0cdb62c2582dc01a67caad Mon Sep 17 00:00:00 2001
From: Adam Treat
Date: Tue, 26 Sep 2023 11:58:39 -0400
Subject: [PATCH] Upload immediately to device.

---
 llama.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/llama.cpp b/llama.cpp
index e8ca52d5f..1432696bd 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -2787,7 +2787,7 @@ static struct ggml_cgraph * llm_build_llama(
     ggml_free(ctx0);
 
 #if defined(GGML_USE_KOMPUTE)
-    if (lctx.ctx_kompute && N == 1) {
+    if (lctx.ctx_kompute) {
         if (!ggml_vk_has_h2d_all(lctx.ctx_kompute)) {
             ggml_vk_h2d_all(lctx.ctx_kompute);
         } else {