From bad0cafee98353c18175c4591c8a3962fa45f308 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Stanis=C5=82aw=20Szymczyk?= Date: Wed, 26 Jun 2024 17:38:13 +0200 Subject: [PATCH] llama : updated llm_build_ffn() calls to new API in build_t5() --- llama.cpp | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/llama.cpp b/llama.cpp index 8d4e3d31c..41daf9a0a 100644 --- a/llama.cpp +++ b/llama.cpp @@ -12395,9 +12395,9 @@ struct llm_build_context { // T5 uses relu, flan-T5 uses gelu-gated cur = llm_build_ffn(ctx0, cur, - model.layers[il].enc_ffn_up, NULL, - model.layers[il].enc_ffn_gate, NULL, - model.layers[il].enc_ffn_down, NULL, + model.layers[il].enc_ffn_up, NULL, NULL, + model.layers[il].enc_ffn_gate, NULL, NULL, + model.layers[il].enc_ffn_down, NULL, NULL, NULL, model.layers[il].enc_ffn_gate ? LLM_FFN_GELU : LLM_FFN_RELU, model.layers[il].enc_ffn_gate ? LLM_FFN_PAR : LLM_FFN_SEQ, @@ -12573,9 +12573,9 @@ struct llm_build_context { // T5 uses relu, flan-T5 uses gelu-gated cur = llm_build_ffn(ctx0, cur, - model.layers[il].ffn_up, NULL, - model.layers[il].ffn_gate, NULL, - model.layers[il].ffn_down, NULL, + model.layers[il].ffn_up, NULL, NULL, + model.layers[il].ffn_gate, NULL, NULL, + model.layers[il].ffn_down, NULL, NULL, NULL, model.layers[il].enc_ffn_gate ? LLM_FFN_GELU : LLM_FFN_RELU, model.layers[il].enc_ffn_gate ? LLM_FFN_PAR : LLM_FFN_SEQ,