From ca4ae7844d39ddb9425ef90cf5220730c54e46b0 Mon Sep 17 00:00:00 2001
From: JohannesGaessler
Date: Sun, 18 Jun 2023 14:34:52 +0200
Subject: [PATCH] Fixed incorrectly applying RMS norm twice

---
 llama.cpp | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/llama.cpp b/llama.cpp
index dfbb85a682baa..45360cea37ba5 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1657,11 +1657,7 @@ static bool llama_eval_internal(
     {
         cur = ggml_rms_norm(ctx0, inpL);
         offload_func_nr(cur);
-        ggml_set_name(cur, "rms_norm_inpL");
-
-        cur = ggml_rms_norm(ctx0, cur);
-        offload_func_nr(cur);
-        ggml_set_name(cur, "rms_norm_after");
+        ggml_set_name(cur, "rms_norm_2");
 
         // cur = cur*norm(broadcasted)
         cur = ggml_mul(ctx0, cur, model.norm);