aboutsummaryrefslogtreecommitdiff
path: root/llama.cpp
diff options
context:
space:
mode:
author Johannes Gäßler <johannesg@5d6.de> 2023-06-18 16:07:09 +0200
committer GitHub <noreply@github.com> 2023-06-18 16:07:09 +0200
commit 0ede372a51fd8160688e01b587582666c14e94e5 (patch)
tree c76fb86ae1ad41003a6350c92006712d62a0ba3b /llama.cpp
parent 8596af427722775f0df4a7c90b9af067ba90d4ef (diff)
Fixed incorrectly applying RMS norm twice (#1925)
Diffstat (limited to 'llama.cpp')
-rw-r--r-- llama.cpp 6
1 files changed, 1 insertions, 5 deletions
diff --git a/llama.cpp b/llama.cpp
index dfbb85a..45360ce 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1657,11 +1657,7 @@ static bool llama_eval_internal(
{
cur = ggml_rms_norm(ctx0, inpL);
offload_func_nr(cur);
- ggml_set_name(cur, "rms_norm_inpL");
-
- cur = ggml_rms_norm(ctx0, cur);
- offload_func_nr(cur);
- ggml_set_name(cur, "rms_norm_after");
+ ggml_set_name(cur, "rms_norm_2");
// cur = cur*norm(broadcasted)
cur = ggml_mul(ctx0, cur, model.norm);