cur = ggml_add(ctx0, cur, ffn_inp);
cb(cur, "l_out", il);
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
+
// input for next layer
inpL = cur;
}
}
- inpL = ggml_add(ctx0, cur, ffn_inp);
- cb(inpL, "l_out", il);
+ cur = ggml_add(ctx0, cur, ffn_inp);
+
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
+
+ // input for next layer
+ inpL = cur;
}
cur = build_norm(inpL,
cur = ggml_add(ctx0, cur, ffn_inp);
cb(cur, "ffn_out", il);
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
+
+ // input for next layer
inpL = cur;
}
cur = ggml_add(ctx0, cur, ffn_inp);
+ // input for next layer
inpL = cur;
}
cur = inpL;
LLM_FFN_SILU, LLM_FFN_PAR, il);
cb(cur, "ffn_out", il);
}
- inpL = ggml_add(ctx0, cur, ffn_inp);
- cb(inpL, "l_out", il);
+
+ cur = ggml_add(ctx0, cur, ffn_inp);
+
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
+
+ // input for next layer
+ inpL = cur;
}
cur = build_norm(inpL,
model.output_norm,
cur = build_cvec(cur, il);
cb(cur, "l_out", il);
+ // input for next layer
inpL = cur;
}
cur = inpL;
cb(ffn_norm_out, "model.layers.{}.ffn_out", il);
cur = ggml_add(ctx0, cur, ffn_out);
+
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
}
cur = build_norm(cur, model.output_norm, NULL, LLM_NORM_RMS, -1);
cur = ggml_add(ctx0, cur, residual);
cb(cur, "ffn_residual", il);
+ // input for next layer
inpL = cur;
}
cur = build_cvec(cur, il);
cb(cur, "l_out", il);
+
+ // input for next layer
inpL = cur;
}
cur = ggml_add(ctx0, cur, ffn_residual);
cb(cur, "post_ffn", il);
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
+
// Input for next layer
inpL = cur;
}
cur = ggml_add(ctx0, cur, ffn_residual);
cb(cur, "post_moe", il);
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
+
// Input for next layer
inpL = cur;
}
cur = ggml_add(ctx0, cur, ffn_residual);
cb(cur, "post_moe", il);
+ cur = build_cvec(cur, il);
+ cb(cur, "l_out", il);
+
// Input for next layer
inpL = cur;
}
cur = ffn_out;
cur = ggml_add(ctx0, cur, ffn_inp);
+
cur = build_cvec(cur, il);
cb(cur, "l_out", il);
cb(cur, "ffn_out", il);
}
cur = ggml_add(ctx0, cur, ffn_inp);
+
cur = build_cvec(cur, il);
cb(cur, "l_out", il);
+ // input for next layer
inpL = cur;
}