use split activations when possible (#12293)

* use ggml_*_split activations when possible
* forward qkv
2025-12-23 23:18:26 +00:00 · 2025-09-16 09:51:19 -07:00
parent c253433d68
commit ad95d5b30b
16 changed files with 59 additions and 50 deletions
--- a/model/models/qwen2/model.go
+++ b/model/models/qwen2/model.go
@@ -59,7 +59,7 @@ type MLP struct {
 }

 func (mlp MLP) Forward(ctx ml.Context, hiddenStates ml.Tensor) ml.Tensor {
-	hiddenStates = mlp.Gate.Forward(ctx, hiddenStates).SILU(ctx).Mul(ctx, mlp.Up.Forward(ctx, hiddenStates))
+	hiddenStates = mlp.Gate.Forward(ctx, hiddenStates).SILU(ctx, mlp.Up.Forward(ctx, hiddenStates))
 	return mlp.Down.Forward(ctx, hiddenStates)
 }