batch: use tensors for outputs (#12185)

This cleans up the model interface slightly, without much impact on other areas.
2025-12-22 06:43:57 +00:00 · 2025-09-15 14:33:06 -07:00
parent 92b96d54ef
commit 6f7117145f
14 changed files with 27 additions and 37 deletions
--- a/model/models/llama/model.go
+++ b/model/models/llama/model.go
@@ -160,7 +160,7 @@ func (m *Model) Forward(ctx ml.Context, batch input.Batch) (ml.Tensor, error) {

 		var outputs ml.Tensor
 		if i == len(m.Layers)-1 {
-			outputs = ctx.Input().FromIntSlice(batch.Outputs, len(batch.Outputs))
+			outputs = batch.Outputs
 		}

 		hiddenState = layer.Forward(ctx, hiddenState, positions, outputs, m.Cache, m.Options)