mirror of
https://github.com/likelovewant/ollama-for-amd.git
synced 2025-12-21 22:33:56 +00:00
comment split
This commit is contained in:
committed by
Michael Yang
parent
e0cd511661
commit
629db9dc43
@@ -86,6 +86,8 @@ func (m *gptossModel) Tensors(ts []Tensor) []*ggml.Tensor {
|
|||||||
mxfp4s[name].scales = t
|
mxfp4s[name].scales = t
|
||||||
}
|
}
|
||||||
} else if strings.HasSuffix(t.Name(), "gate_up_exps.bias") {
|
} else if strings.HasSuffix(t.Name(), "gate_up_exps.bias") {
|
||||||
|
// gate_up_exps is interleaved, so it needs to be split into gate_exps and up_exps
|
||||||
|
// e.g. gate_exps, up_exps = gate_up_exps[:, 0::2, ...], gate_up_exps[:, 1::2, ...]
|
||||||
out = append(out, slices.Collect(splitDim(t, 1,
|
out = append(out, slices.Collect(splitDim(t, 1,
|
||||||
split{
|
split{
|
||||||
Replacer: strings.NewReplacer("gate_up_exps", "gate_exps"),
|
Replacer: strings.NewReplacer("gate_up_exps", "gate_exps"),
|
||||||
@@ -116,6 +118,8 @@ func (m *gptossModel) Tensors(ts []Tensor) []*ggml.Tensor {
|
|||||||
WriterTo: mxfp4,
|
WriterTo: mxfp4,
|
||||||
})
|
})
|
||||||
} else if strings.Contains(name, "ffn_gate_up_exps") {
|
} else if strings.Contains(name, "ffn_gate_up_exps") {
|
||||||
|
// gate_up_exps is interleaved, so it needs to be split into gate_exps and up_exps
|
||||||
|
// e.g. gate_exps, up_exps = gate_up_exps[:, 0::2, ...], gate_up_exps[:, 1::2, ...]
|
||||||
out = append(out, &ggml.Tensor{
|
out = append(out, &ggml.Tensor{
|
||||||
Name: strings.Replace(name, "gate_up", "gate", 1) + ".weight",
|
Name: strings.Replace(name, "gate_up", "gate", 1) + ".weight",
|
||||||
Kind: uint32(ggml.TensorTypeMXFP4),
|
Kind: uint32(ggml.TensorTypeMXFP4),
|
||||||
|
|||||||
Reference in New Issue
Block a user