llama/parsers/renderers: nemotron 3 nano (#13489)

---------

Co-authored-by: Daniel Hiltgen <daniel@ollama.com>
2025-12-24 07:28:27 +00:00 · 2025-12-15 18:00:08 -08:00
parent 7b95087b9d
commit 7e3ea813c1
13 changed files with 2364 additions and 15 deletions
--- a/llama/llama.cpp/src/llama-graph.cpp
+++ b/llama/llama.cpp/src/llama-graph.cpp
@@ -1089,6 +1089,16 @@ ggml_tensor * llm_graph_context::build_moe_ffn(
                cur = ggml_relu(ctx0, cur);
                cb(cur, "ffn_moe_relu", il);
            } break;
+        case LLM_FFN_RELU_SQR:
+            if (gate_exps) {
+                // TODO: add support for gated squared relu
+                GGML_ABORT("fatal error: gated squared relu not implemented");
+            } else {
+                cur = ggml_relu(ctx0, cur);
+                cur = ggml_sqr(ctx0, cur);
+                cb(cur, "ffn_moe_relu_sqr", il);
+            }
+            break;
        default:
            GGML_ABORT("fatal error");
    }