llama: allocate grammar buffer based on schema length (#10649)

2025-12-21 22:33:56 +00:00 · 2025-05-10 20:57:30 +02:00
parent 69ce44b33c
commit ecf14a220f
1 changed files with 2 additions and 2 deletions
--- a/llama/llama.go
+++ b/llama/llama.go
@@ -637,8 +637,8 @@ func SchemaToGrammar(schema []byte) []byte {
 	cStr := C.CString(string(schema))
 	defer C.free(unsafe.Pointer(cStr))
-	// Allocate buffer for grammar output with reasonable size
+	// Size the grammar output buffer at 4x the schema length, capped at 1 MiB
-	const maxLen = 32768 // 32KB
+	maxLen := min(1024*1024, len(schema)*4)
 	buf := make([]byte, maxLen)
 	// Call C function to convert schema to grammar