mirror of
https://github.com/likelovewant/ollama-for-amd.git
synced 2025-12-21 22:33:56 +00:00
llama: allocate grammar buffer based on schema length (#10649)
This commit is contained in:
@@ -637,8 +637,8 @@ func SchemaToGrammar(schema []byte) []byte {
 	cStr := C.CString(string(schema))
 	defer C.free(unsafe.Pointer(cStr))
 
-	// Allocate buffer for grammar output with reasonable size
-	const maxLen = 32768 // 32KB
+	// Allocate buffer for grammar based on schema length but with upper bound
+	maxLen := min(1024*1024, len(schema)*4)
 	buf := make([]byte, maxLen)
 
 	// Call C function to convert schema to grammar
Reference in New Issue
Block a user