From 742e731e966b1b59cedad36301e32fc7613e4bce Mon Sep 17 00:00:00 2001 From: Akarshan Biswas Date: Mon, 26 May 2025 16:20:42 +0530 Subject: [PATCH] Add --reasoning_budget option --- core/src/browser/extensions/engines/AIEngine.ts | 1 + extensions/llamacpp-extension/settings.json | 13 +++++++++++++ extensions/llamacpp-extension/src/index.ts | 3 +++ 3 files changed, 17 insertions(+) diff --git a/core/src/browser/extensions/engines/AIEngine.ts b/core/src/browser/extensions/engines/AIEngine.ts index 5998fd847..3138caa95 100644 --- a/core/src/browser/extensions/engines/AIEngine.ts +++ b/core/src/browser/extensions/engines/AIEngine.ts @@ -126,6 +126,7 @@ export interface loadOptions { rope_scale?: number rope_freq_base?: number rope_freq_scale?: number + reasoning_budget?: number } export interface sessionInfo { diff --git a/extensions/llamacpp-extension/settings.json b/extensions/llamacpp-extension/settings.json index af8a42c51..9ac59a28b 100644 --- a/extensions/llamacpp-extension/settings.json +++ b/extensions/llamacpp-extension/settings.json @@ -447,5 +447,18 @@ "placeholder": "path/to/schema.json", "type": "text" } + }, + { + "key": "reasoning_budget", + "title": "Reasoning Budget", + "description": "Controls the amount of thinking allowed; currently only one of: -1 for unrestricted thinking budget, or 0 to disable thinking (default: -1).", + "controllerType": "input", + "controllerProps": { + "value": 0, + "options": [ + { "value": -1, "name": "unrestricted thinking budget" }, + { "value": 0, "name": "disable thinking" } + ] + } } ] diff --git a/extensions/llamacpp-extension/src/index.ts b/extensions/llamacpp-extension/src/index.ts index 9701e9b62..c634e85a0 100644 --- a/extensions/llamacpp-extension/src/index.ts +++ b/extensions/llamacpp-extension/src/index.ts @@ -347,6 +347,9 @@ export default class llamacpp_extension extends AIEngine { if (opts.rope_freq_scale !== undefined) { args.push('--rope-freq-scale', String(opts.rope_freq_scale)) } + if 
(opts.reasoning_budget !== undefined) { + args.push('--reasoning-budget', String(opts.reasoning_budget)) + } console.log('Calling Tauri command llama_load with args:', args) try {