From 7967919cc90ef6d1318e3527173b15c1864090ba Mon Sep 17 00:00:00 2001 From: shatfield4 Date: Wed, 30 Apr 2025 16:16:18 -0700 Subject: [PATCH] add option to control koboldcpp max response tokens --- .../LLMSelection/KoboldCPPOptions/index.jsx | 27 +++++++++++++++++++ server/.env.example | 1 + server/models/systemSettings.js | 1 + server/utils/AiProviders/koboldCPP/index.js | 3 +++ server/utils/helpers/updateENV.js | 4 +++ 5 files changed, 36 insertions(+) diff --git a/frontend/src/components/LLMSelection/KoboldCPPOptions/index.jsx b/frontend/src/components/LLMSelection/KoboldCPPOptions/index.jsx index ac4db91aae5..0c774112fc6 100644 --- a/frontend/src/components/LLMSelection/KoboldCPPOptions/index.jsx +++ b/frontend/src/components/LLMSelection/KoboldCPPOptions/index.jsx @@ -22,11 +22,18 @@ export default function KoboldCPPOptions({ settings }) { const [tokenLimit, setTokenLimit] = useState( settings?.KoboldCPPTokenLimit || 4096 ); + const [maxTokens, setMaxTokens] = useState( + settings?.KoboldCPPMaxTokens || 2048 + ); const handleTokenLimitChange = (e) => { setTokenLimit(Number(e.target.value)); }; + const handleMaxTokensChange = (e) => { + setMaxTokens(Number(e.target.value)); + }; + return (
@@ -54,6 +61,26 @@ export default function KoboldCPPOptions({ settings }) { Maximum number of tokens for context and response.

+
+ + e.target.blur()} + required={true} + autoComplete="off" + /> +

+ Maximum number of tokens for the response. +

+