mirror of
https://github.com/k8sgpt-ai/k8sgpt.git
synced 2025-05-03 13:46:29 +00:00
fix: add maxTokens to serve mode (#1280)
Signed-off-by: samir-tahir <samirtahir91@gmail.com>
Co-authored-by: Alex Jones <alexsimonjones@gmail.com>
This commit is contained in:
parent
da266b3c82
commit
a50375c960
@@ -30,6 +30,7 @@ const (
|
|||||||
defaultTemperature float32 = 0.7
|
defaultTemperature float32 = 0.7
|
||||||
defaultTopP float32 = 1.0
|
defaultTopP float32 = 1.0
|
||||||
defaultTopK int32 = 50
|
defaultTopK int32 = 50
|
||||||
|
defaultMaxTokens int = 2048
|
||||||
)
|
)
|
||||||
|
|
||||||
var (
|
var (
|
||||||
@@ -102,6 +103,18 @@ var ServeCmd = &cobra.Command{
|
|||||||
}
|
}
|
||||||
return int32(topK)
|
return int32(topK)
|
||||||
}
|
}
|
||||||
|
// maxTokens resolves the token limit from the K8SGPT_MAX_TOKENS
// environment variable. An unset or empty variable yields
// defaultMaxTokens. A value that does not parse as a base-10 integer
// fitting in 32 bits is reported through color.Red and the process
// exits with status 1.
maxTokens := func() int {
	raw := os.Getenv("K8SGPT_MAX_TOKENS")
	if raw != "" {
		parsed, parseErr := strconv.ParseInt(raw, 10, 32)
		if parseErr != nil {
			color.Red("Unable to convert maxTokens value: %v", parseErr)
			os.Exit(1)
		}
		return int(parsed)
	}
	return defaultMaxTokens
}
|
||||||
// Check for env injection
|
// Check for env injection
|
||||||
backend = os.Getenv("K8SGPT_BACKEND")
|
backend = os.Getenv("K8SGPT_BACKEND")
|
||||||
password := os.Getenv("K8SGPT_PASSWORD")
|
password := os.Getenv("K8SGPT_PASSWORD")
|
||||||
@@ -125,6 +138,7 @@ var ServeCmd = &cobra.Command{
|
|||||||
Temperature: temperature(),
|
Temperature: temperature(),
|
||||||
TopP: topP(),
|
TopP: topP(),
|
||||||
TopK: topK(),
|
TopK: topK(),
|
||||||
|
MaxTokens: maxTokens(),
|
||||||
}
|
}
|
||||||
|
|
||||||
configAI.Providers = append(configAI.Providers, *aiProvider)
|
configAI.Providers = append(configAI.Providers, *aiProvider)
|
||||||
|
Loading…
Reference in New Issue
Block a user