fix: reduce context length to avoid token overflow

feiskyer · feiskyer · commit b4bcc4b621fd · 2025-03-13T16:41:03.000+08:00
diff --git a/README.md b/README.md
@@ -83,6 +83,7 @@ For Ollama or other OpenAI compatible LLMs, set the following environment variab
 
 - `OPENAI_API_KEY=<your-api-key>`
 - `OPENAI_API_BASE='http://localhost:11434/v1'` (or your own base URL)
+
 </details>
 
 ## Key Features
@@ -100,8 +101,8 @@ Usage:
 
 Flags:
   -h, --help               help for analyze
-      --name string        Resource name
-  -n, --namespace string   Resource namespace (default "default")
+  -n, --name string        Resource name
+  -s, --namespace string   Resource namespace (default "default")
   -r, --resource string    Resource type (default "pod")
 
 Global Flags:
@@ -111,6 +112,7 @@ Global Flags:
   -m, --model string         OpenAI model to use (default "gpt-4o")
   -v, --verbose              Enable verbose output
 ```
+
 </details>
 
 <details>
@@ -126,8 +128,8 @@ Usage:
 
 Flags:
   -h, --help               help for audit
-      --name string        Pod name
-  -n, --namespace string   Pod namespace (default "default")
+  -n, --name string        Pod name
+  -s, --namespace string   Pod namespace (default "default")
 
 Global Flags:
   -c, --count-tokens         Print tokens count
@@ -136,6 +138,7 @@ Global Flags:
   -m, --model string         OpenAI model to use (default "gpt-4o")
   -v, --verbose              Enable verbose output
 ```
+
 </details>
 
 
@@ -152,8 +155,8 @@ Usage:
 
 Flags:
   -h, --help               help for diagnose
-      --name string        Pod name
-  -n, --namespace string   Pod namespace (default "default")
+  -n, --name string        Pod name
+  -s, --namespace string   Pod namespace (default "default")
 
 Global Flags:
   -c, --count-tokens         Print tokens count
@@ -162,6 +165,7 @@ Global Flags:
   -m, --model string         OpenAI model to use (default "gpt-4o")
   -v, --verbose              Enable verbose output
 ```
+
 </details>
 
 <details>
@@ -178,7 +182,7 @@ Usage:
 
 Flags:
   -h, --help                  help for execute
-      --instructions string   instructions to execute
+  -i, --instructions string   instructions to execute
 
 Global Flags:
   -c, --count-tokens         Print tokens count
@@ -187,6 +191,7 @@ Global Flags:
   -m, --model string         OpenAI model to use (default "gpt-4o")
   -v, --verbose              Enable verbose output
 ```
+
 </details>
 
 <details>
@@ -213,6 +218,7 @@ Global Flags:
   -m, --model string         OpenAI model to use (default "gpt-4o")
   -v, --verbose              Enable verbose output
 ```
+
 </details>
 
 ## Integrations
diff --git a/cmd/kube-copilot/analyze.go b/cmd/kube-copilot/analyze.go
@@ -30,8 +30,8 @@ var analysisNamespace string
 var analysisResource string
 
 func init() {
-	analyzeCmd.PersistentFlags().StringVarP(&analysisName, "name", "", "", "Resource name")
-	analyzeCmd.PersistentFlags().StringVarP(&analysisNamespace, "namespace", "n", "default", "Resource namespace")
+	analyzeCmd.PersistentFlags().StringVarP(&analysisName, "name", "n", "", "Resource name")
+	analyzeCmd.PersistentFlags().StringVarP(&analysisNamespace, "namespace", "s", "default", "Resource namespace")
 	analyzeCmd.PersistentFlags().StringVarP(&analysisResource, "resource", "r", "pod", "Resource type")
 	analyzeCmd.MarkFlagRequired("name")
 }
diff --git a/cmd/kube-copilot/audit.go b/cmd/kube-copilot/audit.go
@@ -30,8 +30,8 @@ var (
 )
 
 func init() {
-	auditCmd.PersistentFlags().StringVarP(&auditName, "name", "", "", "Pod name")
-	auditCmd.PersistentFlags().StringVarP(&auditNamespace, "namespace", "n", "default", "Pod namespace")
+	auditCmd.PersistentFlags().StringVarP(&auditName, "name", "n", "", "Pod name")
+	auditCmd.PersistentFlags().StringVarP(&auditNamespace, "namespace", "s", "default", "Pod namespace")
 	auditCmd.MarkFlagRequired("name")
 }
 
diff --git a/cmd/kube-copilot/diagnose.go b/cmd/kube-copilot/diagnose.go
@@ -27,8 +27,8 @@ var diagnoseName string
 var diagnoseNamespace string
 
 func init() {
-	diagnoseCmd.PersistentFlags().StringVarP(&diagnoseName, "name", "", "", "Pod name")
-	diagnoseCmd.PersistentFlags().StringVarP(&diagnoseNamespace, "namespace", "n", "default", "Pod namespace")
+	diagnoseCmd.PersistentFlags().StringVarP(&diagnoseName, "name", "n", "", "Pod name")
+	diagnoseCmd.PersistentFlags().StringVarP(&diagnoseNamespace, "namespace", "s", "default", "Pod namespace")
 	diagnoseCmd.MarkFlagRequired("name")
 }
 
diff --git a/cmd/kube-copilot/execute.go b/cmd/kube-copilot/execute.go
@@ -30,7 +30,7 @@ var instructions string
 func init() {
 	tools.CopilotTools["trivy"] = tools.Trivy
 
-	executeCmd.PersistentFlags().StringVarP(&instructions, "instructions", "", "", "instructions to execute")
+	executeCmd.PersistentFlags().StringVarP(&instructions, "instructions", "i", "", "instructions to execute")
 	executeCmd.MarkFlagRequired("instructions")
 }
 
diff --git a/cmd/kube-copilot/version.go b/cmd/kube-copilot/version.go
@@ -23,7 +23,7 @@ import (
 
 const (
 	// VERSION is the version of kube-copilot.
-	VERSION = "v0.6.5"
+	VERSION = "v0.6.6"
 )
 
 var versionCmd = &cobra.Command{
diff --git a/pkg/tools/kubectl.go b/pkg/tools/kubectl.go
@@ -16,6 +16,7 @@ limitations under the License.
 package tools
 
 import (
+	"errors"
 	"os/exec"
 	"strings"
 )
@@ -26,8 +27,11 @@ func Kubectl(command string) (string, error) {
 		command = strings.TrimSpace(strings.TrimPrefix(command, "kubectl"))
 	}
 
-	cmd := exec.Command("kubectl", strings.Split(command, " ")...)
+	if strings.HasPrefix(command, "edit") {
+		return "", errors.New("interactive command kubectl edit is not supported")
+	}
 
+	cmd := exec.Command("kubectl", strings.Split(command, " ")...)
 	output, err := cmd.CombinedOutput()
 	if err != nil {
 		return strings.TrimSpace(string(output)), err
diff --git a/pkg/workflows/prompts.go b/pkg/workflows/prompts.go
@@ -0,0 +1,160 @@
+/*
+Copyright 2023 - Present, Pengfei Ni
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+	http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+package workflows
+
+const outputPrompt = `
+# Output Format
+
+Your final output must strictly adhere to this JSON structure:
+
+{
+  "question": "<input question>",
+  "thought": "<your detailed thought process>",
+  "steps": [
+    {
+      "name": "<descriptive name of step 1>",
+      "description": "<detailed description of what this step will do>",
+      "action": {
+        "name": "<tool to call for current step: kubectl, python, or trivy>",
+        "input": "<exact command or script with all required context>"
+      },
+      "status": "<one of: pending, in_progress, completed, failed>",
+      "observation": "<result from the tool call of the action, to be filled in after action execution>"
+    },
+    {
+      "name": "<descriptive name of step 2>",
+      "description": "<detailed description of what this step will do>",
+      "action": {
+        "name": "<tool to call for current step: kubectl, python, or trivy>",
+        "input": "<exact command or script with all required context>"
+      },
+      "observation": "<result from the tool call of the action, to be filled in after action execution>",
+      "status": "<status of this step>"
+    },
+    ...more steps...
+  ],
+  "current_step_index": <index of the current step being executed, zero-based>,
+  "final_answer": "<your final findings; only fill this when no further actions are required>"
+}
+
+# Important:
+- Always use function calls via the 'action' field for tool invocations. NEVER output plain text instructions for the user to run a command manually.
+- Ensure that the chain-of-thought (fields 'thought' and 'steps') is clear and concise, leading logically to the tool call if needed.
+- The final answer should only be provided when all necessary tool invocations have been completed and the issue is fully resolved.
+- The 'steps' array should contain ALL steps needed to solve the problem, with appropriate status updates as you progress (simulated data shouldn't be used here).
+- NEVER remove steps from the 'steps' array once added, only update their status.
+- Initial step statuses should be "pending", change to "in_progress" when starting a step, and then "completed" or "failed" when done.
+`
+
+const kubectlManual = `
+
+# Kubectl manual
+
+kubectl get services                          # List all services in the namespace
+kubectl get pods --all-namespaces             # List all pods in all namespaces
+kubectl get pods -o wide                      # List all pods in the current namespace, with more details
+kubectl get deployment my-dep                 # List a particular deployment
+kubectl get pods                              # List all pods in the namespace
+kubectl get pod my-pod -o yaml                # Get a pod's YAML
+
+// List pods Sorted by Restart Count
+kubectl get pods --sort-by='.status.containerStatuses[0].restartCount'
+// List PersistentVolumes sorted by capacity
+kubectl get pv --sort-by=.spec.capacity.storage
+// List all warning events
+kubectl events --types=Warning
+// All images running in a cluster
+kubectl get pods -A -o=custom-columns='DATA:spec.containers[*].image'
+// All images running in namespace: default, grouped by Pod
+kubectl get pods --namespace default --output=custom-columns="NAME:.metadata.name,IMAGE:.spec.containers[*].image"
+// dump Pod logs for a Deployment (single-container case)
+kubectl logs deploy/my-deployment
+// dump Pod logs for a Deployment (multi-container case)
+kubectl logs deploy/my-deployment -c my-container
+// dump pod logs (stdout, DO NOT USE -f)
+kubectl logs my-pod
+// dump pod container logs (stdout, multi-container case, DO NOT USE -f)
+kubectl logs my-pod -c my-container
+// Partially update a node
+kubectl patch node k8s-node-1 -p '{"spec":{"unschedulable":true}}'
+// Update a container's image; spec.containers[*].name is required because it's a merge key
+kubectl patch pod valid-pod -p '{"spec":{"containers":[{"name":"kubernetes-serve-hostname","image":"new image"}]}}'
+// Update a container's image using a json patch with positional arrays
+kubectl patch pod valid-pod --type='json' -p='[{"op": "replace", "path": "/spec/containers/0/image", "value":"new image"}]'
+// Disable a deployment livenessProbe using a json patch with positional arrays
+kubectl patch deployment valid-deployment  --type json   -p='[{"op": "remove", "path": "/spec/template/spec/containers/0/livenessProbe"}]'
+// Add a new element to a positional array
+kubectl patch sa default --type='json' -p='[{"op": "add", "path": "/secrets/1", "value": {"name": "whatever" } }]'
+// Update a deployment's replica count by patching its scale subresource
+kubectl patch deployment nginx-deployment --subresource='scale' --type='merge' -p '{"spec":{"replicas":2}}'
+// Rolling update "www" containers of "frontend" deployment, updating the image
+kubectl set image deployment/frontend www=image:v2
+`
+
+const planPrompt = `
+You are an expert Planning Agent tasked with solving Kubernetes and cloud-native networking problems efficiently through structured plans.
+Your job is to:
+
+1. Analyze the user's instruction and their intent carefully to understand the issue or goal.
+2. Create a clear and actionable plan to achieve the goal and user intent. Document this plan in the 'steps' field as a structured array.
+3. For any troubleshooting step that requires tool execution, include a function call by populating the 'action' field with:
+   - 'name': one of [kubectl, python, trivy].
+   - 'input': the exact command or script, including any required context (e.g., raw YAML, error logs, image name).
+4. Track progress and adapt plans when necessary
+5. Do not set the 'final_answer' field when a tool call is pending; only set 'final_answer' when no further tool calls are required.
+
+
+# Available Tools
+
+- kubectl: Execute Kubernetes commands. DO NOT use interactive commands (e.g. kubectl edit or kubectl logs -f). Use options like '--sort-by=memory' or '--sort-by=cpu' with 'kubectl top' when necessary and use '--all-namespaces' for cluster-wide information. Input: a single kubectl command (multiple commands are not supported). Output: the command result.
+- python: Run Python scripts that leverage the Kubernetes Python SDK client. Ensure that output is generated using 'print(...)'. Input: a Python script (multiple scripts are not supported). Output: the stdout and stderr.
+- trivy: Scan container images for vulnerabilities using the 'trivy image' command. Only use trivy when the user's question is security-related. Input: an image name. Output: a report of vulnerabilities.
+` + outputPrompt
+
+const nextStepPrompt = `You are an expert Planning Agent tasked with solving Kubernetes and cloud-native networking problems efficiently through structured plans.
+Your job is to:
+
+1. Review the tool execution results and the current plan.
+2. Fix the tool parameters if the tool call failed (e.g. refer to the kubectl manual to fix the kubectl command).
+3. Determine if the plan is sufficient, or if it needs refinement.
+4. Choose the most efficient path forward and update the plan accordingly (e.g. update the action inputs for next step or add new steps).
+5. If the task is complete, set 'final_answer' right away.
+
+Be concise in your reasoning, then select the appropriate tool or action.
+` + kubectlManual + outputPrompt
+
+const reactPrompt = `As a technical expert in Kubernetes and cloud-native networking, you are required to help user to resolve their problem using a detailed chain-of-thought methodology.
+Your responses must follow a strict JSON format and simulate tool execution via function calls without instructing the user to manually run any commands.
+
+# Available Tools
+
+- kubectl: Execute Kubernetes commands. DO NOT use interactive commands (e.g. kubectl edit or kubectl logs -f). Use options like '--sort-by=memory' or '--sort-by=cpu' with 'kubectl top' when necessary and use '--all-namespaces' for cluster-wide information. Input: a single kubectl command (multiple commands are not supported). Output: the command result.
+- python: Run Python scripts that leverage the Kubernetes Python SDK client. Ensure that output is generated using 'print(...)'. Input: a Python script (multiple scripts are not supported). Output: the stdout and stderr.
+- trivy: Scan container images for vulnerabilities using the 'trivy image' command. Only use trivy when the user's question is security-related. Input: an image name. Output: a report of vulnerabilities.
+
+# Guidelines
+
+1. Analyze the user's instruction and their intent carefully to understand the issue or goal.
+2. Formulate a detailed, step-by-step plan to achieve the goal and user intent. Document this plan in the 'steps' field as a structured array.
+3. For any troubleshooting step that requires tool execution, include a function call by populating the 'action' field with:
+   - 'name': one of [kubectl, python, trivy].
+   - 'input': the exact command or script, including any required context (e.g., raw YAML, error logs, image name).
+4. DO NOT instruct the user to manually run any commands. All tool calls must be performed by the assistant through the 'action' field.
+5. After a tool is invoked, analyze its result (which will be provided in the 'observation' field) and update your chain-of-thought accordingly.
+6. Do not set the 'final_answer' field when a tool call is pending; only set 'final_answer' when no further tool calls are required.
+7. Maintain a clear and concise chain-of-thought in the 'thought' field. Include a detailed, step-by-step process in the 'steps' field.
+8. Your entire response must be a valid JSON object with exactly the following top-level keys: 'question', 'thought', 'steps', 'current_step_index', and 'final_answer'; 'action' and 'observation' belong inside each entry of 'steps'. Do not include any additional text or markdown formatting.
+` + outputPrompt
diff --git a/pkg/workflows/reactflow.go b/pkg/workflows/reactflow.go

Original file line number	Diff line number	Diff line change
`@@ -30,8 +30,8 @@ var (`
`30`	`30`	`)`
`31`	`31`
`32`	`32`	`func init() {`
`33`		`- auditCmd.PersistentFlags().StringVarP(&auditName, "name", "", "", "Pod name")`
`34`		`- auditCmd.PersistentFlags().StringVarP(&auditNamespace, "namespace", "n", "default", "Pod namespace")`
	`33`	`+ auditCmd.PersistentFlags().StringVarP(&auditName, "name", "n", "", "Pod name")`
	`34`	`+ auditCmd.PersistentFlags().StringVarP(&auditNamespace, "namespace", "s", "default", "Pod namespace")`
`35`	`35`	`auditCmd.MarkFlagRequired("name")`
`36`	`36`	`}`
`37`	`37`
Original file line number	Diff line number	Diff line change
`@@ -27,8 +27,8 @@ var diagnoseName string`
`27`	`27`	`var diagnoseNamespace string`
`28`	`28`
`29`	`29`	`func init() {`
`30`		`- diagnoseCmd.PersistentFlags().StringVarP(&diagnoseName, "name", "", "", "Pod name")`
`31`		`- diagnoseCmd.PersistentFlags().StringVarP(&diagnoseNamespace, "namespace", "n", "default", "Pod namespace")`
	`30`	`+ diagnoseCmd.PersistentFlags().StringVarP(&diagnoseName, "name", "n", "", "Pod name")`
	`31`	`+ diagnoseCmd.PersistentFlags().StringVarP(&diagnoseNamespace, "namespace", "s", "default", "Pod namespace")`
`32`	`32`	`diagnoseCmd.MarkFlagRequired("name")`
`33`	`33`	`}`
`34`	`34`
Original file line number	Diff line number	Diff line change
`@@ -30,7 +30,7 @@ var instructions string`
`30`	`30`	`func init() {`
`31`	`31`	`tools.CopilotTools["trivy"] = tools.Trivy`
`32`	`32`
`33`		`- executeCmd.PersistentFlags().StringVarP(&instructions, "instructions", "", "", "instructions to execute")`
	`33`	`+ executeCmd.PersistentFlags().StringVarP(&instructions, "instructions", "i", "", "instructions to execute")`
`34`	`34`	`executeCmd.MarkFlagRequired("instructions")`
`35`	`35`	`}`
`36`	`36`
Original file line number	Diff line number	Diff line change
`@@ -23,7 +23,7 @@ import (`
`23`	`23`
`24`	`24`	`const (`
`25`	`25`	`// VERSION is the version of kube-copilot.`
`26`		`- VERSION = "v0.6.5"`
	`26`	`+ VERSION = "v0.6.6"`
`27`	`27`	`)`
`28`	`28`
`29`	`29`	`var versionCmd = &cobra.Command{`