Manoj Thapa committed · Commit 5b1b7c1 · Parent(s): e59469c
Fix: Improve language context switching by appending explicit instruction to user prompt
Browse files
- backend/agent/graph.py +33 -38
- backend/tools/code_executor.py +29 -3
backend/agent/graph.py
CHANGED

@@ -201,6 +201,14 @@ class AgentRunner:
         # Append Language Instruction
         if language and language != "English":
             formatted_system_prompt += f"\n\nIMPORTANT: You must respond in {language}. Translate your internal reasoning if necessary, but the final output must be in {language}."
+
+        # Override History Bias:
+        # If the conversation history has a different language, the model might get confused.
+        # We explicitly append the instruction to the *current* user message to force the switch.
+        current_user_content = user_message
+        if language and language != "English":
+            current_user_content += f"\n\n(Please answer in {language})"
+
         messages = [{"role": "system", "content": formatted_system_prompt}]

         # Smart Context Management
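Taken together, the pre-existing system-level rule and the new per-message suffix shape the request as sketched below. Values are illustrative; the final messages.append(...) for the current turn is assumed from the commit message ("appending explicit instruction to user prompt") rather than shown in this hunk.

# Illustrative sketch of how the two language instructions combine.
# Values are made up; variable names follow the diff above.
formatted_system_prompt = "You are a helpful assistant."
user_message = "¿Cuál es la capital de Francia?"
language = "Spanish"

# System-level steer (pre-existing lines in the hunk above)
if language and language != "English":
    formatted_system_prompt += (
        f"\n\nIMPORTANT: You must respond in {language}. Translate your internal "
        f"reasoning if necessary, but the final output must be in {language}."
    )

# Per-turn override added by this commit: pinned to the current user message
# so a history written in another language cannot pull the model back.
current_user_content = user_message
if language and language != "English":
    current_user_content += f"\n\n(Please answer in {language})"

messages = [{"role": "system", "content": formatted_system_prompt}]
# ... truncated history is appended here (next hunk) ...
# Assumed final step, not shown in this hunk:
messages.append({"role": "user", "content": current_user_content})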
@@ -208,49 +216,36 @@ class AgentRunner:
         # Github Models Free Tier has a strict 8k token limit for ALL models
         # 8k tokens ~= 32k chars. We use 30k to be safe.
         MAX_HISTORY_CHARS = 30000
-
-        current_chars = 0
-        selected_history = []

         if conversation_history:
-            #
-
-
-
-
-
-
-
-
-
-
-                if current_chars + msg_len > MAX_HISTORY_CHARS:
-                    # Soft limit hit - stop adding history
+            # Sort by timestamp just in case
+            sorted_history = sorted(conversation_history, key=lambda x: x.get("timestamp", ""))
+
+            # Simple truncation strategy
+            truncated_history = []
+            current_chars = 0
+
+            # Add history from newest to oldest until limit
+            for msg in reversed(sorted_history):
+                content_len = len(msg.get("documents", [""])[0] if isinstance(msg.get("documents"), list) else str(msg.get("content", "")))
+                if current_chars + content_len > MAX_HISTORY_CHARS:
                     break
+                truncated_history.insert(0, msg)
+                current_chars += content_len
+
+            # Convert to OpenAI format
+            for msg in truncated_history:
+                # Handle stored document format vs raw content
+                content = msg.get("documents", [""])[0] if isinstance(msg.get("documents"), list) else msg.get("content", "")

-            #
-
-
+                # Skip system messages in history if any
+                if msg.get("role") == "system":
+                    continue
+
+                messages.append({
+                    "role": msg.get("role"),
                     "content": content
-                }
-                if "tool_calls" in msg:
-                    clean_msg["tool_calls"] = msg["tool_calls"]
-                if "tool_call_id" in msg:
-                    clean_msg["tool_call_id"] = msg["tool_call_id"]
-                if "name" in msg:
-                    clean_msg["name"] = msg["name"]
-
-                selected_history.insert(0, clean_msg)
-                current_chars += msg_len
-
-            # SAFETY: Ensure history doesn't start with a 'tool' result (orphan)
-            # API requires: User/System -> Assistant -> Tool -> Assistant ...
-            # If we cut in the middle, we might start with 'tool'.
-            while selected_history and selected_history[0].get("role") == "tool":
-                selected_history.pop(0)
-
-            # Add trimmed history to messages
-            messages.extend(selected_history)
+                })

         # Add file context if any
         file_context = ""
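For reference, the truncation strategy added in this hunk can be exercised on its own. Below is a minimal standalone sketch, assuming history entries are plain dicts with role/content/timestamp keys; the stored "documents" format handled in the diff is omitted, and truncate_history is a hypothetical name, not a function in this repo.

# Minimal standalone sketch of the newest-to-oldest character budget used above.
# Assumes entries are dicts with "role", "content", "timestamp".
# truncate_history is hypothetical, not part of the repo.
def truncate_history(history, max_chars=30000):
    # Sort by timestamp so "newest" is well defined
    ordered = sorted(history, key=lambda m: m.get("timestamp", ""))

    selected, used = [], 0
    # Walk newest -> oldest; keep prepending until the budget would be exceeded
    for msg in reversed(ordered):
        length = len(str(msg.get("content", "")))
        if used + length > max_chars:
            break
        selected.insert(0, msg)
        used += length

    # Drop system messages and re-emit in OpenAI chat format
    return [
        {"role": m.get("role"), "content": m.get("content", "")}
        for m in selected
        if m.get("role") != "system"
    ]

history = [
    {"role": "user", "content": "a" * 50, "timestamp": "t1"},
    {"role": "assistant", "content": "b" * 50, "timestamp": "t2"},
    {"role": "user", "content": "c" * 50, "timestamp": "t3"},
]
# A 120-char budget keeps only the two newest messages
print([m["content"][0] for m in truncate_history(history, max_chars=120)])  # ['b', 'c']

Note that because the loop breaks on the first message that would overflow the budget, a single oversized recent message can empty the selection entirely; that is the same soft-limit behavior as the committed code.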
backend/tools/code_executor.py
CHANGED

@@ -66,7 +66,7 @@ def code_executor_tool(code: str, language: str = "python") -> str:


 def _execute_python(code: str, result: Dict[str, Any]) -> str:
-    """Executes Python code in-process using
+    """Executes Python code in-process using AST to capture last expression."""
     stdout_capture = io.StringIO()
     stderr_capture = io.StringIO()

@@ -83,14 +83,40 @@ def _execute_python(code: str, result: Dict[str, Any]) -> str:
     exec_globals = {'__builtins__': safe_builtins}
     exec_locals = {}

+    import ast
+
     try:
         with redirect_stdout(stdout_capture), redirect_stderr(stderr_capture):
+            # Parse the code into an AST
             try:
-
-                result["result"] = str(exec_result) if exec_result is not None else None
+                tree = ast.parse(code)
             except SyntaxError:
+                # If parsing fails, fall back to simple exec to let it raise the error naturally
                 exec(code, exec_globals, exec_locals)

+            # Check if likely an expression at the end
+            last_node = None
+            if tree.body and isinstance(tree.body[-1], ast.Expr):
+                last_node = tree.body.pop()
+
+            # Execute the main block (all statements except the last expression)
+            if tree.body:
+                # Compile as a module
+                module = ast.Module(body=tree.body, type_ignores=[])
+                # We must fix locations for the new AST to be compilable
+                ast.fix_missing_locations(module)
+                compiled_module = compile(module, filename="<string>", mode="exec")
+                exec(compiled_module, exec_globals, exec_locals)
+
+            # Evaluate the last expression (if any)
+            if last_node:
+                expr = ast.Expression(body=last_node.value)
+                ast.fix_missing_locations(expr)
+                compiled_expr = compile(expr, filename="<string>", mode="eval")
+                exec_result = eval(compiled_expr, exec_globals, exec_locals)
+                # Store the result
+                result["result"] = str(exec_result) if exec_result is not None else None
+
     result["stdout"] = stdout_capture.getvalue()
     result["stderr"] = stderr_capture.getvalue()
     result["success"] = True
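The pattern above reproduces REPL behavior: run every statement, then echo the value of a trailing expression. Below is a self-contained sketch of the same technique, independent of this file's result dict and sandboxed builtins; run_and_capture_last is a hypothetical name.

import ast

# Hypothetical standalone version of the AST trick used in _execute_python:
# exec all statements, then eval a trailing expression and return its value.
def run_and_capture_last(code, env=None):
    env = {} if env is None else env
    tree = ast.parse(code)

    # Detach a trailing expression statement, if there is one
    last = tree.body.pop() if tree.body and isinstance(tree.body[-1], ast.Expr) else None

    if tree.body:
        module = ast.Module(body=tree.body, type_ignores=[])
        ast.fix_missing_locations(module)
        exec(compile(module, "<string>", "exec"), env)

    if last is not None:
        expr = ast.Expression(body=last.value)
        ast.fix_missing_locations(expr)
        # Same namespace as the statements, so earlier assignments stay visible
        return eval(compile(expr, "<string>", "eval"), env)
    return None

print(run_and_capture_last("x = 2\nx * 21"))  # 42
print(run_and_capture_last("y = 1"))          # None (no trailing expression)

Using one dict as the shared namespace also sidesteps the classic exec pitfall where a function defined in the snippet cannot see names bound outside it when globals and locals are separate mappings.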