pti stream fixes; add reasoning content to streams.

cagostino · cagostino · commit 657ab860a5a0 · 2025-05-05T19:27:59.000-04:00
diff --git a/mkdocs.yml b/mkdocs.yml
@@ -45,4 +45,6 @@ nav:
   - TLDR Cheat Sheet: TLDR_Cheat_sheet.md
   - API:
     - Image: api/image.md
-    - LLM Functions: api/llm_funcs.md
+    - LLM Functions: api/llm_funcs.md
+    - NPC, Team, Tool: api/npc.md
+    - NPC Sys Env Helpers: api/npc_sys_env_helpers.md
diff --git a/npcpy/llm_funcs.py b/npcpy/llm_funcs.py
@@ -1025,28 +1025,3 @@ def check_llm_command(
     else:
         print("Error: Invalid action in LLM response")
         return "Error: Invalid action in LLM response"
-
-
-def rehash_last_message(
-    conversation_id: str,
-    model: str,
-    provider: str,
-    npc: Any = None,
-    stream: bool = False,
-) -> dict:
-    from npcpy.memory.command_history import CommandHistory    
-    command_history = CommandHistory()
-    last_message = command_history.get_last_conversation(conversation_id)
-    if last_message is None:
-        convo_id = command_history.get_most_recent_conversation_id()[0]
-        last_message = command_history.get_last_conversation(convo_id)
-
-    user_command = last_message[3]  # Assuming content is in the 4th column
-    return check_llm_command(
-        user_command,
-        model=model,
-        provider=provider,
-        npc=npc,
-        messages=None,
-        stream=stream,
-    )
diff --git a/npcpy/memory/command_history.py b/npcpy/memory/command_history.py
@@ -882,7 +882,8 @@ def get_available_tables(db_path: str) -> str:
     Returns:
         str: The available tables in the database.
     """
-
+    if '~' in db_path:
+        db_path = os.path.expanduser(db_path)
     try:
         with sqlite3.connect(db_path) as conn:
             cursor = conn.cursor()
diff --git a/npcpy/modes/pti.py b/npcpy/modes/pti.py
@@ -157,7 +157,7 @@ def enter_reasoning_human_in_the_loop(
                                                          reasoning_model=reasoning_model, 
                                                          reasoning_provider=reasoning_provider, answer_only=False)
             else:
-                message= "Think first though and use <think> tags. Once finished, either answer plainly or write a request for input by beginning with the <request_for_input> tag. and close it with a </request_for_input>"
+                message= "Think first though and use <think> tags in your chain of thought. Once finished, either answer plainly or write a request for input by beginning with the <request_for_input> tag. and close it with a </request_for_input>"
                 if user_input is None:
                     user_input = input('user>')
                 
@@ -183,13 +183,31 @@ def enter_reasoning_human_in_the_loop(
                 assistant_reply, messages = response['response'], response['messages']
                 thoughts = []
                 response_chunks = []
-                in_think_block = False
-                for chunk in assistant_reply:            
+                in_think_block = False # the thinking chain generated after reasoning
+                
+                thinking = False # the reasoning content 
+                
+
+                for chunk in assistant_reply:       
+                    if thinking:
+                        if not in_think_block:
+                            in_think_block = True
                     try:
+                        
                         if reasoning_provider == "ollama":
                             chunk_content = chunk.get("message", {}).get("content", "")
                         else:
-                            chunk_content = "".join(
+                            chunk_content = ''
+                            reasoning_content = ''
+                            for c in chunk.choices:
+                                if hasattr(c.delta, "reasoning_content"):
+                                    
+                                    reasoning_content += c.delta.reasoning_content
+                                    
+                            if reasoning_content:
+                                thinking = True
+                                chunk_content = reasoning_content
+                            chunk_content += "".join(
                                 choice.delta.content
                                 for choice in chunk.choices
                                 if choice.delta.content is not None
@@ -198,14 +216,9 @@ def enter_reasoning_human_in_the_loop(
                         print(chunk_content, end='')
                         combined_text = "".join(response_chunks)
 
-                        # Check for LLM request block
-                        if (
-                            "<think>" in combined_text
-                            and "</think>" not in combined_text
-                        ):
-                            in_think_block = True
-
                         if in_think_block:
+                            if '</thinking>' in combined_text:
+                                in_think_block = False
                             thoughts.append(chunk_content)
                             
                         if "</request_for_input>" in combined_text:
diff --git a/npcpy/npc_sysenv.py b/npcpy/npc_sysenv.py
@@ -1335,11 +1335,15 @@ def print_and_process_stream_with_markdown(response,
         dot_count += 1
 
         if provider == "ollama":
+            
             chunk_content = chunk["message"]["content"]
         else:
-            chunk_content = "".join(
+            
+            chunk_content = "".join(c.delta.reasoning_content for c in chunk.choices if c.delta.reasoning_content)
+            
+            chunk_content += "".join(
                 c.delta.content for c in chunk.choices if c.delta.content
-            )
+            ) 
         if not chunk_content:
             continue
         str_output += chunk_content         
diff --git a/npcpy/routes.py b/npcpy/routes.py
@@ -17,11 +17,10 @@
 )
 
 from npcpy.llm_funcs import (
+    check_llm_command,
     get_llm_response,
-    execute_llm_command,
     rehash_last_message,
     gen_image,
-    handle_tool_call,
     generate_video,
 )
 from npcpy.npc_compiler import NPC, Team, Tool
@@ -382,6 +381,31 @@ def rag_handler(command: str, **kwargs):
         traceback.print_exc()
         return {"output": f"Error executing RAG command: {e}", "messages": messages}
 
+
+def rehash_last_message(
+    conversation_id: str,
+    model: str,
+    provider: str,
+    npc: Any = None,
+    stream: bool = False,
+) -> dict:
+    from npcpy.memory.command_history import CommandHistory    
+    command_history = CommandHistory()
+    last_message = command_history.get_last_conversation(conversation_id)
+    if last_message is None:  # nothing stored for this id: retry with another conversation id
+        convo_id = command_history.get_most_recent_conversation_id()[0]
+        last_message = command_history.get_last_conversation(convo_id)
+
+    user_command = last_message[3]  # NOTE(review): assumes index 3 is the message content; TypeError if last_message is still None
+    return check_llm_command(  # re-submit the stored text; messages is passed as None
+        user_command,
+        model=model,
+        provider=provider,
+        npc=npc,
+        messages=None,
+        stream=stream,
+    )
+
 @router.route("rehash", "Re-execute the last LLM command with the same input", shell_only=True)
 def rehash_handler(command: str, **kwargs):
     messages = safe_get(kwargs, "messages", [])
diff --git a/tests/mcp_tool_test.py b/tests/mcp_tool_test.py
@@ -0,0 +1,162 @@
+import os
+import asyncio
+import json
+import sys
+from contextlib import AsyncExitStack
+from typing import Any, Dict, List
+
+# --- MCP Imports ---
+try:
+    from mcp import ClientSession, StdioServerParameters
+    from mcp.client.stdio import stdio_client
+    MCP_AVAILABLE = True
+except ImportError:
+    print("FATAL: 'mcp' library is required. Install it (`pip install mcp`).")
+    exit(1)
+
+# --- Async MCP tool call helper (run through asyncio.run by execute_mcp_tool_sync) ---
+
+async def _async_call_mcp_tool(
+    abs_server_path: str,
+    tool_name: str,
+    tool_args: Dict,
+    debug: bool = True # when True, progress messages are printed via _log
+) -> Any:
+    if not MCP_AVAILABLE:  # NOTE(review): the import guard exits on ImportError, so this never fires as written
+        raise ImportError("MCP library not installed.")
+
+    result_content: Any = {"error": "MCP call failed to complete"} # fallback; overwritten on success, timeout, or exception
+    server_name = os.path.basename(abs_server_path) # short name used in the log prefix
+
+    # Logging helper: prints only when debug is true
+    def _log(msg):
+        if debug: print(f"[_async_call_mcp: {server_name}/{tool_name}] {msg}")
+
+    _log(f"Attempting to connect to {abs_server_path}...")
+    command = "python" if abs_server_path.endswith('.py') else "node"  # any non-.py path is launched with node
+    server_params = StdioServerParameters(
+        command=command,
+        args=[abs_server_path],
+        env=os.environ.copy()
+    )
+    timeout_seconds = 30.0  # one budget covering connect, initialize, and call_tool together
+
+    try:
+        async with AsyncExitStack() as stack:
+            _log(f"Awaiting connect_and_call() with timeout {timeout_seconds}s...")
+            async def connect_and_call():
+                nonlocal result_content
+                _log(f"Entering stdio_client context...")
+                stdio_transport = await stack.enter_async_context(stdio_client(server_params))
+                _log(f"Entering ClientSession context...")
+                session = await stack.enter_async_context(ClientSession(*stdio_transport))
+                _log(f"Awaiting session.initialize()...")
+                await session.initialize()
+                _log(f"Session initialized. Awaiting session.call_tool({tool_name}, {tool_args})...")
+                call_result = await session.call_tool(tool_name, tool_args)
+                _log(f"session.call_tool completed. Raw result: {call_result}") # Log raw result
+
+                content = call_result.content
+                _log(f"Extracted content type: {type(content)}")
+
+                # --- Normalize content: extract .text from text-bearing items ---
+                if isinstance(content, list) and content and all(hasattr(item, 'text') for item in content):
+                    result_content = [item.text for item in content]
+                    _log(f"Processed list of TextContent: {result_content}")
+                elif isinstance(content, list) and len(content) == 1 and hasattr(content[0], 'text'):  # NOTE(review): unreachable; the branch above already matches this case
+                     result_content = content[0].text
+                     _log(f"Processed single TextContent in list: {result_content!r}")
+                elif hasattr(content, 'text'):
+                    result_content = content.text
+                    _log(f"Processed direct TextContent: {result_content!r}")
+                else:
+                    result_content = content
+                    _log(f"Using content directly (not TextContent): {str(result_content)[:200]}...")
+                # --- End content normalization ---
+
+            await asyncio.wait_for(connect_and_call(), timeout=timeout_seconds)
+            _log(f"connect_and_call() finished successfully.")
+
+    except asyncio.TimeoutError:
+        _log(f"Timeout Error!")
+        result_content = {"error": f"Timeout executing MCP tool '{tool_name}'"}
+    except Exception as e:
+        _log(f"Exception: {type(e).__name__} - {e}")
+        # import traceback # Optional for more detail
+        # traceback.print_exc() # Optional
+        result_content = {"error": f"Error executing MCP tool '{tool_name}': {type(e).__name__} - {e}"}
+
+    return result_content
+
+# --- Synchronous wrapper: validates the server path, then runs the async helper ---
+def execute_mcp_tool_sync(
+    server_path: str,
+    tool_name: str,
+    tool_args: Dict,
+    debug: bool = True # when True, progress messages are printed
+) -> Any:
+    if not MCP_AVAILABLE:  # NOTE(review): the import guard exits on ImportError, so this never fires as written
+        return {"error": "MCP library not installed."}
+
+    abs_server_path = os.path.abspath(server_path)
+    if not os.path.exists(abs_server_path):
+        return {"error": f"Server path not found: {abs_server_path}"}
+    if not (abs_server_path.endswith('.py') or abs_server_path.endswith('.js')):
+         return {"error": f"Server path must be .py or .js: {abs_server_path}"}
+
+    try:
+        asyncio.get_running_loop()  # raises RuntimeError when no event loop is running in this thread
+        if debug: print("[execute_mcp_tool_sync] Error: Cannot run sync within active async loop.")
+        return {"error": "Cannot run MCP tool sync within active async context."}
+    except RuntimeError:
+        pass # no running loop, so asyncio.run below can be used
+
+    if debug: print(f"[execute_mcp_tool_sync] Calling asyncio.run for {tool_name} on {os.path.basename(abs_server_path)}...")
+    try:
+        # debug is forwarded so the async helper logs at the same verbosity
+        result = asyncio.run(_async_call_mcp_tool(abs_server_path, tool_name, tool_args, debug))
+        if debug: print(f"[execute_mcp_tool_sync] asyncio.run completed.")
+        return result
+    except Exception as e:
+        if debug: print(f"[execute_mcp_tool_sync] Error during asyncio.run: {e}")
+        return {"error": f"Failed to run MCP tool '{tool_name}' synchronously: {e}"}
+
+
+# --- Command-line entry point: <mcp_server_script_path> <tool_name> '<json_arguments>' ---
+if __name__ == "__main__":
+    if len(sys.argv) != 4:  # expects exactly three arguments after the script name
+        print(f"Usage: python {sys.argv[0]} <mcp_server_script_path> <tool_name> '<json_arguments>'")
+        print(f"Example using your server: python {sys.argv[0]} ../npcpy/work/mcp_server.py get_available_tables '{{\"db_path\": \"~/npcsh_history.db\"}}'")
+        sys.exit(1)
+
+    server_script_path = sys.argv[1]
+    tool_to_call = sys.argv[2]
+    args_json_string = sys.argv[3]
+
+    try:
+        tool_arguments = json.loads(args_json_string)
+        if not isinstance(tool_arguments, dict):
+            raise ValueError("Arguments must be a JSON object.")
+    except Exception as e:  # covers both invalid JSON and the non-dict ValueError raised above
+        print(f"Error parsing arguments JSON: {e}")
+        sys.exit(1)
+
+    print(f"--- Attempting Synchronous MCP Tool Call ---")
+    print(f"Server: {server_script_path}")
+    print(f"Tool:   {tool_to_call}")
+    print(f"Args:   {tool_arguments}")
+    print(f"---------------------------------------------")
+
+    # Execute with debug=True to see internal logs
+    result = execute_mcp_tool_sync(server_script_path, tool_to_call, tool_arguments, debug=True)
+
+    # --- Print the result: JSON for dict/list, repr for str, plain print otherwise ---
+    print("\n--- Result ---")
+    print(f"Type: {type(result)}")
+    print("Content:")
+    if isinstance(result, (dict, list)):
+        print(json.dumps(result, indent=2))  # NOTE(review): json.dumps raises TypeError on non-JSON-serializable items
+    elif isinstance(result, str):
+        print(repr(result))
+    else:
+        print(result)
diff --git a/tests/test_mcp_tool_loading.py b/tests/test_mcp_tool_loading.py