All-Hands-AI · AutoLTX · Feb 10, 2025 · Feb 10, 2025 · Feb 10, 2025 · Feb 10, 2025
diff --git a/frontend/src/components/shared/task-form.tsx b/frontend/src/components/shared/task-form.tsx
@@ -32,6 +32,7 @@ export function TaskForm({ ref }: TaskFormProps) {
   });
   const [inputIsFocused, setInputIsFocused] = React.useState(false);
   const { mutate: createConversation, isPending } = useCreateConversation();
+  const [estimateCost, setEstimateCost] = React.useState(false);
 
   const onRefreshSuggestion = () => {
     const suggestions = SUGGESTIONS["non-repo"];
@@ -103,6 +104,31 @@ export function TaskForm({ ref }: TaskFormProps) {
             />
           )}
         </div>
+        <div className="flex items-center gap-2">
+          <span className="text-sm text-neutral-400">Estimate cost</span>
+          <button
+            type="button"
+            role="switch"
+            aria-checked={estimateCost}
+            onClick={() => setEstimateCost(!estimateCost)}
+            className={cn(
+              "relative inline-flex h-6 w-11 items-center rounded-full",
+              "transition-colors duration-200 ease-in-out",
+              estimateCost ? "bg-green-500" : "bg-neutral-600",
+              "focus:outline-none focus-visible:ring-2 focus-visible:ring-white focus-visible:ring-opacity-75"
+            )}
+          >
+            <span className="sr-only">Enable cost estimation</span>
+            <span
+              className={cn(
+                "inline-block h-4 w-4 transform rounded-full bg-white",
+                "transition duration-200 ease-in-out",
+                "shadow-lg",
+                estimateCost ? "translate-x-6" : "translate-x-1"
+              )}
+            />
+          </button>
+        </div>
       </form>
       <UploadImageInput
         onUpload={async (uploadedFiles) => {

diff --git a/frontend/src/services/observations.ts b/frontend/src/services/observations.ts
@@ -12,8 +12,26 @@ import {
 } from "#/state/chat-slice";
 
 export function handleObservationMessage(message: ObservationMessage) {
+  console.log("Processing observation message:", message);
+
+  // Handle llm_metrics and usage together
+  if (message.llm_metrics || message.tool_call_metadata?.model_response?.usage) {
+    const usage = message.tool_call_metadata?.model_response?.usage;
+    const metrics = message.llm_metrics;
+    console.log("Processing metrics:", metrics);
+    console.log("Processing usage:", usage);
+
+    alert([
+      'LLM Information',
+      metrics ? `Accumulated Cost: $${metrics.accumulated_cost.toFixed(4)}` : '',
+      usage ? `Prompt Tokens: ${usage.prompt_tokens}` : '',
+      usage ? `Completion Tokens: ${usage.completion_tokens}` : '',
+      usage ? `Total Tokens: ${usage.total_tokens}` : ''
+    ].filter(line => line !== '').join('\n'));  // Filter out empty lines
+  }
+
   switch (message.observation) {
-    case ObservationType.RUN: {
+    case ObservationType.RUN:
       if (message.extras.hidden) break;
       let { content } = message;
 
@@ -24,9 +42,7 @@ export function handleObservationMessage(message: ObservationMessage) {
 
       store.dispatch(appendOutput(content));
       break;
-    }
     case ObservationType.RUN_IPYTHON:
-      // FIXME: render this as markdown
       store.dispatch(appendJupyterOutput(message.content));
       break;
     case ObservationType.BROWSE:

diff --git a/frontend/src/types/message.tsx b/frontend/src/types/message.tsx
@@ -38,6 +38,25 @@ export interface ObservationMessage {
 
   // The timestamp of the message
   timestamp: string;
+
+  // Optional tool_call_metadata field; may carry the model response's token usage counts
+  tool_call_metadata?: {
+    model_response?: {
+      usage?: {
+        prompt_tokens: number;
+        completion_tokens: number;
+        total_tokens: number;
+      };
+    };
+  };
+
+  llm_metrics?: {
+    accumulated_cost: number;
+    response_latencies: Array<{
+      latency: number;
+      timestamp: string;
+    }>;
+  };
 }
 
 export interface StatusMessage {

diff --git a/openhands/agenthub/codeact_agent/function_calling.py b/openhands/agenthub/codeact_agent/function_calling.py
@@ -16,6 +16,7 @@
     FunctionCallNotExistsError,
     FunctionCallValidationError,
 )
+from openhands.core.logger import openhands_logger as logger
 from openhands.events.action import (
     Action,
     AgentDelegateAction,
@@ -590,6 +591,13 @@ def response_to_actions(response: ModelResponse) -> list[Action]:
                 total_calls_in_response=len(assistant_msg.tool_calls),
             )
             actions.append(action)
+
+        # Add logging for each created action
+        for action in actions:
+            accumulated_cost = action.llm_metrics.accumulated_cost if action.llm_metrics else None
+            logger.info(f"Action created - Accumulated Cost: {accumulated_cost}")
+            logger.info(f"Action type: {type(action)}")
+
     else:
         actions.append(
             MessageAction(content=assistant_msg.content, wait_for_response=True)

diff --git a/openhands/controller/agent_controller.py b/openhands/controller/agent_controller.py
@@ -203,6 +203,10 @@ def update_state_before_step(self):
     async def update_state_after_step(self):
         # update metrics especially for cost. Use deepcopy to avoid it being modified by agent._reset()
         self.state.local_metrics = copy.deepcopy(self.agent.llm.metrics)
+
+        # Add logging for metrics update
+        accumulated_cost = self.state.local_metrics.accumulated_cost if self.state.local_metrics else None
+        logger.info(f"After update_state_after_step - State Local Metrics Accumulated Cost: {accumulated_cost}")
 
     async def _react_to_exception(
         self,
@@ -379,6 +383,17 @@ async def _handle_observation(self, observation: Observation) -> None:
         if observation.llm_metrics is not None:
             self.agent.llm.metrics.merge(observation.llm_metrics)
 
+        logger.info("Mark the position of _handle_observation")
+        # Log state metrics before assignment
+        if self.state and self.state.local_metrics:
+            logger.info(f"State local_metrics before assignment - accumulated cost: {self.state.local_metrics.accumulated_cost}")
+
+        # Add local metrics to observation
+        if self.state and self.state.local_metrics:
+            observation.llm_metrics = copy.deepcopy(self.state.local_metrics)
+            # Log observation metrics after assignment
+            logger.info(f"Observation metrics after assignment - accumulated cost: {observation.llm_metrics.accumulated_cost}")
+
         if self._pending_action and self._pending_action.id == observation.cause:
             if self.state.agent_state == AgentState.AWAITING_USER_CONFIRMATION:
                 return

diff --git a/openhands/events/serialization/event.py b/openhands/events/serialization/event.py
@@ -9,6 +9,7 @@
 from openhands.events.serialization.observation import observation_from_dict
 from openhands.events.serialization.utils import remove_fields
 from openhands.events.tool import ToolCallMetadata
+from openhands.core.logger import openhands_logger as logger
 
 # TODO: move `content` into `extras`
 TOP_KEYS = [
@@ -20,6 +21,7 @@
     'action',
     'observation',
     'tool_call_metadata',
+    'llm_metrics'
 ]
 UNDERSCORE_KEYS = ['id', 'timestamp', 'source', 'cause', 'tool_call_metadata']
 
@@ -80,7 +82,12 @@ def event_to_dict(event: 'Event') -> dict:
         if key == 'source' and 'source' in d:
             d['source'] = d['source'].value
         if key == 'tool_call_metadata' and 'tool_call_metadata' in d:
+            logger.info(f"Mark the position of tool_call_metadata processing in event_to_dict")
             d['tool_call_metadata'] = d['tool_call_metadata'].model_dump()
+        if key == 'llm_metrics' and 'llm_metrics' in d:
+            logger.info(f"Before llm_metrics processing - metrics in d: {d['llm_metrics']}")
+            d['llm_metrics'] = d['llm_metrics'].get()
+            logger.info(f"After llm_metrics processing - metrics result: {d['llm_metrics']}")
         props.pop(key, None)
     if 'security_risk' in props and props['security_risk'] is None:
         props.pop('security_risk')

diff --git a/openhands/events/stream.py b/openhands/events/stream.py
@@ -50,6 +50,10 @@ async def __aiter__(self):
 
         # Create an async generator that yields events
         for event in self.event_stream.get_events(*self.args, **self.kwargs):
+            # Log event type and metrics if present
+            logger.info(f"AsyncEventStreamWrapper - Event type: {type(event)}")
+            if hasattr(event, 'llm_metrics') and event.llm_metrics:
+                logger.info(f"AsyncEventStreamWrapper - Accumulated Cost: {event.llm_metrics.accumulated_cost}")
             # Run the blocking get_events() in a thread pool
             yield await loop.run_in_executor(None, lambda e=event: e)  # type: ignore
 
@@ -262,6 +266,10 @@ def unsubscribe(self, subscriber_id: EventStreamSubscriber, callback_id: str):
         self._clean_up_subscriber(subscriber_id, callback_id)
 
     def add_event(self, event: Event, source: EventSource):
+        # Add logs for accumulated cost debugging.
+        accumulated_cost = event.llm_metrics.accumulated_cost if event.llm_metrics else None
+        logger.info(f"Adding event to stream - Accumulated Cost: {accumulated_cost}")
+
         if hasattr(event, '_id') and event.id is not None:
             raise ValueError(
                 f'Event already has an ID:{event.id}. It was probably added back to the EventStream from inside a handler, triggering a loop.'

diff --git a/openhands/runtime/impl/action_execution/action_execution_client.py b/openhands/runtime/impl/action_execution/action_execution_client.py
@@ -38,6 +38,7 @@
 from openhands.runtime.plugins import PluginRequirement
 from openhands.runtime.utils.request import send_request
 from openhands.utils.http_session import HttpSession
+from openhands.core.logger import openhands_logger as logger
 
 
 class ActionExecutionClient(Runtime):
@@ -217,6 +218,11 @@ def get_vscode_token(self) -> str:
             return ''
 
     def send_action_for_execution(self, action: Action) -> Observation:
+        # Log: check if incoming action has metrics
+        logger.info(f"Action type before execution: {type(action)}")
+        if hasattr(action, 'llm_metrics') and action.llm_metrics:
+            logger.info(f"Action llm_metrics before execution - accumulated cost: {action.llm_metrics.accumulated_cost}")
+
         if (
             isinstance(action, FileEditAction)
             and action.impl_source == FileEditSource.LLM_BASED_EDIT

diff --git a/openhands/server/session/session.py b/openhands/server/session/session.py
@@ -175,11 +175,18 @@ async def _on_event(self, event: Event):
         Args:
             event: The agent event (Observation or Action).
         """
+        # Add logs: Record received events and metrics
+        logger.info(f"Session received event type: {type(event)}")
+        if hasattr(event, 'llm_metrics') and event.llm_metrics:
+            logger.info(f"Event accumulated cost: {event.llm_metrics.accumulated_cost}")
+
         if isinstance(event, NullAction):
             return
         if isinstance(event, NullObservation):
             return
         if event.source == EventSource.AGENT:
+            # Add logs: record the accumulated cost for AGENT-sourced events
+            logger.info(f"Processing AGENT event accumulated cost: {event.llm_metrics.accumulated_cost if hasattr(event, 'llm_metrics') and event.llm_metrics else None}")
             await self.send(event_to_dict(event))
         elif event.source == EventSource.USER:
             await self.send(event_to_dict(event))