Commit c0391dd

feat: add token & time awareness tools/hooks (#665)
* feat: add token budget awareness tool

  Implements issue #661 - context/token budget awareness using hooks.

  This adds a new 'context' tool that provides token budget awareness similar to
  Claude 4.5's built-in feature, but works across all LLM providers and tool formats.

  Features:
  - Adds <budget:token_budget>XXX</budget:token_budget> at session start
  - Adds <system_warning>Token usage: X/Y; Z remaining</system_warning> after each message is processed
  - Uses SESSION_START and MESSAGE_POST_PROCESS hooks
  - Works with all LLM providers and tool formats

  The messages are hidden from the terminal (hide=True) but are sent to the model to provide context awareness.

* fix(tests): correct Log.append() usage in context tool tests

  The Log.append() method returns a new Log object (immutable pattern) rather than
  modifying in place. Tests were not capturing the return value, resulting in empty
  message lists and 0 token counts.

  Fixed by properly assigning return values: log = log.append(message)

  Fixes the two failing tests:
  - test_token_calculation_accuracy
  - test_multiple_usage_warnings

* perf(context): optimize token counting to O(N) with incremental updates

  - Add module-level caches for running token totals per conversation
  - Track message count to only compute tokens for new messages
  - Use workspace as conversation identifier
  - Fall back to full recount if workspace is None
  - Reduces complexity from O(N²) to O(N) amortized

  This should resolve test_subagent timeouts caused by repeated full token
  recounting on every message in long conversations.

* refactor: split awareness tools into token-awareness and time-awareness

  - Rename context.py → token_awareness.py with tool name 'token-awareness'
  - Create new time-awareness tool for time tracking
  - Time messages at: 1min, 5min, 10min, 15min, 20min, then every 10min
  - Update all tests to match new tool names
  - Both tools use MESSAGE_POST_PROCESS hook
  - Created issue #748 for TOOL_POST_EXECUTE hook consistency

  Related: #665, #748

  Co-authored-by: Bob <bob@superuserlabs.org>

* fix: correct milestone progression test logic

  Use iteration counter instead of checking set state before hook runs.

  Co-authored-by: Bob <bob@superuserlabs.org>

* fix: output HH:MM format in time awareness hints

---------

Co-authored-by: Erik Bjäreholt <erik@bjareho.lt>
1 parent 5dd354d commit c0391dd
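
The test fix described above hinges on Log being immutable: Log.append() returns a new Log rather than mutating the receiver. A minimal sketch of the corrected test pattern follows; it assumes Log can be constructed from a plain list of messages, as in gptme.logmanager.

from gptme.logmanager import Log
from gptme.message import Message

log = Log([])  # assumption: Log wraps a list of messages
msg = Message("user", "hello")

# Wrong (the pre-fix tests): return value discarded, log stays empty
log.append(msg)

# Right: capture the new Log returned by append()
log = log.append(msg)
assert len(log.messages) == 1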

File tree

4 files changed: +717 -0 lines

gptme/tools/time_awareness.py

Lines changed: 130 additions & 0 deletions
@@ -0,0 +1,130 @@
"""
Time awareness tool.

Provides time feedback during conversations to help the assistant manage
long-running sessions effectively.

This helps the assistant:
- Understand conversation duration
- Plan work within time constraints
- Manage long-running autonomous sessions effectively
- Avoid timeouts and performance issues

Shows time elapsed messages at: 1min, 5min, 10min, 15min, 20min, then every 10min.
"""

import logging
from collections.abc import Generator
from datetime import datetime
from pathlib import Path

from ..hooks import HookType
from ..logmanager import Log
from ..message import Message
from .base import ToolSpec

logger = logging.getLogger(__name__)

# Track conversation start times per workspace
_conversation_start_times: dict[str, datetime] = {}

# Track which time milestones have been shown per workspace
_shown_milestones: dict[str, set[int]] = {}


def add_time_message(
    log: Log, workspace: Path | None, manager=None
) -> Generator[Message, None, None]:
    """Add time elapsed message after message processing.

    Shows messages at: 1min, 5min, 10min, 15min, 20min, then every 10min.
    """
    try:
        if workspace is None:
            return

        workspace_str = str(workspace)

        # Initialize conversation start time if first message
        if workspace_str not in _conversation_start_times:
            _conversation_start_times[workspace_str] = datetime.now()
            _shown_milestones[workspace_str] = set()
            return

        # Calculate elapsed time in minutes
        elapsed = datetime.now() - _conversation_start_times[workspace_str]
        elapsed_minutes = int(elapsed.total_seconds() / 60)

        # Determine which milestone to show
        milestone = _get_next_milestone(elapsed_minutes)

        # Check if we should show this milestone
        if milestone and milestone not in _shown_milestones[workspace_str]:
            _shown_milestones[workspace_str].add(milestone)

            # Format time message
            hours = elapsed_minutes // 60
            minutes = elapsed_minutes % 60

            time_str = datetime.now().strftime("%H:%M")
            if hours > 0:
                elapsed_str = f"{hours}h {minutes}min" if minutes > 0 else f"{hours}h"
            else:
                elapsed_str = f"{minutes}min"

            message = Message(
                "system",
                f"<system_info>The time is now {time_str}. Time elapsed: {elapsed_str}</system_info>",
                hide=True,
            )
            yield message

    except Exception as e:
        logger.exception(f"Error adding time message: {e}")


def _get_next_milestone(elapsed_minutes: int) -> int | None:
    """Get the next milestone to show based on elapsed minutes.

    Milestones: 1, 5, 10, 15, 20, then every 10 minutes.
    """
    if elapsed_minutes < 1:
        return None
    elif elapsed_minutes < 5:
        return 1
    elif elapsed_minutes < 10:
        return 5
    elif elapsed_minutes < 15:
        return 10
    elif elapsed_minutes < 20:
        return 15
    elif elapsed_minutes < 30:
        return 20
    else:
        # Every 10 minutes after 20
        return (elapsed_minutes // 10) * 10


# Tool specification
tool = ToolSpec(
    name="time-awareness",
    desc="Time tracking awareness for conversations",
    instructions="""
This tool provides time awareness to help manage long-running conversations.

The assistant receives periodic updates about how much time has elapsed:
<system_info>Time elapsed: Xmin</system_info>

Time messages are shown at: 1min, 5min, 10min, 15min, 20min, then every 10 minutes.
""".strip(),
    available=True,
    hooks={
        "time_message": (
            HookType.MESSAGE_POST_PROCESS.value,
            add_time_message,
            0,  # Normal priority
        ),
    },
)

__all__ = ["tool"]
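
For reference, the milestone schedule above works out as follows. This is an illustrative check of _get_next_milestone (a module-private helper, imported here only for demonstration), not part of the shipped tests; suppression of already-shown milestones is handled separately via _shown_milestones in add_time_message.

from gptme.tools.time_awareness import _get_next_milestone

assert _get_next_milestone(0) is None   # under a minute: nothing yet
assert _get_next_milestone(3) == 1      # 1min milestone
assert _get_next_milestone(7) == 5      # 5min milestone
assert _get_next_milestone(12) == 10    # 10min milestone
assert _get_next_milestone(18) == 15    # 15min milestone
assert _get_next_milestone(25) == 20    # 20min milestone
assert _get_next_milestone(47) == 40    # past 20min: floored to the nearest 10min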

gptme/tools/token_awareness.py

Lines changed: 171 additions & 0 deletions
@@ -0,0 +1,171 @@
"""
Token budget awareness tool.

Implements context/token budget awareness similar to Claude 4.5's built-in feature,
but works across all LLM providers and tool formats.

Adds:
- <budget:token_budget>XXX</budget:token_budget> at session start
- <system_warning>Token usage: X/Y; Z remaining</system_warning> after message processing
"""

import logging
from collections.abc import Generator
from pathlib import Path

from ..hooks import HookType
from ..logmanager import Log
from ..message import Message, len_tokens
from .base import ToolSpec

logger = logging.getLogger(__name__)

# Cache for incremental token counting (avoids O(N²) behavior)
_token_totals: dict[str, int] = {}
_message_counts: dict[str, int] = {}


def add_token_budget(
    logdir: Path, workspace: Path | None, initial_msgs: list[Message], **kwargs
) -> Generator[Message, None, None]:
    """Add token budget tag at session start.

    Args:
        logdir: Log directory path
        workspace: Workspace directory path
        initial_msgs: Initial messages in the conversation

    Yields:
        System message with token budget tag
    """
    try:
        from ..llm.models import get_default_model

        model = get_default_model()
        if not model:
            logger.debug("No model loaded, skipping token budget")
            return

        budget = model.context

        # Add budget tag as a system message
        # Using hide=True so it doesn't show in terminal but is sent to the model
        yield Message(
            "system",
            f"<budget:token_budget>{budget}</budget:token_budget>",
            hide=True,
        )

        logger.debug(f"Added token budget: {budget}")

    except Exception as e:
        logger.exception(f"Error adding token budget: {e}")


def add_token_usage_warning(
    log: Log, workspace: Path | None, **kwargs
) -> Generator[Message, None, None]:
    """Add token usage warning after message processing.

    Uses incremental token counting to avoid O(N²) behavior.

    Args:
        log: The conversation log
        workspace: Workspace directory path

    Yields:
        System message with token usage warning
    """
    try:
        from ..llm.models import get_default_model

        model = get_default_model()
        if not model:
            logger.debug("No model loaded, skipping token usage warning")
            return

        budget = model.context

        # Use workspace as unique identifier for the conversation
        # If workspace is None, fall back to recounting (less efficient but correct)
        log_id = str(workspace) if workspace else None

        # Calculate token usage
        if log_id is None:
            # No workspace identifier: fall back to counting all messages
            # This is less efficient (O(N) per call) but ensures correctness
            used = len_tokens(log.messages, model.model)
        else:
            # Incremental counting (O(1) amortized per message)
            current_count = len(log.messages)
            previous_count = _message_counts.get(log_id, 0)

            if previous_count == 0:
                # First time: count all messages
                used = len_tokens(log.messages, model.model)
                _token_totals[log_id] = used
                _message_counts[log_id] = current_count
            else:
                # Subsequent times: only count new messages
                new_messages = log.messages[previous_count:]
                if new_messages:
                    new_tokens = len_tokens(new_messages, model.model)
                    used = _token_totals.get(log_id, 0) + new_tokens
                    _token_totals[log_id] = used
                    _message_counts[log_id] = current_count
                else:
                    # No new messages (shouldn't happen but handle gracefully)
                    used = _token_totals.get(log_id, 0)

        remaining = budget - used

        # Add usage warning as a system message
        # Using hide=True so it doesn't show in terminal but is sent to the model
        yield Message(
            "system",
            f"<system_warning>Token usage: {used}/{budget}; {remaining} remaining</system_warning>",
            hide=True,
        )

        logger.debug(
            f"Token usage: {used}/{budget}; {remaining} remaining (incremental)"
        )

    except Exception as e:
        logger.exception(f"Error adding token usage warning: {e}")


# Tool specification
tool = ToolSpec(
    name="token-awareness",
    desc="Token budget awareness for conversations",
    instructions="""
This tool provides token budget awareness to the assistant across all LLM providers.

At the start of each conversation, the assistant receives information about the total token budget:
<budget:token_budget>XXX</budget:token_budget>

After each message is processed, the assistant receives an update on token usage:
<system_warning>Token usage: X/Y; Z remaining</system_warning>

This helps the assistant:
- Understand how much context capacity remains
- Plan responses to fit within the budget
- Manage long-running conversations effectively
""".strip(),
    available=True,
    hooks={
        "token_budget": (
            HookType.SESSION_START.value,
            add_token_budget,
            10,  # High priority to run early
        ),
        "token_usage": (
            HookType.MESSAGE_POST_PROCESS.value,
            add_token_usage_warning,
            0,  # Normal priority
        ),
    },
)

__all__ = ["tool"]
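
As a rough usage sketch, the post-process hook can also be driven directly with a small log. This assumes a default model is configured (otherwise the generator yields nothing), that Log can be built from a list of messages, and uses a made-up workspace path purely for illustration.

from pathlib import Path

from gptme.logmanager import Log
from gptme.message import Message
from gptme.tools.token_awareness import add_token_usage_warning

log = Log([])                                   # assumption: Log wraps a message list
log = log.append(Message("user", "hello"))      # append() returns a new Log
log = log.append(Message("assistant", "hi!"))

msgs = list(add_token_usage_warning(log, Path("/tmp/example-workspace")))
# With a model loaded, expect one hidden system message of the form:
#   <system_warning>Token usage: X/Y; Z remaining</system_warning>
assert msgs and msgs[0].hide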
