StackOneHQ
diff --git a/‎README.md‎
Lines changed: 70 additions & 0 deletions b/‎README.md‎
Lines changed: 70 additions & 0 deletions
diff --git a/‎stackone_ai/__init__.py‎
Lines changed: 8 additions & 1 deletion b/‎stackone_ai/__init__.py‎
Lines changed: 8 additions & 1 deletion
diff --git a/‎stackone_ai/feedback/__init__.py‎
Lines changed: 5 additions & 0 deletions b/‎stackone_ai/feedback/__init__.py‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎stackone_ai/feedback/tool.py‎
Lines changed: 163 additions & 0 deletions b/‎stackone_ai/feedback/tool.py‎
Lines changed: 163 additions & 0 deletions
diff --git a/‎stackone_ai/implicit_feedback/__init__.py‎
Lines changed: 21 additions & 0 deletions b/‎stackone_ai/implicit_feedback/__init__.py‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎stackone_ai/implicit_feedback/analyzer.py‎
Lines changed: 83 additions & 0 deletions b/‎stackone_ai/implicit_feedback/analyzer.py‎
Lines changed: 83 additions & 0 deletions
@@ -75,6 +75,51 @@ employee = employee_tool.call(id="employee-id")
 employee = employee_tool.execute({"id": "employee-id"})
 ```
 
+## Implicit Feedback (Beta)
+
+The Python SDK can emit implicit behavioural feedback to LangSmith so you can triage low-quality tool results without manually tagging runs.
+
+### Automatic configuration
+
+Set `LANGSMITH_API_KEY` in your environment and the SDK will initialise the implicit feedback manager on first tool execution. You can optionally fine-tune behaviour with:
+
+- `STACKONE_IMPLICIT_FEEDBACK_ENABLED` (`true`/`false`, defaults to `true` when an API key is present)
+- `STACKONE_IMPLICIT_FEEDBACK_PROJECT` to pin a LangSmith project name
+- `STACKONE_IMPLICIT_FEEDBACK_TAGS` with a comma-separated list of tags applied to every run
+
+### Manual configuration
+
+If you want custom session or user resolvers, call `configure_implicit_feedback` during start-up:
+
+```python
+from stackone_ai import configure_implicit_feedback
+
+configure_implicit_feedback(
+    api_key="<your-langsmith-api-key>",
+    project_name="stackone-agents",
+    default_tags=["python-sdk"],
+)
+```
+
+Providing your own `session_resolver`/`user_resolver` callbacks lets you derive identifiers from the request context before events are sent to LangSmith.
+
+### Attaching session context to tool calls
+
+Both `tool.execute` and `tool.call` accept an `options` keyword that is excluded from the API request but forwarded to the feedback manager:
+
+```python
+tool.execute(
+    {"id": "employee-id"},
+    options={
+        "feedback_session_id": "chat-42",
+        "feedback_user_id": "user-123",
+        "feedback_metadata": {"conversation_id": "abc"},
+    },
+)
+```
+
+When two calls to the same tool in the same session happen within a few seconds (12 by default), the SDK emits a `refinement_needed` event, and you can inspect suitability scores directly in LangSmith.
+
 ## Integration Examples
 
 <details>
@@ -148,6 +193,31 @@ result = crew.kickoff()
 
 </details>
 
+## Feedback Collection
+
+The SDK includes a feedback collection tool (`meta_collect_tool_feedback`) that allows users to submit feedback about their experience with StackOne tools. This tool is automatically included in the toolset and is designed to be invoked by AI agents after user permission.
+
+```python
+from stackone_ai import StackOneToolSet
+
+toolset = StackOneToolSet()
+
+# Get the feedback tool (included with "meta_*" pattern or all tools)
+tools = toolset.get_tools("meta_*")
+feedback_tool = tools.get_tool("meta_collect_tool_feedback")
+
+# Submit feedback (typically invoked by AI after user consent)
+result = feedback_tool.call(
+    feedback="The HRIS tools are working great! Very fast response times.",
+    account_id="acc_123456",
+    tool_names=["hris_list_employees", "hris_get_employee"]
+)
+```
+
+**Important**: The AI agent should always ask for user permission before submitting feedback:
+- "Are you ok with sending feedback to StackOne? The LLM will take care of sending it."
+- Only call the tool after the user explicitly agrees.
+
 ## Meta Tools (Beta)
 
 Meta tools enable dynamic tool discovery and execution without hardcoding tool names:
 
@@ -1,7 +1,14 @@
 """StackOne AI SDK"""
 
+from .implicit_feedback import configure_implicit_feedback, get_implicit_feedback_manager
 from .models import StackOneTool, Tools
 from .toolset import StackOneToolSet
 
-__all__ = ["StackOneToolSet", "StackOneTool", "Tools"]
+__all__ = [
+    "StackOneToolSet",
+    "StackOneTool",
+    "Tools",
+    "configure_implicit_feedback",
+    "get_implicit_feedback_manager",
+]
 __version__ = "0.3.2"
@@ -0,0 +1,5 @@
+"""Feedback collection tool for StackOne."""
+
+from .tool import create_feedback_tool
+
+__all__ = ["create_feedback_tool"]
@@ -0,0 +1,163 @@
+"""Feedback collection tool for StackOne."""
+
+# TODO: Remove when Python 3.9 support is dropped
+from __future__ import annotations
+
+import json
+
+from pydantic import BaseModel, Field, field_validator
+
+from ..models import (
+    ExecuteConfig,
+    JsonDict,
+    ParameterLocation,
+    StackOneError,
+    StackOneTool,
+    ToolParameters,
+)
+
+
+class FeedbackInput(BaseModel):
+    """Input schema for feedback tool."""
+
+    feedback: str = Field(..., min_length=1, description="User feedback text")
+    account_id: str = Field(..., min_length=1, description="Account identifier")
+    tool_names: list[str] = Field(..., min_length=1, description="List of tool names")
+
+    @field_validator("feedback", "account_id")
+    @classmethod
+    def validate_non_empty_trimmed(cls, v: str) -> str:
+        """Validate that string is non-empty after trimming."""
+        trimmed = v.strip()
+        if not trimmed:
+            raise ValueError("Field must be a non-empty string")
+        return trimmed
+
+    @field_validator("tool_names")
+    @classmethod
+    def validate_tool_names(cls, v: list[str]) -> list[str]:
+        """Validate and clean tool names."""
+        cleaned = [name.strip() for name in v if name.strip()]
+        if not cleaned:
+            raise ValueError("At least one tool name is required")
+        return cleaned
+
+
+class FeedbackTool(StackOneTool):
+    """Extended tool for collecting feedback with enhanced validation."""
+
+    def execute(
+        self, arguments: str | JsonDict | None = None, *, options: JsonDict | None = None
+    ) -> JsonDict:
+        """
+        Execute the feedback tool with enhanced validation.
+
+        Args:
+            arguments: Tool arguments as string or dict
+            options: Execution options
+
+        Returns:
+            Response from the API
+
+        Raises:
+            StackOneError: If validation or API call fails
+        """
+        try:
+            # Parse input
+            if isinstance(arguments, str):
+                raw_params = json.loads(arguments)
+            else:
+                raw_params = arguments or {}
+
+            # Validate with Pydantic
+            parsed_params = FeedbackInput(**raw_params)
+
+            # Build validated request body
+            validated_arguments = {
+                "feedback": parsed_params.feedback,
+                "account_id": parsed_params.account_id,
+                "tool_names": parsed_params.tool_names,
+            }
+
+            # Use the parent execute method with validated arguments
+            return super().execute(validated_arguments, options=options)
+
+        except json.JSONDecodeError as exc:
+            raise StackOneError(f"Invalid JSON in arguments: {exc}") from exc
+        except ValueError as exc:
+            raise StackOneError(f"Validation error: {exc}") from exc
+        except Exception as error:
+            if isinstance(error, StackOneError):
+                raise
+            raise StackOneError(f"Error executing feedback tool: {error}") from error
+
+
+def create_feedback_tool(
+    api_key: str,
+    account_id: str | None = None,
+    base_url: str = "https://api.stackone.com",
+) -> FeedbackTool:
+    """
+    Create a feedback collection tool.
+
+    Args:
+        api_key: API key for authentication
+        account_id: Optional account ID
+        base_url: Base URL for the API
+
+    Returns:
+        FeedbackTool configured for feedback collection
+    """
+    name = "meta_collect_tool_feedback"
+    description = (
+        "Collects user feedback on StackOne tool performance. "
+        "First ask the user, \"Are you ok with sending feedback to StackOne?\" "
+        "and mention that the LLM will take care of sending it. "
+        "Call this tool only when the user explicitly answers yes."
+    )
+
+    parameters = ToolParameters(
+        type="object",
+        properties={
+            "account_id": {
+                "type": "string",
+                "description": 'Account identifier (e.g., "acc_123456")',
+            },
+            "feedback": {
+                "type": "string",
+                "description": "Verbatim feedback from the user about their experience with StackOne tools.",
+            },
+            "tool_names": {
+                "type": "array",
+                "items": {
+                    "type": "string",
+                },
+                "description": "Array of tool names being reviewed",
+            },
+        },
+    )
+
+    execute_config = ExecuteConfig(
+        name=name,
+        method="POST",
+        url=f"{base_url}/ai/tool-feedback",
+        body_type="json",
+        parameter_locations={
+            "feedback": ParameterLocation.BODY,
+            "account_id": ParameterLocation.BODY,
+            "tool_names": ParameterLocation.BODY,
+        },
+    )
+
+    # Create instance by calling parent class __init__ directly since FeedbackTool is a subclass
+    tool = FeedbackTool.__new__(FeedbackTool)
+    StackOneTool.__init__(
+        tool,
+        description=description,
+        parameters=parameters,
+        _execute_config=execute_config,
+        _api_key=api_key,
+        _account_id=account_id,
+    )
+
+    return tool
@@ -0,0 +1,21 @@
+"""Implicit feedback instrumentation for the StackOne Python SDK."""
+
+from .analyzer import BehaviorAnalyzer, BehaviorAnalyzerConfig
+from .data import ImplicitFeedbackEvent, ToolCallQualitySignals, ToolCallRecord
+from .langsmith_client import LangsmithFeedbackClient
+from .manager import ImplicitFeedbackManager, configure_implicit_feedback, get_implicit_feedback_manager
+from .session import SessionTracker
+
+__all__ = [
+    "BehaviorAnalyzer",
+    "BehaviorAnalyzerConfig",
+    "ImplicitFeedbackEvent",
+    "ImplicitFeedbackManager",
+    "LangsmithFeedbackClient",
+    "SessionTracker",
+    "ToolCallQualitySignals",
+    "ToolCallRecord",
+    "configure_implicit_feedback",
+    "get_implicit_feedback_manager",
+]
+
@@ -0,0 +1,83 @@
+from __future__ import annotations
+
+from dataclasses import dataclass
+from typing import Sequence
+
+from .data import ToolCallQualitySignals, ToolCallRecord
+
+
+@dataclass(frozen=True)
+class BehaviorAnalyzerConfig:
+    """Immutable tuning values read by ``BehaviorAnalyzer``."""
+
+    # Maximum gap, in seconds, between the previous call's end and the current
+    # call's start for a repeat of the same tool to count as a quick refinement.
+    quick_refinement_window_seconds: float = 12.0
+    # How far back, in seconds, earlier calls are examined when looking for a
+    # call to a different tool (a task switch).
+    task_switch_window_seconds: float = 180.0
+    # Amount subtracted from the suitability score when status is not "success".
+    failure_penalty: float = 0.3
+    # Amount subtracted from the suitability score on a quick refinement.
+    quick_refinement_penalty: float = 0.25
+    # Amount subtracted from the suitability score on a task switch.
+    task_switch_penalty: float = 0.2
+
+
+class BehaviorAnalyzer:
+    """Derive behavioural quality signals from a stream of tool calls."""
+
+    def __init__(self, config: BehaviorAnalyzerConfig | None = None) -> None:
+        self._config = config or BehaviorAnalyzerConfig()
+
+    def analyze(self, history: Sequence[ToolCallRecord], current: ToolCallRecord) -> ToolCallQualitySignals:
+        """Compute quality signals for a tool call."""
+
+        session_history = [call for call in history if call.session_id == current.session_id and call.call_id != current.call_id]
+
+        quick_refinement, refinement_window = self._detect_quick_refinement(session_history, current)
+        task_switch = self._detect_task_switch(session_history, current)
+        suitability_score = self._compute_suitability_score(current.status, quick_refinement, task_switch)
+
+        return ToolCallQualitySignals(
+            quick_refinement=quick_refinement,
+            task_switch=task_switch,
+            suitability_score=suitability_score,
+            refinement_window_seconds=refinement_window,
+        )
+
+    def _detect_quick_refinement(
+        self, history: Sequence[ToolCallRecord], current: ToolCallRecord
+    ) -> tuple[bool, float | None]:
+        if not current.session_id or not history:
+            return False, None
+
+        last_event = history[-1]
+        elapsed = (current.start_time - last_event.end_time).total_seconds()
+        if elapsed < 0:
+            # Ignore out-of-order events
+            return False, None
+
+        if (
+            last_event.tool_name == current.tool_name
+            and elapsed <= self._config.quick_refinement_window_seconds
+        ):
+            return True, elapsed
+
+        return False, None
+
+    def _detect_task_switch(self, history: Sequence[ToolCallRecord], current: ToolCallRecord) -> bool:
+        if not current.session_id or not history:
+            return False
+
+        for previous in reversed(history):
+            elapsed = (current.start_time - previous.end_time).total_seconds()
+            if elapsed < 0:
+                continue
+            if elapsed > self._config.task_switch_window_seconds:
+                break
+            if previous.tool_name != current.tool_name:
+                return True
+
+        return False
+
+    def _compute_suitability_score(self, status: str, quick_refinement: bool, task_switch: bool) -> float:
+        score = 1.0
+        if status != "success":
+            score -= self._config.failure_penalty
+        if quick_refinement:
+            score -= self._config.quick_refinement_penalty
+        if task_switch:
+            score -= self._config.task_switch_penalty
+        return max(0.0, min(1.0, score))