Skip to content

Commit 8ae9cb3

Browse files
committed
Merge remote-tracking branch 'origin/main' into feat/math-validation-agent
# Conflicts: # engine/config/.env.example # engine/src/stirling/api/app.py
2 parents 8aad9a1 + 2bf5f0b commit 8ae9cb3

15 files changed

Lines changed: 397 additions & 112 deletions

.gitignore

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -255,3 +255,6 @@ docs/type3/signatures/
255255

256256
# Type3 sample PDFs (development only)
257257
**/type3/samples/
258+
259+
# Claude
260+
.claude/

engine/config/.env.example

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,11 @@ STIRLING_FAST_MODEL=anthropic:claude-haiku-4-5
88
STIRLING_SMART_MODEL_MAX_TOKENS=8192
99
STIRLING_FAST_MODEL_MAX_TOKENS=2048
1010

11+
# PostHog analytics. Set STIRLING_POSTHOG_ENABLED=true and provide an API key to enable.
12+
STIRLING_POSTHOG_ENABLED=false
13+
# NOTE(review): PostHog phc_ project keys are client-side/public, but the example file should ship a placeholder, not a real project's key.
STIRLING_POSTHOG_API_KEY=phc_your_project_api_key_here
14+
STIRLING_POSTHOG_HOST=https://eu.i.posthog.com
15+
1116
# Log level for the stirling logger hierarchy (DEBUG, INFO, WARNING, ERROR)
1217
STIRLING_LOG_LEVEL=INFO
1318

engine/pyproject.toml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,8 @@ dependencies = [
1010
"pydantic-settings>=2.0.0",
1111
"python-dotenv>=1.2.1",
1212
"uvicorn>=0.35.0",
13+
"opentelemetry-sdk>=1.39.0",
14+
"posthog>=3.0.0",
1315
]
1416

1517
[dependency-groups]

engine/src/stirling/api/app.py

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,9 +4,12 @@
44
from typing import Annotated
55

66
from fastapi import Depends, FastAPI
7+
from pydantic_ai import Agent
8+
from pydantic_ai.models.instrumented import InstrumentationSettings
79

810
from stirling.agents import ExecutionPlanningAgent, OrchestratorAgent, PdfEditAgent, PdfQuestionAgent, UserSpecAgent
911
from stirling.agents.ledger import MathAuditorAgent
12+
from stirling.api.middleware import UserIdMiddleware
1013
from stirling.api.routes import (
1114
agent_draft_router,
1215
execution_router,
@@ -17,7 +20,7 @@
1720
)
1821
from stirling.config import AppSettings, load_settings
1922
from stirling.contracts import HealthResponse
20-
from stirling.services import build_runtime
23+
from stirling.services import build_runtime, setup_posthog_tracking
2124

2225

2326
def _load_startup_settings(fast_api: FastAPI) -> AppSettings:
@@ -40,10 +43,16 @@ async def lifespan(fast_api: FastAPI):
4043
fast_api.state.user_spec_agent = UserSpecAgent(runtime)
4144
fast_api.state.execution_planning_agent = ExecutionPlanningAgent(runtime)
4245
fast_api.state.math_auditor_agent = MathAuditorAgent(runtime)
46+
tracer_provider = setup_posthog_tracking(settings)
47+
if tracer_provider:
48+
Agent.instrument_all(InstrumentationSettings(tracer_provider=tracer_provider))
4349
yield
50+
if tracer_provider:
51+
tracer_provider.shutdown()
4452

4553

4654
app = FastAPI(title="Stirling AI Engine", lifespan=lifespan, version="0.1.0")
55+
app.add_middleware(UserIdMiddleware)
4756
app.include_router(orchestrator_router)
4857
app.include_router(pdf_edit_router)
4958
app.include_router(pdf_question_router)
Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
from __future__ import annotations
2+
3+
from starlette.middleware.base import BaseHTTPMiddleware, RequestResponseEndpoint
4+
from starlette.requests import Request
5+
from starlette.responses import Response
6+
7+
from stirling.services.tracking import current_user_id
8+
9+
_USER_ID_HEADER = "X-User-Id"
10+
11+
12+
class UserIdMiddleware(BaseHTTPMiddleware):
    """Extract X-User-Id header and set it as the current user for PostHog tracking."""

    async def dispatch(self, request: Request, call_next: RequestResponseEndpoint) -> Response:
        header_value = request.headers.get(_USER_ID_HEADER)
        if not header_value:
            # No caller-supplied user ID: leave the contextvar untouched for this request.
            return await call_next(request)
        token = current_user_id.set(header_value)
        try:
            return await call_next(request)
        finally:
            # Restore the previous value so the user ID never leaks into another request.
            current_user_id.reset(token)

engine/src/stirling/config/settings.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -50,6 +50,10 @@ def _configure_logging(level_name: str, log_file: str) -> None:
5050
fh.setLevel(level)
5151
root.addHandler(fh)
5252

53+
posthog_enabled: bool = Field(validation_alias="STIRLING_POSTHOG_ENABLED")
54+
posthog_api_key: str = Field(validation_alias="STIRLING_POSTHOG_API_KEY")
55+
posthog_host: str = Field(validation_alias="STIRLING_POSTHOG_HOST")
56+
5357

5458
@lru_cache(maxsize=1)
5559
def load_settings() -> AppSettings:
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,11 @@
11
"""Shared services used by the Stirling AI runtime."""
22

33
from .runtime import AppRuntime, build_model_settings, build_runtime
4+
from .tracking import setup_posthog_tracking
45

56
__all__ = [
67
"AppRuntime",
78
"build_model_settings",
89
"build_runtime",
10+
"setup_posthog_tracking",
911
]
Lines changed: 233 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,233 @@
1+
from __future__ import annotations
2+
3+
import json
4+
from collections import OrderedDict
5+
from collections.abc import Mapping
6+
from contextvars import ContextVar
7+
from typing import Any
8+
9+
from opentelemetry.context import Context
10+
from opentelemetry.sdk.trace import ReadableSpan, SpanProcessor, TracerProvider
11+
from opentelemetry.semconv._incubating.attributes.gen_ai_attributes import ( # No public import for these constants yet
12+
GEN_AI_INPUT_MESSAGES,
13+
GEN_AI_OPERATION_NAME,
14+
GEN_AI_OUTPUT_MESSAGES,
15+
GEN_AI_REQUEST_MAX_TOKENS,
16+
GEN_AI_REQUEST_MODEL,
17+
GEN_AI_REQUEST_TEMPERATURE,
18+
GEN_AI_RESPONSE_MODEL,
19+
GEN_AI_SYSTEM,
20+
GEN_AI_TOOL_DEFINITIONS,
21+
GEN_AI_USAGE_INPUT_TOKENS,
22+
GEN_AI_USAGE_OUTPUT_TOKENS,
23+
GenAiOperationNameValues,
24+
)
25+
from opentelemetry.semconv.attributes.server_attributes import SERVER_ADDRESS, SERVER_PORT
26+
from opentelemetry.trace import Span
27+
from posthog.client import Client as PostHogClient
28+
29+
from stirling.config import AppSettings
30+
31+
# Per-request user ID, set by middleware from the X-User-Id header.
32+
# When not set, PostHog generates a random ID and marks the event as personless.
33+
current_user_id: ContextVar[str | None] = ContextVar("current_user_id", default=None)
34+
35+
36+
class LRUSet:
    """Least Recently Used Set: a set with a maximum size that evicts the oldest entries first.

    Backed by an ``OrderedDict`` whose insertion order tracks recency: the front is the
    least recently used entry and is the one evicted when the set overflows.
    """

    def __init__(self, max_size: int) -> None:
        self._max_size = max_size
        self._data: OrderedDict[str, None] = OrderedDict()

    def __contains__(self, key: str) -> bool:
        return key in self._data

    def add(self, key: str) -> None:
        """Insert *key* (or refresh its recency), evicting the oldest entry on overflow."""
        self._data[key] = None
        # Assigning to an existing OrderedDict key keeps its old position, so an
        # explicit move_to_end is required for re-adds to actually refresh recency.
        self._data.move_to_end(key)
        if len(self._data) > self._max_size:
            self._data.popitem(last=False)
50+
51+
52+
def _parse_json_attr(attrs: Mapping[str, Any], key: str) -> Any | None:
53+
"""Parse a JSON string span attribute, returning None on failure."""
54+
raw = attrs.get(key)
55+
if raw is None:
56+
return None
57+
try:
58+
return json.loads(str(raw))
59+
except (json.JSONDecodeError, TypeError):
60+
return None
61+
62+
63+
def _transform_output_choices(choices: list[Any]) -> list[Any]:
64+
"""Transform Pydantic AI's parts-based output format to PostHog-compatible format.
65+
66+
Pydantic AI emits: ``[{"role": "assistant", "parts": [{"type": "tool_call", "name": "..."}]}]``
67+
PostHog expects: ``[{"role": "assistant", "tool_calls": [{"type": "function", "function": {"name": "..."}}]}]``
68+
"""
69+
for choice in choices:
70+
if not isinstance(choice, dict) or "parts" not in choice:
71+
continue
72+
tool_calls = []
73+
for part in choice.get("parts", []):
74+
if isinstance(part, dict) and part.get("type") == "tool_call":
75+
tool_calls.append(
76+
{
77+
"type": "function",
78+
"id": part.get("id", ""),
79+
"function": {"name": part.get("name", "")},
80+
}
81+
)
82+
if tool_calls:
83+
choice["tool_calls"] = tool_calls
84+
choice["content"] = choice.pop("parts")
85+
return choices
86+
87+
88+
def _extract_user_message(attrs: Mapping[str, Any]) -> str:
    """Return the text of the most recent user message in the input-messages attribute, or ""."""
    messages = _parse_json_attr(attrs, GEN_AI_INPUT_MESSAGES)
    if not isinstance(messages, list):
        return ""
    # Walk newest-to-oldest; the first user message containing a text part wins.
    user_messages = (
        message
        for message in reversed(messages)
        if isinstance(message, dict) and message.get("role") == "user"
    )
    for message in user_messages:
        for part in message.get("parts", []):
            if isinstance(part, dict) and part.get("type") == "text":
                return str(part.get("content", ""))
    return ""
101+
102+
103+
# TODO: Replace with an official PostHog integration if one ever exists
104+
class PostHogSpanProcessor(SpanProcessor):
    """Translates Pydantic AI OpenTelemetry spans into PostHog $ai_generation events."""

    def __init__(self, client: PostHogClient) -> None:
        # PostHog client used for all event capture; owned by this processor
        # (shutdown() below shuts the client down too).
        self._client = client
        # Bounded memory of trace IDs for which an $ai_trace event was already
        # emitted — bounded so long-running processes don't grow without limit.
        self._seen_traces = LRUSet(max_size=10_000)

    def on_start(self, span: Span, parent_context: Context | None = None) -> None:
        """No-op: all data of interest is only available once the span has ended."""
        pass

    def on_end(self, span: ReadableSpan) -> None:
        """Capture a PostHog $ai_generation event for every finished chat span.

        Non-chat spans (tool runs, agent wrappers, etc.) are ignored.
        """
        attrs = dict(span.attributes or {})
        if attrs.get(GEN_AI_OPERATION_NAME) != GenAiOperationNameValues.CHAT.value:
            return

        # Emit the per-trace event (if this is the first span of its trace)
        # before the generation event itself.
        properties = self._build_generation_properties(span, attrs)
        self._maybe_emit_trace_event(span, attrs, properties)
        self._client.capture(
            # NOTE(review): relies on the request's contextvar still being active
            # when the span ends — confirm spans always end within the request
            # context; otherwise events are captured as personless.
            distinct_id=current_user_id.get(),
            event="$ai_generation",
            properties=properties,
        )

    def _build_generation_properties(self, span: ReadableSpan, attrs: Mapping[str, Any]) -> dict[str, object]:
        """Build the $ai_generation event properties from span data."""
        properties: dict[str, object] = {
            "$ai_provider": attrs.get(GEN_AI_SYSTEM, ""),
            # Prefer the model the provider reports over the one that was requested.
            "$ai_model": attrs.get(GEN_AI_RESPONSE_MODEL) or attrs.get(GEN_AI_REQUEST_MODEL, ""),
            "$ai_input_tokens": attrs.get(GEN_AI_USAGE_INPUT_TOKENS, 0),
            "$ai_output_tokens": attrs.get(GEN_AI_USAGE_OUTPUT_TOKENS, 0),
        }

        # Hex-format trace/span IDs the way OTel conventionally renders them
        # (128-bit trace, 64-bit span).
        if span.context:
            properties["$ai_trace_id"] = format(span.context.trace_id, "032x")
            properties["$ai_span_id"] = format(span.context.span_id, "016x")
        if span.parent and span.parent.span_id:
            properties["$ai_parent_id"] = format(span.parent.span_id, "016x")
        if span.start_time and span.end_time:
            # OTel timestamps are integer nanoseconds; PostHog expects seconds.
            properties["$ai_latency"] = (span.end_time - span.start_time) / 1e9

        self._add_message_properties(properties, attrs)
        self._add_model_parameters(properties, attrs)
        self._add_tool_definitions(properties, attrs)
        self._add_base_url(properties, attrs)

        return properties

    def _maybe_emit_trace_event(
        self, span: ReadableSpan, attrs: Mapping[str, Any], properties: dict[str, object]
    ) -> None:
        """Emit an $ai_trace event for the first span seen per trace ID."""
        trace_id = str(properties.get("$ai_trace_id", ""))
        if not trace_id or trace_id in self._seen_traces:
            return

        self._seen_traces.add(trace_id)
        trace_properties: dict[str, object] = {
            "$ai_trace_id": trace_id,
            # The trace is named after the last user message of its first chat span.
            "$ai_trace_name": _extract_user_message(attrs),
            "$ai_provider": attrs.get(GEN_AI_SYSTEM, ""),
        }
        # NOTE(review): this is the latency of the first chat span only, not of
        # the whole trace — later spans of the same trace never update it.
        if span.start_time and span.end_time:
            trace_properties["$ai_latency"] = (span.end_time - span.start_time) / 1e9
        self._client.capture(
            distinct_id=current_user_id.get(),
            event="$ai_trace",
            properties=trace_properties,
        )

    @staticmethod
    def _add_message_properties(properties: dict[str, object], attrs: Mapping[str, Any]) -> None:
        """Attach input messages and output choices parsed from the span's JSON attributes."""
        input_messages = _parse_json_attr(attrs, GEN_AI_INPUT_MESSAGES)
        if input_messages is not None:
            properties["$ai_input"] = input_messages

        output_messages = _parse_json_attr(attrs, GEN_AI_OUTPUT_MESSAGES)
        if isinstance(output_messages, list):
            # Lists get the parts -> tool_calls/content reshaping PostHog expects.
            properties["$ai_output_choices"] = _transform_output_choices(output_messages)
        elif output_messages is not None:
            properties["$ai_output_choices"] = output_messages

    @staticmethod
    def _add_model_parameters(properties: dict[str, object], attrs: Mapping[str, Any]) -> None:
        """Attach request-time model parameters (temperature, max tokens) when present."""
        model_parameters: dict[str, object] = {}
        if GEN_AI_REQUEST_TEMPERATURE in attrs:
            model_parameters["temperature"] = attrs[GEN_AI_REQUEST_TEMPERATURE]
        if GEN_AI_REQUEST_MAX_TOKENS in attrs:
            model_parameters["max_tokens"] = attrs[GEN_AI_REQUEST_MAX_TOKENS]
        if model_parameters:
            properties["$ai_model_parameters"] = model_parameters

    @staticmethod
    def _add_tool_definitions(properties: dict[str, object], attrs: Mapping[str, Any]) -> None:
        """Attach the tool definitions offered to the model, when the span recorded them."""
        tools = _parse_json_attr(attrs, GEN_AI_TOOL_DEFINITIONS)
        if tools is not None:
            properties["$ai_tools"] = tools

    @staticmethod
    def _add_base_url(properties: dict[str, object], attrs: Mapping[str, Any]) -> None:
        """Attach "host" or "host:port" as the base URL, from the span's server attributes."""
        parts: list[str] = []
        if host := attrs.get(SERVER_ADDRESS):
            parts.append(str(host))
        if port := attrs.get(SERVER_PORT):
            parts.append(str(port))
        if parts:
            properties["$ai_base_url"] = ":".join(parts)

    def shutdown(self) -> None:
        """Shut down the underlying PostHog client (flushes pending events)."""
        self._client.shutdown()

    def force_flush(self, timeout_millis: int = 30000) -> bool:
        """Flush buffered events. timeout_millis is accepted for interface
        compatibility but not honored — the client flush has no timeout hook."""
        self._client.flush()
        return True
217+
218+
219+
def setup_posthog_tracking(settings: AppSettings) -> TracerProvider | None:
    """Configure OpenTelemetry with a PostHog span processor for LLM analytics.

    Returns the TracerProvider so it can be shut down on app exit,
    or None when tracking is disabled.
    """
    # Tracking requires both the feature flag and a non-empty API key.
    if not (settings.posthog_enabled and settings.posthog_api_key):
        return None

    provider = TracerProvider()
    client = PostHogClient(project_api_key=settings.posthog_api_key, host=settings.posthog_host)
    provider.add_span_processor(PostHogSpanProcessor(client))
    return provider

engine/tests/conftest.py

Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
from __future__ import annotations
2+
3+
from collections.abc import Iterator
4+
5+
import pytest
6+
7+
from stirling.config import AppSettings, load_settings
8+
from stirling.services import build_runtime
9+
from stirling.services.runtime import AppRuntime
10+
11+
12+
@pytest.fixture(autouse=True)
def clear_settings_cache() -> Iterator[None]:
    """Drop the lru_cache on load_settings before and after every test for isolation."""

    def _reset() -> None:
        load_settings.cache_clear()

    _reset()
    yield
    _reset()
17+
18+
19+
def build_app_settings() -> AppSettings:
    """Construct AppSettings with deterministic test values (PostHog disabled)."""
    test_values: dict[str, object] = {
        "smart_model_name": "test",
        "fast_model_name": "test",
        "smart_model_max_tokens": 8192,
        "fast_model_max_tokens": 2048,
        "posthog_enabled": False,
        "posthog_api_key": "",
        "posthog_host": "https://eu.i.posthog.com",
    }
    return AppSettings(**test_values)
29+
30+
31+
@pytest.fixture
def app_settings() -> AppSettings:
    """Fresh test AppSettings for each test that requests it."""
    settings = build_app_settings()
    return settings
34+
35+
36+
@pytest.fixture
def runtime(app_settings: AppSettings) -> AppRuntime:
    """An AppRuntime wired from the test AppSettings fixture."""
    built = build_runtime(app_settings)
    return built

0 commit comments

Comments
 (0)