.

arthurbrenno · arthurbrenno · commit 7ac31c273544 · 2025-10-22T16:15:17.000-03:00
diff --git a/.kiro/specs/responder-otel-integration/tasks.md b/.kiro/specs/responder-otel-integration/tasks.md
@@ -94,7 +94,7 @@
   - Store as instance attribute
   - _Requirements: 2.2, 2.3_
 
-- [x] 6.2 Update `from_openrouter` and `from_openai` class methods
+- [x] 6.2 Update `openrouter` and `openai` class methods
   - Pass pricing_service parameter through
   - _Requirements: 2.2, 2.3_
 
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -12,7 +12,7 @@
   - Comprehensive response streaming with `AsyncStream` implementation
   - Integration with `orjson` for improved JSON handling performance
   - Support for reasoning, background processing, and conversation management
-  - Factory methods for easy instantiation (`from_openrouter()`, `from_openai()`)
+  - Factory methods for easy instantiation (`openrouter()`, `openai()`)
 
 ### 🌐 **Web Extraction & Automation**
 - **feat(web)**: Complete web extraction and automation system
diff --git a/agentle/responses/pricing/default_pricing_service.py b/agentle/responses/pricing/default_pricing_service.py
@@ -242,6 +242,8 @@ class DefaultPricingService(BaseModel):
     Prices are approximate and based on publicly available pricing information.
     """
 
+    type: str = "default"
+
     def __init__(
         self,
         custom_pricing: dict[str, dict[str, dict[str, float]]] | None = None,
@@ -253,6 +255,7 @@ def __init__(
             custom_pricing: Optional dictionary to override or extend default pricing.
                            Format: {"model": {"modality": {"input": float, "cached_input": float, "output": float}}}
         """
+        super().__init__()
         self.pricing = MODEL_PRICING.copy()
         if custom_pricing:
             # Deep merge custom pricing
diff --git a/agentle/responses/pricing/openrouter_pricing_service.py b/agentle/responses/pricing/openrouter_pricing_service.py
@@ -0,0 +1,276 @@
+"""OpenRouter pricing service with dynamic pricing from API."""
+
+import logging
+import math
+import os
+from typing import Any, Literal
+
+import httpx
+from rsb.models.base_model import BaseModel
+
+from agentle.responses.pricing.modality import Modality
+
+logger = logging.getLogger(__name__)
+
+# OpenRouter quotes prices per token; this service reports them per million tokens.
+_TOKENS_PER_MILLION = 1_000_000
+
+
+def _per_token_to_per_million(raw_price: Any, field: str, model: str) -> float | None:
+    """
+    Convert a raw per-token price from the API into USD per million tokens.
+
+    Args:
+        raw_price: Price as found in the pricing payload (number, numeric string or None)
+        field: Name of the pricing field, used in log messages
+        model: The model identifier, used in log messages
+
+    Returns:
+        Price per million tokens, or None when the value is missing, unparseable,
+        non-finite or negative
+    """
+    if raw_price is None:
+        return None
+
+    try:
+        per_token = float(raw_price)
+    except (TypeError, ValueError):
+        logger.warning(
+            f"Could not parse {field} price '{raw_price}' for model {model}"
+        )
+        return None
+
+    # A negative or non-finite value cannot be a real price; report it as unknown so
+    # downstream cost calculations never go negative.
+    # NOTE(review): OpenRouter appears to publish negative sentinels such as "-1" for
+    # variably-priced router models - confirm against the /models payload.
+    if not math.isfinite(per_token) or per_token < 0:
+        logger.debug(
+            f"Ignoring unusable {field} price '{raw_price}' for model {model}"
+        )
+        return None
+
+    return per_token * _TOKENS_PER_MILLION
+
+
+class OpenRouterPricingService(BaseModel):
+    """
+    OpenRouter implementation of PricingService using dynamic pricing from API.
+
+    This service fetches pricing information from OpenRouter's /models API endpoint
+    and caches it for performance. Pricing is fetched lazily on first request.
+
+    The OpenRouter API returns pricing per token, which is converted to per million tokens
+    for consistency with other pricing services.
+
+    Price lookups are best-effort: failures are logged and reported as None
+    (unknown price) instead of being raised.
+
+    Attributes:
+        type: Discriminator tag identifying this service in the PricingService union
+        api_key: OpenRouter API key for authentication
+        base_url: Base URL for OpenRouter API (defaults to https://openrouter.ai/api/v1)
+        http_client: Optional custom HTTP client for requests
+        _models_cache: Internal cache of model pricing data
+    """
+
+    # Literal rather than plain str: pydantic requires the discriminator field
+    # of a tagged union to be a Literal.
+    type: Literal["openrouter"] = "openrouter"
+    api_key: str | None = None
+    base_url: str = "https://openrouter.ai/api/v1"
+    http_client: httpx.AsyncClient | None = None
+    _models_cache: dict[str, dict[str, Any]] | None = None
+
+    def __init__(
+        self,
+        api_key: str | None = None,
+        base_url: str = "https://openrouter.ai/api/v1",
+        http_client: httpx.AsyncClient | None = None,
+    ):
+        """
+        Initialize the OpenRouter pricing service.
+
+        Args:
+            api_key: OpenRouter API key. If not provided, the OPENROUTER_API_KEY
+                env var is read when models are first fetched.
+            base_url: Base URL for OpenRouter API
+            http_client: Optional custom HTTP client for requests. A client passed
+                here is reused and never closed by this service.
+        """
+        super().__init__()
+        self.api_key = api_key
+        self.base_url = base_url
+        self.http_client = http_client
+        self._models_cache = None
+
+    async def _fetch_models(self) -> dict[str, dict[str, Any]]:
+        """
+        Fetch available models from OpenRouter API and cache them.
+
+        Request and parsing failures are not raised. A missing API key or a failed
+        request is logged and cached as an empty mapping, so the API is not queried
+        again until clear_cache() is called.
+
+        Returns:
+            Dictionary mapping model IDs to model information including pricing
+            (empty when the models could not be fetched)
+        """
+        if self._models_cache is not None:
+            return self._models_cache
+
+        # Get API key from instance or environment
+        _api_key = self.api_key or os.getenv("OPENROUTER_API_KEY")
+        if not _api_key:
+            logger.warning(
+                "No OpenRouter API key provided, pricing will not be available"
+            )
+            self._models_cache = {}
+            return self._models_cache
+
+        headers = {
+            "Authorization": f"Bearer {_api_key}",
+            "Content-Type": "application/json",
+        }
+
+        # Tolerate a base_url configured with a trailing slash
+        models_url = self.base_url.rstrip("/") + "/models"
+        client = self.http_client or httpx.AsyncClient()
+
+        try:
+            response = await client.get(models_url, headers=headers, timeout=30.0)
+            response.raise_for_status()
+
+            models_response = response.json()
+            # Skip malformed entries instead of failing the whole fetch on one of them
+            self._models_cache = {
+                entry["id"]: entry
+                for entry in models_response.get("data") or []
+                if isinstance(entry, dict) and "id" in entry
+            }
+
+            logger.debug(
+                f"Fetched pricing for {len(self._models_cache)} models from OpenRouter"
+            )
+
+            return self._models_cache
+        except Exception as e:
+            logger.warning(f"Failed to fetch models from OpenRouter: {e}")
+            # Return empty cache on failure
+            self._models_cache = {}
+            return self._models_cache
+        finally:
+            # Only close a client created here; a caller-supplied one stays open
+            if self.http_client is None:
+                await client.aclose()
+
+    async def _get_model_pricing(self, model: str) -> dict[str, Any] | None:
+        """
+        Look up the raw pricing mapping for a model.
+
+        Args:
+            model: The model identifier (e.g., "anthropic/claude-3-opus")
+
+        Returns:
+            The model's "pricing" mapping (empty if the model has none), or None
+            if the model is not in the fetched models list
+        """
+        models = await self._fetch_models()
+
+        model_info = models.get(model)
+        if model_info is None:
+            logger.debug(
+                f"OpenRouter model '{model}' not found in models list. Available models: {len(models)}"
+            )
+            return None
+
+        pricing = model_info.get("pricing")
+        return pricing if isinstance(pricing, dict) else {}
+
+    async def get_input_price_per_million(
+        self,
+        model: str,
+        modality: Modality = "text",
+        cached: bool = False,
+    ) -> float | None:
+        """
+        Get the input token price per million tokens for a given model.
+
+        Fetches pricing from OpenRouter's /models API endpoint and converts
+        from per-token to per-million-tokens pricing.
+
+        Args:
+            model: The model identifier (e.g., "anthropic/claude-3-opus")
+            modality: The type of input ("text", "image", "audio", "video")
+                     Note: not used to select a price; the "prompt" price is returned
+            cached: Whether this is cached input (for models that support caching)
+                   Note: uses the input_cache_read price when the model has one,
+                   otherwise falls back to the regular prompt price
+
+        Returns:
+            Price per million input tokens in USD, or None if pricing is unknown
+            (model not listed, or price missing, unparseable or negative)
+        """
+        try:
+            pricing = await self._get_model_pricing(model)
+            if pricing is None:
+                return None
+
+            # Handle cached input pricing if requested
+            if cached:
+                input_cache_read = pricing.get("input_cache_read")
+                if input_cache_read is not None:
+                    return _per_token_to_per_million(
+                        input_cache_read, "input_cache_read", model
+                    )
+
+            # Get standard prompt pricing
+            return _per_token_to_per_million(pricing.get("prompt"), "prompt", model)
+
+        except Exception as e:
+            logger.error(
+                f"Error fetching input pricing for model {model}: {e}. Returning None"
+            )
+            return None
+
+    async def get_output_price_per_million(
+        self, model: str, modality: Modality = "text"
+    ) -> float | None:
+        """
+        Get the output token price per million tokens for a given model.
+
+        Fetches pricing from OpenRouter's /models API endpoint and converts
+        from per-token to per-million-tokens pricing.
+
+        Args:
+            model: The model identifier (e.g., "anthropic/claude-3-opus")
+            modality: The type of output ("text", "image", "audio", "video")
+                     Note: not used to select a price; the "completion" price is returned
+
+        Returns:
+            Price per million output tokens in USD, or None if pricing is unknown
+            (model not listed, or price missing, unparseable or negative)
+        """
+        try:
+            pricing = await self._get_model_pricing(model)
+            if pricing is None:
+                return None
+
+            return _per_token_to_per_million(
+                pricing.get("completion"), "completion", model
+            )
+
+        except Exception as e:
+            logger.error(
+                f"Error fetching output pricing for model {model}: {e}. Returning None"
+            )
+            return None
+
+    def clear_cache(self) -> None:
+        """
+        Clear the cached model pricing data.
+
+        Useful for forcing a refresh of pricing information from the API.
+        """
+        self._models_cache = None
+        logger.debug("Cleared OpenRouter pricing cache")
diff --git a/agentle/responses/pricing/pricing_service.py b/agentle/responses/pricing/pricing_service.py
@@ -5,9 +5,12 @@
 from pydantic import Field
 
 from agentle.responses.pricing.default_pricing_service import DefaultPricingService
+from agentle.responses.pricing.openrouter_pricing_service import (
+    OpenRouterPricingService,
+)
 
 # Discriminated union type for all pricing service configurations
 PricingService = Annotated[
-    Union[DefaultPricingService],
+    Union[DefaultPricingService, OpenRouterPricingService],
     Field(discriminator="type"),
 ]
diff --git a/agentle/responses/responder.py b/agentle/responses/responder.py
@@ -48,6 +48,9 @@
 )
 from agentle.responses.definitions.tool_choice_types import ToolChoiceTypes
 from agentle.responses.definitions.truncation import Truncation
+from agentle.responses.pricing.openrouter_pricing_service import (
+    OpenRouterPricingService,
+)
 from agentle.responses.pricing.pricing_service import PricingService
 
 logger = logging.getLogger(__name__)
@@ -82,7 +85,7 @@ class Responder(BaseModel):
             base_url.
 
         base_url: Base URL for the API endpoint. Defaults to OpenRouter's API endpoint.
-            Use from_openrouter() or from_openai() class methods for convenience.
+            Use openrouter() or openai() class methods for convenience.
 
         pricing_service: Service for looking up model pricing to calculate costs.
             Defaults to DefaultPricingService which includes pricing for common models.
@@ -108,7 +111,7 @@ class Responder(BaseModel):
 
     Example:
         Basic usage without tracing:
-        >>> responder = Responder.from_openrouter(api_key="your-key")
+        >>> responder = Responder.openrouter(api_key="your-key")
         >>> response = await responder.respond_async(
         ...     input="What is the capital of France?",
         ...     model="openai/gpt-4"
@@ -117,15 +120,15 @@ class Responder(BaseModel):
         With observability integration:
         >>> from agentle.generations.tracing.langfuse_otel_client import LangfuseOtelClient
         >>> otel_client = LangfuseOtelClient()
-        >>> responder = Responder.from_openrouter(otel_clients=[otel_client])
+        >>> responder = Responder.openrouter(otel_clients=[otel_client])
         >>> response = await responder.respond_async(
         ...     input="What is the capital of France?",
         ...     model="openai/gpt-4"
         ... )
         # Automatically traces the request with usage and cost metrics
 
         Adding observability dynamically:
-        >>> responder = Responder.from_openrouter()
+        >>> responder = Responder.openrouter()
         >>> # Later, add observability
         >>> otel_client = LangfuseOtelClient()
         >>> responder.append_otel_client(otel_client)
@@ -164,10 +167,9 @@ class Responder(BaseModel):
     )
 
     @classmethod
-    def from_openrouter(
+    def openrouter(
         cls,
         api_key: str | None = None,
-        pricing_service: PricingService | None = None,
         otel_clients: Sequence[OtelClientType] | None = None,
     ) -> Responder:
         """
@@ -181,33 +183,25 @@ def from_openrouter(
         Returns:
             Configured Responder instance for OpenRouter.
         """
-        if pricing_service is not None and otel_clients is not None:
+        # Costs are priced from OpenRouter's own /models data. Forward the explicit
+        # api_key so pricing also works when OPENROUTER_API_KEY is not set.
+        pricing_service = OpenRouterPricingService(api_key=api_key)
+        if otel_clients is not None:
             return cls(
                 api_key=api_key or os.getenv("OPENROUTER_API_KEY"),
                 base_url="https://openrouter.ai/api/v1",
                 pricing_service=pricing_service,
                 otel_clients=list(otel_clients),
             )
-        elif pricing_service is not None:
-            return cls(
-                api_key=api_key or os.getenv("OPENROUTER_API_KEY"),
-                base_url="https://openrouter.ai/api/v1",
-                pricing_service=pricing_service,
-            )
-        elif otel_clients is not None:
-            return cls(
-                api_key=api_key or os.getenv("OPENROUTER_API_KEY"),
-                base_url="https://openrouter.ai/api/v1",
-                otel_clients=list(otel_clients),
-            )
         else:
             return cls(
                 api_key=api_key or os.getenv("OPENROUTER_API_KEY"),
                 base_url="https://openrouter.ai/api/v1",
+                pricing_service=pricing_service,
             )
 
     @classmethod
-    def from_openai(
+    def openai(
         cls,
         api_key: str | None = None,
         pricing_service: PricingService | None = None,
@@ -260,7 +251,7 @@ def append_otel_client(self, client: OtelClientType) -> None:
             client: An OtelClient instance to add to the responder's client list.
 
         Example:
-            >>> responder = Responder.from_openrouter()
+            >>> responder = Responder.openrouter()
             >>> langfuse_client = LangfuseOtelClient()
             >>> responder.append_otel_client(langfuse_client)
             >>> # Now all API calls will be traced to Langfuse
diff --git a/agentle/web/extractor.py b/agentle/web/extractor.py
diff --git a/examples/openrouter_responses_example.py b/examples/openrouter_responses_example.py