andrewyng · rohitprasad15 · Oct 14, 2025 · Oct 14, 2025 · Oct 14, 2025 · Oct 14, 2025
diff --git a/aisuite/client.py b/aisuite/client.py
@@ -1,15 +1,19 @@
 from .provider import ProviderFactory
 import os
 from .utils.tools import Tools
-from typing import Union, BinaryIO, Optional, Any
+from typing import Union, BinaryIO, Optional, Any, Literal
 from .framework.message import (
-    TranscriptionOptions,
     TranscriptionResponse,
 )
+from .framework.asr_params import ParamValidator
 
 
 class Client:
-    def __init__(self, provider_configs: dict = {}):
+    def __init__(
+        self,
+        provider_configs: dict = {},
+        extra_param_mode: Literal["strict", "warn", "permissive"] = "warn",
+    ):
         """
         Initialize the client with provider configurations.
         Use the ProviderFactory to create provider instances.
@@ -27,9 +31,15 @@ def __init__(self, provider_configs: dict = {}):
                         "aws_region": "us-west-2"
                     }
                 }
+            extra_param_mode (str): How to handle unknown ASR parameters.
+                - "strict": Raise ValueError on unknown params (production)
+                - "warn": Log warning on unknown params (default, development)
+                - "permissive": Allow all params without validation (testing)
         """
         self.providers = {}
         self.provider_configs = provider_configs
+        self.extra_param_mode = extra_param_mode
+        self.param_validator = ParamValidator(extra_param_mode)
         self._chat = None
         self._audio = None
 
@@ -282,51 +292,73 @@ def create(
         *,
         model: str,
         file: Union[str, BinaryIO],
-        options: Optional[TranscriptionOptions] = None,
         **kwargs,
     ) -> TranscriptionResponse:
         """
-        Create a transcription using the specified model and file.
+        Create audio transcription with parameter validation.
+
+        This method uses a pass-through approach with validation:
+        - Common parameters (OpenAI-style) are auto-mapped to provider equivalents
+        - Provider-specific parameters are passed through directly
+        - Unknown parameters are handled based on extra_param_mode
 
         Args:
             model: Provider and model in format 'provider:model' (e.g., 'openai:whisper-1')
             file: Audio file to transcribe (file path or file-like object)
-            options: TranscriptionOptions instance with unified parameters (includes stream control)
-            **kwargs: Additional parameters (used if options is None, assumed to be OpenAI format)
+            **kwargs: Transcription parameters (provider-specific or common)
+                Common parameters (portable across providers):
+                    - language: Language code (e.g., "en")
+                    - prompt: Context for the transcription
+                    - temperature: Sampling temperature (0-1, OpenAI only)
+                Provider-specific parameters are passed through directly.
+                See provider documentation for valid parameters.
 
         Returns:
-            TranscriptionResponse: Unified response (batch or streaming based on options.stream)
+            TranscriptionResponse: Unified response (batch or streaming)
+
+        Raises:
+            ValueError: If model format invalid, provider not supported,
+                       or unknown params in strict mode
+
+        Examples:
+            # Portable code (OpenAI-style params)
+            >>> result = client.audio.transcriptions.create(
+            ...     model="openai:whisper-1",
+            ...     file="audio.mp3",
+            ...     language="en"
+            ... )
+
+            # Provider-specific features
+            >>> result = client.audio.transcriptions.create(
+            ...     model="deepgram:nova-2",
+            ...     file="audio.mp3",
+            ...     language="en",  # Common param
+            ...     punctuate=True,  # Deepgram-specific
+            ...     diarize=True     # Deepgram-specific
+            ... )
         """
-        # Validate options and kwargs
-        if options is not None:
-            if not options.has_any_parameters():
-                raise ValueError(
-                    "TranscriptionOptions provided but no parameters are set. "
-                    "Please set at least one parameter or pass None to use kwargs."
-                )
-            # TranscriptionOptions takes precedence, ignore kwargs
-            if kwargs:
-                import warnings
-
-                warnings.warn(
-                    "Both TranscriptionOptions and kwargs provided. Using TranscriptionOptions and ignoring kwargs.",
-                    UserWarning,
-                )
-        elif not kwargs:
-            # Neither options nor kwargs provided
-            raise ValueError(
-                "Either TranscriptionOptions or kwargs must be provided for transcription parameters."
-            )
-
-        # Check that correct format is used
+        # Validate model format
         if ":" not in model:
             raise ValueError(
                 f"Invalid model format. Expected 'provider:model', got '{model}'"
             )
 
-        # Extract the provider key from the model identifier
+        # Extract provider and model name
         provider_key, model_name = model.split(":", 1)
 
+        # Validate provider is supported
+        supported_providers = ProviderFactory.get_supported_providers()
+        if provider_key not in supported_providers:
+            raise ValueError(
+                f"Invalid provider key '{provider_key}'. "
+                f"Supported providers: {supported_providers}"
+            )
+
+        # Validate and map parameters
+        validated_params = self.client.param_validator.validate_and_map(
+            provider_key, kwargs
+        )
+
         # Initialize provider if not already initialized
         if provider_key not in self.client.providers:
             config = self.client.provider_configs.get(provider_key, {})
@@ -348,33 +380,29 @@ def create(
             )
 
         # Determine if streaming is requested
-        should_stream = False  # Default to batch processing
-        if options and options.stream is not None:
-            should_stream = options.stream
-        elif kwargs.get("stream"):
-            should_stream = kwargs.get("stream", False)
+        should_stream = validated_params.get("stream", False)
 
-        # Delegate the transcription to the correct provider's implementation
+        # Delegate to provider implementation
         try:
             if should_stream:
                 # Check if provider supports output streaming
                 if hasattr(provider.audio, "transcriptions") and hasattr(
                     provider.audio.transcriptions, "create_stream_output"
                 ):
                     return provider.audio.transcriptions.create_stream_output(
-                        model_name, file, options=options, **kwargs
+                        model_name, file, **validated_params
                     )
                 else:
                     raise ValueError(
-                        f"Provider '{provider_key}' does not support output streaming transcription."
+                        f"Provider '{provider_key}' does not support streaming transcription."
                     )
             else:
                 # Non-streaming (batch) transcription
                 if hasattr(provider.audio, "transcriptions") and hasattr(
                     provider.audio.transcriptions, "create"
                 ):
                     return provider.audio.transcriptions.create(
-                        model_name, file, options=options, **kwargs
+                        model_name, file, **validated_params
                     )
                 else:
                     raise ValueError(

diff --git a/aisuite/design-notes/asr-parameter-design-motivation.md b/aisuite/design-notes/asr-parameter-design-motivation.md
@@ -0,0 +1,155 @@
+# ASR - API Parameter Design Philosophy
+
+## Design Goal: Portable Code with Provider Flexibility
+
+The ASR parameter system is designed around a core principle: **developers should write portable code that works across providers, while retaining the ability to use provider-specific features when needed**. This document explains the rationale behind our parameter classification and validation approach.
+
+---
+
+## Mandatory Parameters and Common Mappings
+
+### The Foundation: Minimal Requirements
+
+Every transcription needs just two things:
+- **`model`**: Which model/provider to use
+- **`file`**: What audio to transcribe
+
+By keeping mandatory parameters minimal, we maximize compatibility and reduce the barrier to getting started.
+
+### Common Parameters: Write Once, Run Anywhere
+
+Beyond the basics, there are concepts that exist across providers but use different names or formats. We handle three common parameters - `language`, `prompt`, and `temperature` - that auto-map to each provider's native API:
+
+**Example: Same code, different providers**
+
+```python
+# Works with OpenAI
+result = client.audio.transcriptions.create(
+    model="openai:whisper-1",
+    file="meeting.mp3",
+    language="en",
+    prompt="discussion about API design"
+)
+
+# Exact same code works with Deepgram
+result = client.audio.transcriptions.create(
+    model="deepgram:nova-2",
+    file="meeting.mp3",
+    language="en",
+    prompt="discussion about API design"
+)
+```
+
+Behind the scenes:
+- **`language`** passes through as `language` for both OpenAI and Deepgram, but expands to `language_code: "en-US"` for Google
+- **`prompt`** passes as `prompt` to OpenAI, transforms to `keywords: ["discussion", "about", "API", "design"]` for Deepgram, and becomes `speech_contexts: [{"phrases": ["discussion about API design"]}]` for Google
+- **`temperature`** passes through to OpenAI (which supports it) and is silently ignored by Deepgram and Google (which don't)
+
+**Why auto-mapping?** Developers shouldn't need to remember that Google uses `language_code` while others use `language`, or that Deepgram expects a list of keywords. The framework handles these provider quirks transparently, letting you write portable code.
+
+---
+
+## Provider-Specific Features: Pass-Through for Power Users
+
+Each provider has unique features that give them competitive advantages. We don't limit you to the "lowest common denominator" - if you need provider-specific functionality, it's available:
+
+**Deepgram's advanced features:**
+```python
+result = client.audio.transcriptions.create(
+    model="deepgram:nova-2",
+    file="meeting.mp3",
+    language="en",
+    punctuate=True,        # Deepgram-specific
+    diarize=True,          # Deepgram-specific
+    sentiment=True,        # Deepgram-specific
+    smart_format=True      # Deepgram-specific
+)
+```
+
+**Google's speech contexts:**
+```python
+result = client.audio.transcriptions.create(
+    model="google:latest_long",
+    file="meeting.mp3",
+    language_code="en-US",
+    enable_automatic_punctuation=True,  # Google-specific
+    max_alternatives=3,                  # Google-specific
+    speech_contexts=[{"phrases": ["API", "SDK", "REST"]}]  # Google-specific
+)
+```
+
+These provider-specific parameters pass through directly to the provider's SDK. The framework validates them based on your configured mode (see next section), but doesn't block access to unique features.
+
+---
+
+## Progressive Validation: Safety When You Need It
+
+The validation system supports three modes to match different development stages:
+
+### Development Mode: `"warn"` (Default)
+```python
+client = Client(extra_param_mode="warn")
+```
+Unknown parameters trigger warnings but continue execution. Perfect for exploration and prototyping. You see *"OpenAI doesn't support 'punctuate'"* but your code keeps running.
+
+### Strict Mode: `"strict"`
+```python
+client = Client(extra_param_mode="strict")
+```
+Unknown parameters raise errors immediately. Use in production to catch typos, configuration mistakes, or provider API changes early. Ensures no silent failures.
+
+### Permissive Mode: `"permissive"`
+```python
+client = Client(extra_param_mode="permissive")
+```
+All parameters pass through without validation. Use for beta features, experimental parameters, or when providers add new capabilities faster than framework updates.
+
+**Progressive workflow:**
+1. **Develop** with `warn` - explore freely, see warnings
+2. **Refactor** - fix warnings to make code portable
+3. **Deploy** with `strict` - ensure production safety
+
+---
+
+## Developer Experience Benefits
+
+### 1. Write Portable Code Naturally
+The same common parameter names (`language`, `prompt`, `temperature`) work across providers. Switch from OpenAI to Deepgram by changing one value: the model identifier.
+
+### 2. Progressive Enhancement
+Start with portable common parameters. Add provider-specific features only where you need them. Your core logic remains portable even when using advanced features for specific providers.
+
+### 3. Zero Framework Lock-in
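+Provider-specific parameter names come directly from provider APIs, not framework abstractions. If you need to remove the framework, you already know the native API - those names are identical, and only the few auto-mapped common parameters (such as `prompt`) need translating.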
+
+### 4. Validation That Adapts to You
+Choose your safety level based on context. Strict for production, warn for development, permissive for bleeding-edge features. The framework supports your workflow rather than constraining it.
+
+### 5. No Documentation Friction
+Copy parameters from provider docs directly. No need to learn our abstraction layer or figure out mappings - we handle the common cases, you use native names for everything else.
+
+---
+
+## Alternative Design Considered
+
+We considered creating a unified options object (`TranscriptionOptions`) that explicitly defines all parameters with framework-specific names. We chose pass-through instead because:
+
+1. **Provider APIs evolve faster than frameworks** - New parameters appear frequently. Pass-through lets developers use them immediately (in permissive mode) without waiting for framework updates.
+
+2. **Provider features don't map cleanly** - Deepgram's sentiment analysis, Google's complex speech contexts, OpenAI's timestamp granularities - each is unique. A unified object means either losing functionality or creating complex provider-specific abstractions.
+
+3. **Direct API access reduces friction** - Developers already know their provider's API from official docs. They can use parameter names directly rather than learning another abstraction layer.
+
+The pass-through approach with progressive validation provides the best of both worlds: portability for common cases, power for advanced features, and safety when you need it.
+
+---
+
+## Design Principles Summary
+
+- **Mandatory Minimal**: Only `model` and `file` required
+- **Common Auto-Mapped**: Frequent cross-provider concepts map transparently
+- **Provider-Specific Pass-Through**: Unique features remain accessible
+- **Progressive Validation**: Three modes for different development stages
+- **Zero Abstraction Tax**: Use provider APIs directly with optional safety nets
+
+This design prioritizes developer experience through portability without sacrificing power, validation without blocking experimentation, and simplicity without limiting functionality.