feat(openai): implement Responses API streaming and proactive routing

This commit adds support for the OpenAI Responses API in both streaming and non-streaming modes. It also implements proactive routing for gpt-5 and codex models and cleans up unused 'session' variable warnings across the dashboard source files.
This commit is contained in:
2026-03-06 20:16:43 +00:00
parent 633b69a07b
commit dd54c14ff8
8 changed files with 155 additions and 14 deletions

View File

@@ -42,6 +42,16 @@ pub trait Provider: Send + Sync {
request: UnifiedRequest,
) -> Result<BoxStream<'static, Result<ProviderStreamChunk, AppError>>, AppError>;
/// Process a streaming chat request using provider-specific "responses" style endpoint
/// Default implementation falls back to `chat_completion_stream` for providers
/// that do not implement a dedicated responses endpoint.
async fn chat_responses_stream(
&self,
request: UnifiedRequest,
) -> Result<BoxStream<'static, Result<ProviderStreamChunk, AppError>>, AppError> {
self.chat_completion_stream(request).await
}
/// Estimate token count for a request (for cost calculation).
///
/// Unlike the streaming methods above, this is synchronous and borrows the
/// request rather than consuming it.
///
/// NOTE(review): the `Result` error conditions are implementor-defined and
/// not visible in this view — confirm against concrete provider impls.
fn estimate_tokens(&self, request: &UnifiedRequest) -> Result<u32>;