feat(server): add /v1/models endpoint for OpenAI-compatible model discovery

Open WebUI and other OpenAI-compatible clients call GET /v1/models to discover available models. Lists all models from enabled providers via the model registry, respects disabled models, and handles Ollama models from TOML config.
2026-03-02 14:06:31 -05:00
parent e38f012b23
commit 88aae389d2
1 changed files with 56 additions and 1 deletions
@@ -3,7 +3,7 @@ use axum::{
    extract::State,
    response::IntoResponse,
    response::sse::{Event, Sse},
-    routing::post,
+    routing::{get, post},
 };
 use futures::stream::StreamExt;
 use std::sync::Arc;
@@ -24,6 +24,7 @@ use crate::{
 pub fn router(state: AppState) -> Router {
    Router::new()
        .route("/v1/chat/completions", post(chat_completions))
+        .route("/v1/models", get(list_models))
        .layer(axum::middleware::from_fn_with_state(
            state.clone(),
            rate_limiting::middleware::rate_limit_middleware,
@@ -31,6 +32,60 @@ pub fn router(state: AppState) -> Router {
        .with_state(state)
 }

+/// GET /v1/models — OpenAI-compatible model listing.
+/// Returns all models from enabled providers so clients like Open WebUI can
+/// discover which models are available through the proxy.
+async fn list_models(
+    State(state): State<AppState>,
+    _auth: AuthenticatedClient,
+) -> Result<Json<serde_json::Value>, AppError> {
+    let registry = &state.model_registry;
+    let providers = state.provider_manager.get_all_providers().await;
+
+    let mut models = Vec::new();
+
+    for provider in &providers {
+        let provider_name = provider.name();
+
+        // Find this provider's models in the registry
+        if let Some(provider_info) = registry.providers.get(provider_name) {
+            for (model_id, meta) in &provider_info.models {
+                // Skip disabled models via the config cache
+                if let Some(cfg) = state.model_config_cache.get(model_id).await {
+                    if !cfg.enabled {
+                        continue;
+                    }
+                }
+
+                models.push(serde_json::json!({
+                    "id": model_id,
+                    "object": "model",
+                    "created": 0,
+                    "owned_by": provider_name,
+                    "name": meta.name,
+                }));
+            }
+        }
+
+        // For Ollama, models are configured in the TOML, not the registry
+        if provider_name == "ollama" {
+            for model_id in &state.config.providers.ollama.models {
+                models.push(serde_json::json!({
+                    "id": model_id,
+                    "object": "model",
+                    "created": 0,
+                    "owned_by": "ollama",
+                }));
+            }
+        }
+    }
+
+    Ok(Json(serde_json::json!({
+        "object": "list",
+        "data": models
+    })))
+}
+
 async fn get_model_cost(
    model: &str,
    prompt_tokens: u32,