huggingface
diff --git a/‎.env‎
Lines changed: 12 additions & 2 deletions b/‎.env‎
Lines changed: 12 additions & 2 deletions
diff --git a/‎.github/workflows/slugify.yaml‎
Lines changed: 13 additions & 13 deletions b/‎.github/workflows/slugify.yaml‎
Lines changed: 13 additions & 13 deletions
diff --git a/‎README.md‎
Lines changed: 37 additions & 0 deletions b/‎README.md‎
Lines changed: 37 additions & 0 deletions
diff --git a/‎chart/env/dev.yaml‎
Lines changed: 6 additions & 1 deletion b/‎chart/env/dev.yaml‎
Lines changed: 6 additions & 1 deletion
diff --git a/‎chart/env/prod.yaml‎
Lines changed: 7 additions & 2 deletions b/‎chart/env/prod.yaml‎
Lines changed: 7 additions & 2 deletions
@@ -34,7 +34,7 @@ COUPLE_SESSION_WITH_COOKIE_NAME=
 # when OPEN_ID is configured, users are required to login after the welcome modal
 OPENID_CLIENT_ID=
 OPENID_CLIENT_SECRET=
-OPENID_SCOPES="openid profile inference-api"
+OPENID_SCOPES="openid profile inference-api read-mcp"
 USE_USER_TOKEN=
 AUTOMATIC_LOGIN=# if true authentication is required on all routes
 
@@ -73,10 +73,15 @@ LLM_ROUTER_MAX_ASSISTANT_LENGTH=500
 LLM_ROUTER_MAX_PREV_USER_LENGTH=400
 
 # Enable router multimodal fallback (set to true to allow image inputs via router)
-LLM_ROUTER_ENABLE_MULTIMODAL=false
+LLM_ROUTER_ENABLE_MULTIMODAL=
 # Optional: specific model to use for multimodal requests. If not set, uses first multimodal model
 LLM_ROUTER_MULTIMODAL_MODEL=
 
+# Enable router tool support (set to true to allow tool calling via router)
+LLM_ROUTER_ENABLE_TOOLS=
+# Model (id or name) used for MCP tool calls when LLM_ROUTER_ENABLE_TOOLS=true. If it is missing or misconfigured, the router falls back to Arch routing.
+LLM_ROUTER_TOOLS_MODEL=
+
 # Router UI overrides (client-visible)
 # Public display name for the router entry in the model list. Defaults to "Omni".
 PUBLIC_LLM_ROUTER_DISPLAY_NAME=Omni
@@ -113,6 +118,11 @@ ADMIN_TOKEN=#We recommend leaving this empty, you can get the token from the ter
 LLM_SUMMARIZATION=true # generate conversation titles with LLMs
 
 ALLOW_IFRAME=true # Allow the app to be embedded in an iframe
+
+# Base servers list (JSON array). Example: MCP_SERVERS=[{"name": "Web Search (Exa)", "url": "https://mcp.exa.ai/mcp"}, {"name": "Hugging Face", "url": "https://huggingface.co/mcp"}]
+MCP_SERVERS=
+# When true, forward the logged-in user's Hugging Face access token to the official HF MCP login endpoint when no Authorization header is set on that server entry
+MCP_FORWARD_HF_USER_TOKEN=
 ENABLE_DATA_EXPORT=true
 
 ### Rate limits ### 
 
@@ -4,12 +4,12 @@ on:
   workflow_call:
     inputs:
       value:
-        description: 'Value to slugify'
+        description: "Value to slugify"
         required: true
         type: string
     outputs:
       slug:
-        description: 'Slugified value'
+        description: "Slugified value"
         value: ${{ jobs.generate-slug.outputs.slug }}
 
 jobs:
@@ -22,51 +22,51 @@ jobs:
       - name: Setup Go
         uses: actions/setup-go@v5
         with:
-          go-version: '1.21'
+          go-version: "1.21"
 
       - name: Generate slug
         id: slugify
         run: |
           # Create working directory
           mkdir -p $HOME/slugify
           cd $HOME/slugify
-          
+
           # Create Go script
           cat > main.go << 'EOF'
           package main
-          
+
           import (
               "fmt"
               "os"
               "github.com/gosimple/slug"
           )
-          
+
           func main() {
               if len(os.Args) < 2 {
                   fmt.Println("Usage: slugify <text>")
                   os.Exit(1)
               }
-          
+
               text := os.Args[1]
               slugged := slug.Make(text)
               fmt.Println(slugged)
           }
           EOF
-          
+
           # Initialize module and install dependency
           go mod init slugify
           go mod tidy
           go get github.com/gosimple/slug
-          
+
           # Build
           go build -o slugify main.go
-          
+
           # Generate slug
           VALUE="${{ inputs.value }}"
           echo "Input value: $VALUE"
-          
+
           SLUG=$(./slugify "$VALUE")
           echo "Generated slug: $SLUG"
-          
+
           # Export
-          echo "slug=$SLUG" >> $GITHUB_OUTPUT
+          echo "slug=$SLUG" >> $GITHUB_OUTPUT
@@ -142,6 +142,43 @@ When you select Omni in the UI, Chat UI will:
 - Emit RouterMetadata immediately (route and actual model used) so the UI can display it.
 - Stream from the selected model via your configured `OPENAI_BASE_URL`. On errors, it tries route fallbacks.
 
+Tool and multimodal shortcuts:
+
+- Multimodal: If `LLM_ROUTER_ENABLE_MULTIMODAL=true` and the user sends an image, the router bypasses Arch and uses `LLM_ROUTER_MULTIMODAL_MODEL` (or, if that is not set, the first multimodal model). Route name: `multimodal`.
+- Tools: If `LLM_ROUTER_ENABLE_TOOLS=true` and the user has at least one MCP server enabled, the router bypasses Arch and uses `LLM_ROUTER_TOOLS_MODEL`. If that model is missing or misconfigured, it falls back to Arch routing. Route name: `agentic`.
+
+### MCP Tools (Optional)
+
+Chat UI can call tools exposed by Model Context Protocol (MCP) servers and feed results back to the model using OpenAI function calling. You can preconfigure trusted servers via env, let users add their own, and optionally have the Omni router auto‑select a tools‑capable model.
+
+Configure servers (base list for all users):
+
+```env
+# JSON array of servers: name, url, optional headers
+MCP_SERVERS='[
+  {"name": "Web Search (Exa)", "url": "https://mcp.exa.ai/mcp"},
+  {"name": "Hugging Face MCP Login", "url": "https://huggingface.co/mcp?login"}
+]'
+
+# Forward the signed-in user's Hugging Face token to the official HF MCP login endpoint
+# when no Authorization header is set on that server entry.
+MCP_FORWARD_HF_USER_TOKEN=true
+```
+
+Enable router tool path (Omni):
+
+- Set `LLM_ROUTER_ENABLE_TOOLS=true` and choose a tools‑capable target with `LLM_ROUTER_TOOLS_MODEL=<model id or name>`.
+- The target must support OpenAI tools/function calling. Chat UI surfaces a “tools” badge on models that advertise this; you can also force‑enable it per‑model in settings (see below).
+
+Use tools in the UI:
+
+- Open “MCP Servers” from the top‑right menu or from the `+` menu in the chat input to add servers, toggle them on, and run Health Check. The server card lists available tools.
+- When a model calls a tool, the message shows a compact “tool” block with parameters, a progress bar while running, and the result (or error). Results are also provided back to the model for follow‑up.
+
+Per‑model overrides:
+
+- In Settings → Model, you can toggle “Tool calling (functions)” and “Multimodal input” per model. These overrides apply even if the provider metadata doesn’t advertise the capability.
+
 ## Building
 
 To create a production version of your app:
 
@@ -38,8 +38,9 @@ ingressInternal:
 envVars:
   TEST: "test"
   COUPLE_SESSION_WITH_COOKIE_NAME: "token"
-  OPENID_SCOPES: "openid profile inference-api"
+  OPENID_SCOPES: "openid profile inference-api read-mcp"
   USE_USER_TOKEN: "true"
+  MCP_FORWARD_HF_USER_TOKEN: "true"
   AUTOMATIC_LOGIN: "false"
 
   ADDRESS_HEADER: "X-Forwarded-For"
@@ -67,6 +68,10 @@ envVars:
   LLM_ROUTER_ARCH_TIMEOUT_MS: "10000"
   LLM_ROUTER_ENABLE_MULTIMODAL: "true"
   LLM_ROUTER_MULTIMODAL_MODEL: "Qwen/Qwen3-VL-235B-A22B-Thinking"
+  LLM_ROUTER_ENABLE_TOOLS: "true"
+  LLM_ROUTER_TOOLS_MODEL: "moonshotai/Kimi-K2-Instruct-0905"
+  MCP_SERVERS: >
+    [{"name": "Web Search (Exa)", "url": "https://mcp.exa.ai/mcp"}, {"name": "Hugging Face", "url": "https://huggingface.co/mcp?login"}]
   PUBLIC_LLM_ROUTER_DISPLAY_NAME: "Omni"
   PUBLIC_LLM_ROUTER_LOGO_URL: "https://cdn-uploads.huggingface.co/production/uploads/5f17f0a0925b9863e28ad517/C5V0v1xZXv6M7FXsdJH9b.png"
   PUBLIC_LLM_ROUTER_ALIAS_ID: "omni"
 
@@ -48,8 +48,9 @@ ingressInternal:
 
 envVars:
   COUPLE_SESSION_WITH_COOKIE_NAME: "token"
-  OPENID_SCOPES: "openid profile inference-api"
+  OPENID_SCOPES: "openid profile inference-api read-mcp"
   USE_USER_TOKEN: "true"
+  MCP_FORWARD_HF_USER_TOKEN: "true"
   AUTOMATIC_LOGIN: "false"
 
   ADDRESS_HEADER: "X-Forwarded-For"
@@ -76,7 +77,11 @@ envVars:
   LLM_ROUTER_OTHER_ROUTE: "casual_conversation"
   LLM_ROUTER_ARCH_TIMEOUT_MS: "10000"
   LLM_ROUTER_ENABLE_MULTIMODAL: "true"
-  LLM_ROUTER_MULTIMODAL_MODEL: "Qwen/Qwen3-VL-235B-A22B-Thinking"
+  LLM_ROUTER_MULTIMODAL_MODEL: "Qwen/Qwen3-VL-30B-A3B-Instruct"
+  LLM_ROUTER_ENABLE_TOOLS: "true"
+  LLM_ROUTER_TOOLS_MODEL: "moonshotai/Kimi-K2-Instruct-0905"
+  MCP_SERVERS: >
+    [{"name": "Web Search (Exa)", "url": "https://mcp.exa.ai/mcp"}, {"name": "Hugging Face", "url": "https://huggingface.co/mcp?login"}]
   PUBLIC_LLM_ROUTER_DISPLAY_NAME: "Omni"
   PUBLIC_LLM_ROUTER_LOGO_URL: "https://cdn-uploads.huggingface.co/production/uploads/5f17f0a0925b9863e28ad517/C5V0v1xZXv6M7FXsdJH9b.png"
   PUBLIC_LLM_ROUTER_ALIAS_ID: "omni"