From dc0692f4eb71a4f20eff77e44705da6f5ae51c30 Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Wed, 27 Aug 2025 19:17:41 +0300
Subject: [PATCH 1/9] uploading images

---
 gradio/data_classes.py     |   1 +
 gradio/routes.py           |  61 ++++++++++++++--
 js/vibeeditor/Index.svelte | 138 +++++++++++++++++++++++++++----------
 3 files changed, 155 insertions(+), 45 deletions(-)

diff --git a/gradio/data_classes.py b/gradio/data_classes.py
index 3e167baeb1..e17e087b85 100644
--- a/gradio/data_classes.py
+++ b/gradio/data_classes.py
@@ -128,6 +128,7 @@ class ResetBody(BaseModel):
 
 class VibeEditBody(BaseModel):
     prompt: str
+    files: list[FileData] = []
 
 
 class VibeCodeBody(BaseModel):
diff --git a/gradio/routes.py b/gradio/routes.py
index 4a59ee9f01..8424db6a19 100644
--- a/gradio/routes.py
+++ b/gradio/routes.py
@@ -1969,7 +1969,54 @@ async def vibe_edit(body: VibeEditBody):
             client = InferenceClient()
 
             content = ""
-            prompt = f"""
+            system_prompt = load_system_prompt()
+            
+
+            has_images = len(body.files) > 0 
+            
+            if has_images:
+                # Use ERNIE model for image processing
+                model = "baidu/ERNIE-4.5-VL-424B-A47B-Base-PT"
+                
+                image_messages = []
+                for file in body.files:
+                    if file.mime_type and "image" in file.mime_type:
+                        import base64
+                        with open(file.path, "rb") as img_file:
+                            img_data = base64.b64encode(img_file.read()).decode('utf-8')
+                            image_messages.append({
+                                "type": "image_url",
+                                "image_url": {
+                                    "url": f"data:{file.mime_type};base64,{img_data}"
+                                }
+                            })
+                
+                prompt = f"""
+You are a code generator for Gradio apps. Given the following existing code, prompt, and images, return the full new code.
+Existing code:
+```python
+{original_code}
+```
+
+Prompt:
+{body.prompt}
+
+Please analyze the provided images and generate code based on the visual content and the text prompt.
+"""
+                
+                messages = [
+                    {"role": "system", "content": system_prompt},
+                    {
+                        "role": "user", 
+                        "content": [
+                            {"type": "text", "text": prompt}
+                        ] + image_messages
+                    }
+                ]
+            else:
+                # Use GPT-OSS for text-only prompts
+                model = "openai/gpt-oss-120b"
+                prompt = f"""
 You are a code generator for Gradio apps. Given the following existing code and prompt, return the full new code.
 Existing code:
 ```python
@@ -1978,14 +2025,14 @@ async def vibe_edit(body: VibeEditBody):
 
 Prompt:
 {body.prompt}"""
-            system_prompt = load_system_prompt()
+                messages = [
+                    {"role": "system", "content": system_prompt},
+                    {"role": "user", "content": prompt},
+                ]
             content = (
                 client.chat_completion(
-                    model="openai/gpt-oss-120b",
-                    messages=[
-                        {"role": "system", "content": system_prompt},
-                        {"role": "user", "content": prompt},
-                    ],
+                    model=model,
+                    messages=messages,
                     max_tokens=1000,
                 )
                 .choices[0]
diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index 6693864be3..2d9d9bbab6 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -2,10 +2,12 @@
 	import { Client } from "@gradio/client";
 	import { onMount } from "svelte";
 	import { BaseCode } from "@gradio/code";
+	import { BaseMultimodalTextbox } from "@gradio/multimodaltextbox";
+	import type { FileData } from "@gradio/client";
 
 	export let app: Client;
 	export let root: string;
-	let prompt = "";
+	let prompt: { text: string; files: FileData[] } = { text: "", files: [] };
 	let editorWidth = 350;
 	let isResizing = false;
 	let editorElement: HTMLDivElement;
@@ -13,9 +15,11 @@
 
 	let codeValue = "";
 	let diffStats: { lines_added: number; lines_removed: number } | null = null;
+	let hasImages = false;
 
 	interface Message {
 		text: string;
+		files: FileData[];
 		isBot: boolean;
 		isPending?: boolean;
 		hash?: string;
@@ -24,25 +28,35 @@
 	let message_history: Message[] = [];
 
 	const submit = (): void => {
-		if (prompt.trim() === "") return;
+		if (prompt.text.trim() === "" && prompt.files.length === 0) return;
 
 		// Clear diff stats when submitting new prompt
 		diffStats = null;
 
 		const userMessageIndex = message_history.length;
-		message_history = [...message_history, { text: prompt, isBot: false }];
+		message_history = [
+			...message_history,
+			{ text: prompt.text, files: prompt.files, isBot: false }
+		];
 
 		const botMessageIndex = message_history.length;
 		message_history = [
 			...message_history,
-			{ text: "Working...", isBot: true, isPending: true }
+			{ text: "Working...", files: [], isBot: true, isPending: true }
 		];
 
-		const userPrompt = prompt;
-		prompt = "";
+		const userPrompt = prompt.text;
+		const userFiles = prompt.files;
+		prompt = { text: "", files: [] };
+
+		// Track whether images were attached; this only switches the "Powered by" label (the server chooses the model)
+		hasImages = userFiles.some(
+			(file) => file.mime_type && file.mime_type.includes("image")
+		);
 
 		const post = app.post_data(`${root}/gradio_api/vibe-edit/`, {
-			prompt: userPrompt
+			prompt: userPrompt,
+			files: userFiles
 		});
 		post
 			.then(([response, status_code]) => {
@@ -70,6 +84,7 @@
 					index === botMessageIndex
 						? {
 								text: responseData.reasoning ? responseData.reasoning : "Done.",
+								files: [],
 								isBot: true,
 								isPending: false
 							}
@@ -79,7 +94,12 @@
 			.catch((error) => {
 				message_history = message_history.map((msg, index) =>
 					index === botMessageIndex
-						? { text: "Error occurred.", isBot: true, isPending: false }
+						? {
+								text: "Error occurred.",
+								files: [],
+								isBot: true,
+								isPending: false
+							}
 						: msg
 				);
 			});
@@ -96,7 +116,7 @@
 			diffStats = null;
 
 			const messageToUndo = message_history[messageIndex];
-			prompt = messageToUndo.text;
+			prompt = { text: messageToUndo.text, files: messageToUndo.files };
 
 			message_history = message_history.slice(0, messageIndex);
 		} catch (error) {
@@ -222,7 +242,22 @@
 						class:user-message={!message.isBot}
 					>
 						<div class="message-content">
-							<span class="message-text">{message.text}</span>
+							<div class="message-text">
+								<span>{message.text}</span>
+								{#if message.files && message.files.length > 0}
+									<div class="message-files">
+										{#each message.files as file}
+											{#if file.mime_type && file.mime_type.includes("image")}
+												<img
+													src={file.url}
+													alt="Uploaded image"
+													class="message-image"
+												/>
+											{/if}
+										{/each}
+									</div>
+								{/if}
+							</div>
 							{#if !message.isBot && message.hash && !message.isPending}
 								<button
 									class="undo-button"
@@ -263,22 +298,36 @@
 	</div>
 
 	<div class="input-section">
-		<div class="powered-by">Powered by: <code>gpt-oss</code></div>
-		<textarea
-			on:keydown={(e) => {
-				if (e.key === "Enter" && !e.shiftKey) {
-					e.preventDefault();
-					submit();
-				}
-			}}
+		<div class="powered-by">
+			Powered by: <a
+				style="text-decoration: underline;"
+				href={hasImages
+					? "https://hf.co/baidu/ERNIE-4.5-VL-424B-A47B-Base-PT"
+					: "https://hf.co/openai/gpt-oss-120b"}
+				target="_blank">{hasImages ? "ERNIE-4.5-VL" : "gpt-oss"}</a
+			>
+		</div>
+		<BaseMultimodalTextbox
 			bind:value={prompt}
 			placeholder="What can I add or change?"
-			class="prompt-input"
+			lines={1}
+			max_lines={10}
+			file_types={["image"]}
+			file_count="multiple"
+			sources={["upload"]}
+			submit_btn={false}
+			show_label={false}
+			label=""
+			i18n={(value) => value || ""}
+			waveform_settings={{}}
+			{root}
+			upload={(...args) => app.upload(...args)}
+			stream_handler={(...args) => app.stream(...args)}
 		/>
 		<button
 			on:click={submit}
 			class="submit-button"
-			disabled={prompt.trim() === ""}
+			disabled={prompt.text.trim() === "" && prompt.files.length === 0}
 		>
 			Send
 		</button>
@@ -433,6 +482,33 @@
 		flex: 1;
 	}
 
+	.message-files {
+		margin-top: 8px;
+		display: flex;
+		flex-direction: column;
+		gap: 4px;
+	}
+
+	.message-image {
+		max-width: 200px;
+		max-height: 150px;
+		border-radius: var(--radius-sm);
+		object-fit: cover;
+	}
+
+	.file-item {
+		display: flex;
+		align-items: center;
+		gap: 4px;
+		font-size: 12px;
+		color: var(--body-text-color-subdued);
+	}
+
+	.file-item :global(svg) {
+		width: 16px;
+		height: 16px;
+	}
+
 	.undo-button {
 		background: var(--button-secondary-background-fill);
 		color: var(--button-secondary-text-color);
@@ -466,24 +542,6 @@
 		gap: 12px;
 	}
 
-	.prompt-input {
-		width: 100%;
-		min-height: 80px;
-		background: var(--input-background-fill);
-		border: 1px solid var(--border-color-primary);
-		border-radius: var(--input-radius);
-		padding: 12px;
-		resize: vertical;
-		outline: none;
-		font-family: inherit;
-		font-size: 14px;
-		color: var(--body-text-color);
-	}
-
-	.prompt-input:focus {
-		border-color: var(--color-accent);
-	}
-
 	.submit-button {
 		background: var(--button-primary-background-fill);
 		color: var(--button-primary-text-color);
@@ -526,4 +584,8 @@
 	.diff-stats .removed {
 		color: #ef4444;
 	}
+
+	:global(.upload-button) {
+		margin-right: 0.5rem !important;
+	}
 </style>

From eeae6959faf396ba118efb7c1754fc6d7d44182c Mon Sep 17 00:00:00 2001
From: gradio-pr-bot <gradio-pr-bot@users.noreply.github.com>
Date: Wed, 27 Aug 2025 16:23:50 +0000
Subject: [PATCH 2/9] add changeset

---
 .changeset/soft-baths-chew.md | 6 ++++++
 1 file changed, 6 insertions(+)
 create mode 100644 .changeset/soft-baths-chew.md

diff --git a/.changeset/soft-baths-chew.md b/.changeset/soft-baths-chew.md
new file mode 100644
index 0000000000..b92b4fba15
--- /dev/null
+++ b/.changeset/soft-baths-chew.md
@@ -0,0 +1,6 @@
+---
+"@gradio/vibeeditor": minor
+"gradio": minor
+---
+
+feat:Adding images to vibe editor 

From 22a4fdc112f1b20944d5970c82c9ca32d01f71c5 Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Thu, 28 Aug 2025 13:26:37 +0300
Subject: [PATCH 3/9] lint

---
 gradio/routes.py           | 14 +++++++-------
 js/vibeeditor/Index.svelte | 21 ++++-----------------
 2 files changed, 11 insertions(+), 24 deletions(-)

diff --git a/gradio/routes.py b/gradio/routes.py
index 8424db6a19..8c8e459628 100644
--- a/gradio/routes.py
+++ b/gradio/routes.py
@@ -1970,14 +1970,14 @@ async def vibe_edit(body: VibeEditBody):
 
             content = ""
             system_prompt = load_system_prompt()
-            
 
-            has_images = len(body.files) > 0 
-            
+
+            has_images = len(body.files) > 0
+
             if has_images:
                 # Use ERNIE model for image processing
                 model = "baidu/ERNIE-4.5-VL-424B-A47B-Base-PT"
-                
+
                 image_messages = []
                 for file in body.files:
                     if file.mime_type and "image" in file.mime_type:
@@ -1990,7 +1990,7 @@ async def vibe_edit(body: VibeEditBody):
                                     "url": f"data:{file.mime_type};base64,{img_data}"
                                 }
                             })
-                
+
                 prompt = f"""
 You are a code generator for Gradio apps. Given the following existing code, prompt, and images, return the full new code.
 Existing code:
@@ -2003,11 +2003,11 @@ async def vibe_edit(body: VibeEditBody):
 
 Please analyze the provided images and generate code based on the visual content and the text prompt.
 """
-                
+
                 messages = [
                     {"role": "system", "content": system_prompt},
                     {
-                        "role": "user", 
+                        "role": "user",
                         "content": [
                             {"type": "text", "text": prompt}
                         ] + image_messages
diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index 2d9d9bbab6..1436a64996 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -248,11 +248,10 @@
 									<div class="message-files">
 										{#each message.files as file}
 											{#if file.mime_type && file.mime_type.includes("image")}
-												<img
-													src={file.url}
-													alt="Uploaded image"
-													class="message-image"
-												/>
+                <img
+                  src={file.url}
+                  class="message-image"
+                />
 											{/if}
 										{/each}
 									</div>
@@ -496,18 +495,6 @@
 		object-fit: cover;
 	}
 
-	.file-item {
-		display: flex;
-		align-items: center;
-		gap: 4px;
-		font-size: 12px;
-		color: var(--body-text-color-subdued);
-	}
-
-	.file-item :global(svg) {
-		width: 16px;
-		height: 16px;
-	}
 
 	.undo-button {
 		background: var(--button-secondary-background-fill);

From 446bc655f3b79d1ce36f39fb05657cb59235ae64 Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Thu, 28 Aug 2025 13:44:03 +0300
Subject: [PATCH 4/9] formatting

---
 js/vibeeditor/Index.svelte | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index 1436a64996..d9356fe008 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -248,10 +248,7 @@
 									<div class="message-files">
 										{#each message.files as file}
 											{#if file.mime_type && file.mime_type.includes("image")}
-                <img
-                  src={file.url}
-                  class="message-image"
-                />
+												<img src={file.url} class="message-image" />
 											{/if}
 										{/each}
 									</div>
@@ -495,7 +492,6 @@
 		object-fit: cover;
 	}
 
-
 	.undo-button {
 		background: var(--button-secondary-background-fill);
 		color: var(--button-secondary-text-color);

From 52f34b4fe8b0da9dd44388278904d3c7d45e5959 Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Thu, 28 Aug 2025 15:00:35 +0300
Subject: [PATCH 5/9] format

---
 js/vibeeditor/Index.svelte | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index d9356fe008..a58ed1c2d5 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -248,7 +248,7 @@
 									<div class="message-files">
 										{#each message.files as file}
 											{#if file.mime_type && file.mime_type.includes("image")}
-												<img src={file.url} class="message-image" />
+												<img src={file.url} alt="Uploaded image" class="message-image" />
 											{/if}
 										{/each}
 									</div>

From 9b59f565e49ef5cf1b06aba96f68e6ef9efac064 Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Thu, 28 Aug 2025 15:05:21 +0300
Subject: [PATCH 6/9] formatting

---
 js/vibeeditor/Index.svelte | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index a58ed1c2d5..d9ac1b3435 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -248,7 +248,11 @@
 									<div class="message-files">
 										{#each message.files as file}
 											{#if file.mime_type && file.mime_type.includes("image")}
-												<img src={file.url} alt="Uploaded image" class="message-image" />
+												<img
+													src={file.url}
+													alt="Uploaded image"
+													class="message-image"
+												/>
 											{/if}
 										{/each}
 									</div>

From 409b6381fbf530fc89f735cdae88e8bd89d1c9af Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Mon, 15 Sep 2025 15:08:20 +0400
Subject: [PATCH 7/9] fix linting/formatting

---
 gradio/routes.py           | 22 +++++++++++-----------
 js/vibeeditor/Index.svelte |  2 +-
 2 files changed, 12 insertions(+), 12 deletions(-)

diff --git a/gradio/routes.py b/gradio/routes.py
index 6f001b1e6f..87655cee44 100644
--- a/gradio/routes.py
+++ b/gradio/routes.py
@@ -1994,7 +1994,6 @@ async def vibe_edit(body: VibeEditBody):
             content = ""
             system_prompt = load_system_prompt()
 
-
             has_images = len(body.files) > 0
 
             if has_images:
@@ -2005,14 +2004,17 @@ async def vibe_edit(body: VibeEditBody):
                 for file in body.files:
                     if file.mime_type and "image" in file.mime_type:
                         import base64
+
                         with open(file.path, "rb") as img_file:
-                            img_data = base64.b64encode(img_file.read()).decode('utf-8')
-                            image_messages.append({
-                                "type": "image_url",
-                                "image_url": {
-                                    "url": f"data:{file.mime_type};base64,{img_data}"
+                            img_data = base64.b64encode(img_file.read()).decode("utf-8")
+                            image_messages.append(
+                                {
+                                    "type": "image_url",
+                                    "image_url": {
+                                        "url": f"data:{file.mime_type};base64,{img_data}"
+                                    },
                                 }
-                            })
+                            )
 
                 prompt = f"""
 You are a code generator for Gradio apps. Given the following existing code, prompt, and images, return the full new code.
@@ -2031,10 +2033,8 @@ async def vibe_edit(body: VibeEditBody):
                     {"role": "system", "content": system_prompt},
                     {
                         "role": "user",
-                        "content": [
-                            {"type": "text", "text": prompt}
-                        ] + image_messages
-                    }
+                        "content": [{"type": "text", "text": prompt}] + image_messages,
+                    },
                 ]
             else:
                 # Use GPT-OSS for text-only prompts
diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index d9ac1b3435..0c6a1a63f8 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -250,7 +250,7 @@
 											{#if file.mime_type && file.mime_type.includes("image")}
 												<img
 													src={file.url}
-													alt="Uploaded image"
+													alt=""
 													class="message-image"
 												/>
 											{/if}

From 9cc7aee50ce74fafc94c51221127dd14dc479e89 Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Mon, 15 Sep 2025 15:14:27 +0400
Subject: [PATCH 8/9] formatting for the 100th time

---
 js/vibeeditor/Index.svelte | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index 0c6a1a63f8..bfb3b69795 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -248,11 +248,7 @@
 									<div class="message-files">
 										{#each message.files as file}
 											{#if file.mime_type && file.mime_type.includes("image")}
-												<img
-													src={file.url}
-													alt=""
-													class="message-image"
-												/>
+												<img src={file.url} alt="" class="message-image" />
 											{/if}
 										{/each}
 									</div>

From a0bfa6730508ac2a4b09fe223e34548b3f30e17e Mon Sep 17 00:00:00 2001
From: aliabd <ali.si3luwa@gmail.com>
Date: Mon, 15 Sep 2025 17:42:59 +0400
Subject: [PATCH 9/9] switch to GLM-4.5V

---
 gradio/routes.py           | 6 +++---
 js/vibeeditor/Index.svelte | 4 ++--
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/gradio/routes.py b/gradio/routes.py
index 87655cee44..4d13f7ecdd 100644
--- a/gradio/routes.py
+++ b/gradio/routes.py
@@ -1997,8 +1997,8 @@ async def vibe_edit(body: VibeEditBody):
             has_images = len(body.files) > 0
 
             if has_images:
-                # Use ERNIE model for image processing
-                model = "baidu/ERNIE-4.5-VL-424B-A47B-Base-PT"
+                # Use GLM-4.5V model for image processing
+                model = "zai-org/GLM-4.5V"
 
                 image_messages = []
                 for file in body.files:
@@ -2056,7 +2056,7 @@ async def vibe_edit(body: VibeEditBody):
                 client.chat_completion(
                     model=model,
                     messages=messages,
-                    max_tokens=1000,
+                    max_tokens=3000,
                 )
                 .choices[0]
                 .message.content
diff --git a/js/vibeeditor/Index.svelte b/js/vibeeditor/Index.svelte
index bfb3b69795..807cc02161 100644
--- a/js/vibeeditor/Index.svelte
+++ b/js/vibeeditor/Index.svelte
@@ -298,9 +298,9 @@
 			Powered by: <a
 				style="text-decoration: underline;"
 				href={hasImages
-					? "https://hf.co/baidu/ERNIE-4.5-VL-424B-A47B-Base-PT"
+					? "https://hf.co/zai-org/GLM-4.5V"
 					: "https://hf.co/openai/gpt-oss-120b"}
-				target="_blank">{hasImages ? "ERNIE-4.5-VL" : "gpt-oss"}</a
+				target="_blank">{hasImages ? "GLM-4.5V" : "gpt-oss"}</a
 			>
 		</div>
 		<BaseMultimodalTextbox