RooCodeInc
diff --git a/‎packages/types/src/experiment.ts‎
Lines changed: 7 additions & 1 deletion b/‎packages/types/src/experiment.ts‎
Lines changed: 7 additions & 1 deletion
diff --git a/‎packages/types/src/provider-settings.ts‎
Lines changed: 8 additions & 0 deletions b/‎packages/types/src/provider-settings.ts‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎packages/types/src/tool.ts‎
Lines changed: 1 addition & 0 deletions b/‎packages/types/src/tool.ts‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎src/core/assistant-message/presentAssistantMessage.ts‎
Lines changed: 6 additions & 0 deletions b/‎src/core/assistant-message/presentAssistantMessage.ts‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎src/core/prompts/tools/generate-image.ts‎
Lines changed: 20 additions & 0 deletions b/‎src/core/prompts/tools/generate-image.ts‎
Lines changed: 20 additions & 0 deletions
diff --git a/‎src/core/prompts/tools/index.ts‎
Lines changed: 8 additions & 0 deletions b/‎src/core/prompts/tools/index.ts‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎src/core/tools/generateImageTool.ts‎
Lines changed: 264 additions & 0 deletions b/‎src/core/tools/generateImageTool.ts‎
Lines changed: 264 additions & 0 deletions
@@ -6,7 +6,12 @@ import type { Keys, Equals, AssertEqual } from "./type-fu.js"
  * ExperimentId
  */
 
-export const experimentIds = ["powerSteering", "multiFileApplyDiff", "preventFocusDisruption"] as const
+export const experimentIds = [
+	"powerSteering",
+	"multiFileApplyDiff",
+	"preventFocusDisruption",
+	"imageGeneration",
+] as const
 
 export const experimentIdsSchema = z.enum(experimentIds)
 
@@ -20,6 +25,7 @@ export const experimentsSchema = z.object({
 	powerSteering: z.boolean().optional(),
 	multiFileApplyDiff: z.boolean().optional(),
 	preventFocusDisruption: z.boolean().optional(),
+	imageGeneration: z.boolean().optional(),
 })
 
 export type Experiments = z.infer<typeof experimentsSchema>
 
@@ -112,6 +112,14 @@ const baseProviderSettingsSchema = z.object({
 
 	// Model verbosity.
 	verbosity: verbosityLevelsSchema.optional(),
+
+	// Image generation settings (experimental)
+	imageGenerationSettings: z
+		.object({
+			openRouterApiKey: z.string().optional(),
+			selectedModel: z.string().optional(),
+		})
+		.optional(),
 })
 
 // Several of the providers share common model config properties.
 
@@ -34,6 +34,7 @@ export const toolNames = [
 	"fetch_instructions",
 	"codebase_search",
 	"update_todo_list",
+	"generate_image",
 ] as const
 
 export const toolNamesSchema = z.enum(toolNames)
 
@@ -28,6 +28,7 @@ import { attemptCompletionTool } from "../tools/attemptCompletionTool"
 import { newTaskTool } from "../tools/newTaskTool"
 
 import { updateTodoListTool } from "../tools/updateTodoListTool"
+import { generateImageTool } from "../tools/generateImageTool"
 
 import { formatResponse } from "../prompts/responses"
 import { validateToolUse } from "../tools/validateToolUse"
@@ -221,6 +222,8 @@ export async function presentAssistantMessage(cline: Task) {
 						const modeName = getModeBySlug(mode, customModes)?.name ?? mode
 						return `[${block.name} in ${modeName} mode: '${message}']`
 					}
+					case "generate_image":
+						return `[${block.name} for '${block.params.path}']`
 				}
 			}
 
@@ -546,6 +549,9 @@ export async function presentAssistantMessage(cline: Task) {
 						askFinishSubTaskApproval,
 					)
 					break
+				case "generate_image":
+					await generateImageTool(cline, block, askApproval, handleError, pushToolResult, removeClosingTag)
+					break
 			}
 
 			break
 
@@ -0,0 +1,20 @@
+import { ToolArgs } from "./types"
+
+/**
+ * Builds the system-prompt section that documents the `generate_image` tool.
+ *
+ * @param args - Tool description arguments; only `cwd` is read, to tell the
+ * model which directory relative paths are resolved against.
+ * @returns The tool description: purpose, parameters, usage template and one example.
+ */
+export function getGenerateImageDescription(args: ToolArgs): string {
+	const workspaceDir = args.cwd
+
+	// One entry per output line; the empty entry separates usage from the example.
+	const lines = [
+		"## generate_image",
+		"Description: Request to generate an image using AI models through OpenRouter API. This tool creates images from text prompts and saves them to the specified path. Requires OpenRouter API key to be configured in experimental settings.",
+		"Parameters:",
+		"- prompt: (required) The text prompt describing the image to generate",
+		`- path: (required) The file path where the generated image should be saved (relative to the current workspace directory ${workspaceDir}). The tool will automatically add the appropriate image extension if not provided.`,
+		"Usage:",
+		"<generate_image>",
+		"<prompt>Your image description here</prompt>",
+		"<path>path/to/save/image.png</path>",
+		"</generate_image>",
+		"",
+		"Example: Requesting to generate a sunset image",
+		"<generate_image>",
+		"<prompt>A beautiful sunset over mountains with vibrant orange and purple colors</prompt>",
+		"<path>images/sunset.png</path>",
+		"</generate_image>",
+	]
+
+	return lines.join("\n")
+}
@@ -25,6 +25,7 @@ import { getSwitchModeDescription } from "./switch-mode"
 import { getNewTaskDescription } from "./new-task"
 import { getCodebaseSearchDescription } from "./codebase-search"
 import { getUpdateTodoListDescription } from "./update-todo-list"
+import { getGenerateImageDescription } from "./generate-image"
 import { CodeIndexManager } from "../../../services/code-index/manager"
 
 // Map of tool names to their description functions
@@ -56,6 +57,7 @@ const toolDescriptionMap: Record<string, (args: ToolArgs) => string | undefined>
 	apply_diff: (args) =>
 		args.diffStrategy ? args.diffStrategy.getToolDescription({ cwd: args.cwd, toolOptions: args.toolOptions }) : "",
 	update_todo_list: (args) => getUpdateTodoListDescription(args),
+	generate_image: (args) => getGenerateImageDescription(args),
 }
 
 export function getToolDescriptionsForMode(
@@ -129,6 +131,11 @@ export function getToolDescriptionsForMode(
 		tools.delete("update_todo_list")
 	}
 
+	// Conditionally exclude generate_image if experiment is not enabled
+	if (!experiments?.imageGeneration) {
+		tools.delete("generate_image")
+	}
+
 	// Map tool descriptions for allowed tools
 	const descriptions = Array.from(tools).map((toolName) => {
 		const descriptionFn = toolDescriptionMap[toolName]
@@ -164,4 +171,5 @@ export {
 	getInsertContentDescription,
 	getSearchAndReplaceDescription,
 	getCodebaseSearchDescription,
+	getGenerateImageDescription,
 }
@@ -0,0 +1,264 @@
+import path from "path"
+import fs from "fs/promises"
+import * as vscode from "vscode"
+import { Task } from "../task/Task"
+import { formatResponse } from "../prompts/responses"
+import { ToolUse, AskApproval, HandleError, PushToolResult, RemoveClosingTag } from "../../shared/tools"
+import { fileExistsAtPath } from "../../utils/fs"
+import { getReadablePath } from "../../utils/path"
+import { isPathOutsideWorkspace } from "../../utils/pathUtils"
+import { EXPERIMENT_IDS, experiments } from "../../shared/experiments"
+import { safeWriteJson } from "../../utils/safeWriteJson"
+
+/**
+ * Image-capable model ids that can be requested through OpenRouter.
+ * Hardcoded for now; the first entry is the default when no model is selected.
+ * Add more models as they become available.
+ */
+const IMAGE_GENERATION_MODELS: string[] = ["google/gemini-2.5-flash-image-preview"]
+
+/** One image attachment on a returned message; `image_url.url` is later parsed as a base64 data URL. */
+interface GeneratedImagePart {
+	type?: string
+	image_url?: {
+		url?: string
+	}
+}
+
+/** One completion choice; generated images are read from `message.images`. */
+interface ImageGenerationChoice {
+	message?: {
+		content?: string
+		images?: GeneratedImagePart[]
+	}
+}
+
+/** Error object that may be present in the response body. */
+interface ImageGenerationError {
+	message?: string
+	type?: string
+	code?: string
+}
+
+/**
+ * Subset of the chat-completions response body this tool reads.
+ * Every field is optional because the payload is consumed without validation.
+ */
+interface ImageGenerationResponse {
+	choices?: ImageGenerationChoice[]
+	error?: ImageGenerationError
+}
+
+/**
+ * Executes the `generate_image` tool: validates the request, asks the user for
+ * approval, requests an image from the OpenRouter chat-completions endpoint and
+ * writes the decoded image to disk relative to the task's working directory.
+ *
+ * Validation failures and API failures are reported through `pushToolResult`
+ * (and, for most of them, `cline.say`). Exceptions raised while asking for
+ * approval, calling the API or saving the file are forwarded to `handleError`.
+ *
+ * @param cline - Task that issued the tool call; supplies state, cwd, ignore/protect controllers and messaging.
+ * @param block - Parsed tool use carrying the `prompt` and `path` params and the `partial` flag.
+ * @param askApproval - Asks the user to approve the generation; a falsy result aborts silently.
+ * @param handleError - Receives any exception thrown during approval, generation or saving.
+ * @param pushToolResult - Receives the tool result (success or error text) for the model.
+ * @param removeClosingTag - Cleans a possibly incomplete closing tag from a param value.
+ */
+export async function generateImageTool(
+	cline: Task,
+	block: ToolUse,
+	askApproval: AskApproval,
+	handleError: HandleError,
+	pushToolResult: PushToolResult,
+	removeClosingTag: RemoveClosingTag,
+) {
+	// This tool renders nothing while its block is still streaming. Returning here
+	// keeps the validations below from emitting the same error once per chunk.
+	if (block.partial) {
+		return
+	}
+
+	const prompt: string | undefined = block.params.prompt
+	const relPath: string | undefined = block.params.path
+
+	// Check if the experiment is enabled
+	const provider = cline.providerRef.deref()
+	const state = await provider?.getState()
+	const isImageGenerationEnabled = experiments.isEnabled(state?.experiments ?? {}, EXPERIMENT_IDS.IMAGE_GENERATION)
+
+	if (!isImageGenerationEnabled) {
+		pushToolResult(
+			formatResponse.toolError(
+				"Image generation is an experimental feature that must be enabled in settings. Please enable 'Image Generation' in the Experimental Settings section.",
+			),
+		)
+		return
+	}
+
+	if (!prompt) {
+		cline.consecutiveMistakeCount++
+		cline.recordToolError("generate_image")
+		pushToolResult(await cline.sayAndCreateMissingParamError("generate_image", "prompt"))
+		return
+	}
+
+	if (!relPath) {
+		cline.consecutiveMistakeCount++
+		cline.recordToolError("generate_image")
+		pushToolResult(await cline.sayAndCreateMissingParamError("generate_image", "path"))
+		return
+	}
+
+	// Validate access permissions
+	const accessAllowed = cline.rooIgnoreController?.validateAccess(relPath)
+	if (!accessAllowed) {
+		await cline.say("rooignore_error", relPath)
+		pushToolResult(formatResponse.toolError(formatResponse.rooIgnoreError(relPath)))
+		return
+	}
+
+	// Shows the failure in the chat and hands the same text back to the model.
+	const reportFailure = async (message: string): Promise<void> => {
+		await cline.say("error", message)
+		pushToolResult(formatResponse.toolError(message))
+	}
+
+	// Check if file is write-protected
+	const isWriteProtected = cline.rooProtectedController?.isWriteProtected(relPath) || false
+
+	// Image generation settings: prefer the top-level state entry, then fall back to
+	// the active API configuration, where the provider settings schema declares it.
+	// NOTE(review): assumes `state.apiConfiguration` has the provider-settings type — confirm.
+	const apiConfiguration = state?.apiConfiguration
+	const imageGenerationSettings =
+		(state as any)?.imageGenerationSettings ?? apiConfiguration?.imageGenerationSettings
+
+	// Dedicated key first, then the OpenRouter key of the current profile.
+	const openRouterApiKey = imageGenerationSettings?.openRouterApiKey || apiConfiguration?.openRouterApiKey
+
+	if (!openRouterApiKey) {
+		await reportFailure(
+			"OpenRouter API key is required for image generation. Please configure it in the Image Generation experimental settings or use a profile with an OpenRouter API key.",
+		)
+		return
+	}
+
+	// Get selected model from settings or use default
+	const selectedModel = imageGenerationSettings?.selectedModel || IMAGE_GENERATION_MODELS[0]
+
+	// Determine if the path is outside the workspace
+	const cleanedPath = removeClosingTag("path", relPath)
+	const fullPath = path.resolve(cline.cwd, cleanedPath)
+	const isOutsideWorkspace = isPathOutsideWorkspace(fullPath)
+
+	const approvalMessage = JSON.stringify({
+		tool: "generateImage" as const,
+		path: getReadablePath(cline.cwd, cleanedPath),
+		content: prompt,
+		isOutsideWorkspace,
+		isProtected: isWriteProtected,
+	})
+
+	try {
+		cline.consecutiveMistakeCount = 0
+
+		// Ask for approval before generating the image
+		const didApprove = await askApproval("tool", approvalMessage, undefined, isWriteProtected)
+
+		if (!didApprove) {
+			return
+		}
+
+		// Call OpenRouter API to generate image
+		const response = await fetch("https://openrouter.ai/api/v1/chat/completions", {
+			method: "POST",
+			headers: {
+				Authorization: `Bearer ${openRouterApiKey}`,
+				"Content-Type": "application/json",
+				"HTTP-Referer": "https://github.com/RooVetGit/Roo-Code",
+				"X-Title": "Roo Code",
+			},
+			body: JSON.stringify({
+				model: selectedModel,
+				messages: [
+					{
+						role: "user",
+						content: prompt,
+					},
+				],
+				modalities: ["image", "text"],
+			}),
+		})
+
+		if (!response.ok) {
+			const errorText = await response.text()
+			let errorMessage = `Failed to generate image: ${response.status} ${response.statusText}`
+			try {
+				const errorJson = JSON.parse(errorText)
+				if (errorJson.error?.message) {
+					errorMessage = `Failed to generate image: ${errorJson.error.message}`
+				}
+			} catch {
+				// Body was not JSON; keep the status-based message.
+			}
+			await reportFailure(errorMessage)
+			return
+		}
+
+		const result: ImageGenerationResponse = await response.json()
+
+		if (result.error) {
+			// The error object may come without a message; avoid printing "undefined".
+			await reportFailure(`Failed to generate image: ${result.error.message ?? "Unknown error"}`)
+			return
+		}
+
+		// Extract the generated image from the response
+		const images = result.choices?.[0]?.message?.images
+		if (!images || images.length === 0) {
+			await reportFailure("No image was generated in the response")
+			return
+		}
+
+		const imageData = images[0]?.image_url?.url
+		if (!imageData) {
+			await reportFailure("Invalid image data in response")
+			return
+		}
+
+		// Extract base64 data from data URL
+		const base64Match = imageData.match(/^data:image\/(png|jpeg|jpg);base64,(.+)$/)
+		if (!base64Match) {
+			await reportFailure("Invalid image format received")
+			return
+		}
+
+		const imageFormat = base64Match[1]
+		const base64Data = base64Match[2]
+
+		// Ensure the file has an image extension; "jpeg" payloads are saved as ".jpg"
+		let finalPath = relPath
+		if (!finalPath.match(/\.(png|jpg|jpeg)$/i)) {
+			finalPath = `${finalPath}.${imageFormat === "jpeg" ? "jpg" : imageFormat}`
+		}
+
+		// Convert base64 to buffer
+		const imageBuffer = Buffer.from(base64Data, "base64")
+
+		// Create directory if it doesn't exist
+		const absolutePath = path.resolve(cline.cwd, finalPath)
+		await fs.mkdir(path.dirname(absolutePath), { recursive: true })
+
+		// Write the image file
+		await fs.writeFile(absolutePath, imageBuffer)
+
+		// Track file creation
+		await cline.fileContextTracker.trackFileContext(finalPath, "roo_edited")
+
+		cline.didEditFile = true
+
+		// Display the generated image in the chat using a text message with the image
+		const readablePath = getReadablePath(cline.cwd, finalPath)
+		await cline.say("text", `Image generated and saved to: ${readablePath}`, [imageData])
+
+		pushToolResult(formatResponse.toolResult(`Image created successfully at ${readablePath}`))
+	} catch (error) {
+		await handleError("generating image", error)
+	}
+}
Original file line number	Diff line number	Diff line change
`@@ -28,6 +28,7 @@ import { attemptCompletionTool } from "../tools/attemptCompletionTool"`
`28`	`28`	`import { newTaskTool } from "../tools/newTaskTool"`
`29`	`29`
`30`	`30`	`import { updateTodoListTool } from "../tools/updateTodoListTool"`
	`31`	`+import { generateImageTool } from "../tools/generateImageTool"`
`31`	`32`
`32`	`33`	`import { formatResponse } from "../prompts/responses"`
`33`	`34`	`import { validateToolUse } from "../tools/validateToolUse"`
`@@ -221,6 +222,8 @@ export async function presentAssistantMessage(cline: Task) {`
`221`	`222`	`const modeName = getModeBySlug(mode, customModes)?.name ?? mode`
`222`	`223`	return `[${block.name} in ${modeName} mode: '${message}']`
`223`	`224`	`}`
	`225`	`+ case "generate_image":`
	`226`	+ return `[${block.name} for '${block.params.path}']`
`224`	`227`	`}`
`225`	`228`	`}`
`226`	`229`
`@@ -546,6 +549,9 @@ export async function presentAssistantMessage(cline: Task) {`
`546`	`549`	`askFinishSubTaskApproval,`
`547`	`550`	`)`
`548`	`551`	`break`
	`552`	`+ case "generate_image":`
	`553`	`+ await generateImageTool(cline, block, askApproval, handleError, pushToolResult, removeClosingTag)`
	`554`	`+ break`
`549`	`555`	`}`
`550`	`556`
`551`	`557`	`break`