feat: add script to open gemini tab and submit prompt

est7 · dehesa · commit 867d36916402 · 2025-05-13T10:31:00.000+02:00
Implement a Node.js script that enables seamless interaction with Google Gemini from Raycast. The script allows users to:
- Open Gemini in Chrome browser
- Submit prompts with optional selected text as context
- Work with existing Gemini tabs without opening duplicates

Dependencies: Node.js and chrome-cli

feat: add script to open gemini tab and submit prompt

Implement a Node.js script that enables seamless interaction with Google Gemini from Raycast. The script allows users to:
- Open Gemini in Chrome browser
- Submit prompts with optional selected text as context
- Work with existing Gemini tabs without opening duplicates

Dependencies: Node.js and chrome-cli

Delete gemini.js
diff --git a/commands/ai/gemini/gemini.js b/commands/ai/gemini/gemini.js
@@ -0,0 +1,205 @@
+#!/usr/bin/env node
+
+// Dependencies:
+// This script requires the following software to be installed:
+// - `node` https://nodejs.org
+// - `chrome-cli` https://github.com/prasmussen/chrome-cli
+// Install via homebrew: `brew install node chrome-cli`
+
+// This script needs to run JavaScript in your browser, which requires your permission.
+// To do so, open Chrome and find the menu bar item:
+// View > Developer > Allow JavaScript from Apple Events
+
+// Required parameters:
+// @raycast.schemaVersion 1
+// @raycast.title Ask Gemini
+// @raycast.mode silent
+// @raycast.packageName Gemini
+
+// Optional parameters:
+// @raycast.icon ../images/icon-gemini.svg
+// @raycast.argument1 { "type": "text", "placeholder": "Selected Text", "optional": true }
+// @raycast.argument2 { "type": "text", "placeholder": "Prompt"}
+
+// Documentation:
+// @raycast.description Open Gemini in Chrome browser and submit a prompt with optional selected text as context
+// @raycast.author Modified from Nimo Beeren's Claude script
+
+const { execSync } = require("child_process");
+
+const selectedText = process.argv[2] || ""; // Get the selected text, or an empty string if none is selected.
+const prompt = process.argv[3]; // The prompt text (second Raycast argument).
+
+process.env.OUTPUT_FORMAT = "json"; // Child processes inherit this; the chrome-cli output below is parsed with JSON.parse.
+
+/** Escape a string so that it can be used in JavaScript code when wrapped in double quotes. */
+function escapeJsString(str) {
+  return str.replaceAll(`\\`, `\\\\`).replaceAll(`"`, `\\"`);
+}
+
+/** Escape a string so that it can be used in a shell command when wrapped in single quotes. */
+function escapeShellString(str) {
+  return str.replaceAll(`'`, `'"'"'`);
+}
+
+// used to wait for Chrome to activate.
+function sleep(ms) {
+  const start = Date.now();
+  while (Date.now() - start < ms) {}
+}
+
+try {
+  execSync("which chrome-cli"); // fails (and execSync throws) when chrome-cli is not on the PATH
+} catch {
+  console.error(
+    "chrome-cli is required to run this script (https://github.com/prasmussen/chrome-cli)",
+  );
+  process.exit(1);
+}
+
+// Bring Chrome to the foreground first.
+try {
+  // Try to activate Chrome through AppleScript, supporting different possible application names.
+  execSync("osascript -e 'tell application \"Google Chrome\" to activate'", {
+    stdio: "ignore",
+  });
+} catch (e) {
+  try {
+    // If the first naming method fails, try possible alternatives.
+    execSync("osascript -e 'tell application \"Chrome\" to activate'", {
+      stdio: "ignore",
+    });
+  } catch (err) {
+    console.error(
+      "Unable to activate Chrome browser, continue with other operations",
+    );
+  }
+}
+
+// Give Chrome a little time to make sure it is activated
+sleep(300);
+
+// Find the Gemini tab if one is already open
+let tabs = JSON.parse(execSync("chrome-cli list tabs")).tabs;
+let geminiTab = tabs.find((tab) =>
+  tab.url.startsWith("https://gemini.google.com/"),
+);
+
+// If there is a Gemini tab open, get its info. Otherwise, open Gemini in a new tab.
+let geminiTabInfo;
+if (geminiTab) {
+  // Focus the existing tab; do not refresh the page
+  execSync(`chrome-cli activate -t ${geminiTab.id}`);
+  // Get tab info
+  geminiTabInfo = JSON.parse(execSync(`chrome-cli info -t ${geminiTab.id}`));
+} else {
+  // Open a Gemini session in a new tab, focus it and return the tab info
+  geminiTabInfo = JSON.parse(
+    execSync("chrome-cli open 'https://gemini.google.com/app'"),
+  );
+}
+
+// Poll every 100 ms: re-query the tab info while it reports `loading`, then stop polling and execute the script
+let interval = setInterval(() => {
+  if (geminiTabInfo.loading) {
+    geminiTabInfo = JSON.parse(
+      execSync(`chrome-cli info -t ${geminiTabInfo.id}`),
+    );
+  } else {
+    clearInterval(interval);
+    executeScript();
+  }
+}, 100);
+
+function executeScript() {
+  const script = async function (selectedText, prompt) {
+    // Wait for prompt element to be on the page
+    let promptElement;
+    await new Promise((resolve) => {
+      let interval = setInterval(() => {
+        promptElement = document.querySelector(
+          'div[aria-label="Enter a prompt here"]',
+        );
+        if (promptElement) {
+          clearInterval(interval);
+          resolve();
+        }
+      }, 100);
+    });
+
+    // Prepare the final text
+    let finalText = "";
+    if (selectedText && selectedText.trim() !== "") {
+      finalText += `<file_content>${selectedText}</file_contents>\n\n${prompt}`;
+    } else {
+      finalText = prompt;
+    }
+
+    // Focus the input element first
+    promptElement.focus();
+
+    // Check if there's existing content
+    const hasExistingContent = promptElement.textContent.trim() !== "";
+
+    // Clear existing content if needed - safely without innerHTML
+    if (!hasExistingContent) {
+      // If empty, we'll just add our content
+      // No need to clear anything
+    } else {
+      // If we want to append to existing content, add a newline
+      // Create a new paragraph for separation
+      const selection = window.getSelection();
+      const range = document.createRange();
+
+      // Move cursor to the end of existing content
+      range.selectNodeContents(promptElement);
+      range.collapse(false); // false means collapse to end
+      selection.removeAllRanges();
+      selection.addRange(range);
+
+      // Insert two newlines to separate content
+      document.execCommand("insertText", false, "\n\n");
+    }
+
+    // Insert the content using execCommand which is safer than innerHTML
+    // Split by newlines and insert with proper paragraph formatting
+    const paragraphs = finalText.split("\n");
+    paragraphs.forEach((paragraph, index) => {
+      if (index > 0) {
+        // Insert newline between paragraphs (not before the first one)
+        document.execCommand("insertText", false, "\n");
+      }
+
+      // Insert the paragraph text
+      document.execCommand("insertText", false, paragraph || "\u200B");
+    });
+
+    // Trigger input event to notify Gemini of changes
+    const inputEvent = new Event("input", { bubbles: true });
+    promptElement.dispatchEvent(inputEvent);
+
+    // Ensure cursor is at the end and visible
+    const selection = window.getSelection();
+    const range = document.createRange();
+    range.selectNodeContents(promptElement);
+    range.collapse(false); // false means collapse to end
+    selection.removeAllRanges();
+    selection.addRange(range);
+
+    // Scroll to make cursor visible
+    promptElement.scrollTop = promptElement.scrollHeight;
+
+    // Additional scroll after a short delay to ensure visibility
+    setTimeout(() => {
+      promptElement.scrollTop = promptElement.scrollHeight;
+    }, 100);
+  };
+
+  const functionString = escapeShellString(script.toString());
+  const selectedTextString = escapeShellString(escapeJsString(selectedText));
+  const promptString = escapeShellString(escapeJsString(prompt));
+
+  execSync(
+    `chrome-cli execute '(${functionString})(\"${selectedTextString}\", \"${promptString}\")' -t ${geminiTabInfo.id}`,
+  );
+}
diff --git a/commands/ai/images/icon-gemini.svg b/commands/ai/images/icon-gemini.svg
@@ -0,0 +1,10 @@
+<svg width="28" height="28" viewBox="0 0 28 28" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path d="M14 28C14 26.0633 13.6267 24.2433 12.88 22.54C12.1567 20.8367 11.165 19.355 9.905 18.095C8.645 16.835 7.16333 15.8433 5.46 15.12C3.75667 14.3733 1.93667 14 0 14C1.93667 14 3.75667 13.6383 5.46 12.915C7.16333 12.1683 8.645 11.165 9.905 9.905C11.165 8.645 12.1567 7.16333 12.88 5.46C13.6267 3.75667 14 1.93667 14 0C14 1.93667 14.3617 3.75667 15.085 5.46C15.8317 7.16333 16.835 8.645 18.095 9.905C19.355 11.165 20.8367 12.1683 22.54 12.915C24.2433 13.6383 26.0633 14 28 14C26.0633 14 24.2433 14.3733 22.54 15.12C20.8367 15.8433 19.355 16.835 18.095 18.095C16.835 19.355 15.8317 20.8367 15.085 22.54C14.3617 24.2433 14 26.0633 14 28Z" fill="url(#paint0_radial_16771_53212)"/>
+<defs>
+<radialGradient id="paint0_radial_16771_53212" cx="0" cy="0" r="1" gradientUnits="userSpaceOnUse" gradientTransform="translate(2.77876 11.3795) rotate(18.6832) scale(29.8025 238.737)">
+<stop offset="0.0671246" stop-color="#9168C0"/>
+<stop offset="0.342551" stop-color="#5684D1"/>
+<stop offset="0.672076" stop-color="#1BA1E3"/>
+</radialGradient>
+</defs>
+</svg>