browser-use
diff --git a/‎examples/apps/ad-use/README.md‎
Lines changed: 61 additions & 0 deletions b/‎examples/apps/ad-use/README.md‎
Lines changed: 61 additions & 0 deletions
diff --git a/‎examples/apps/ad-use/ad_generator.py‎
Lines changed: 220 additions & 0 deletions b/‎examples/apps/ad-use/ad_generator.py‎
Lines changed: 220 additions & 0 deletions
diff --git a/‎examples/apps/ad-use/output/ad_20250908_150030.png‎
1.36 MB b/‎examples/apps/ad-use/output/ad_20250908_150030.png‎
1.36 MB
diff --git a/‎examples/apps/ad-use/output/landing_page_20250908_150030.png‎
1.45 MB b/‎examples/apps/ad-use/output/landing_page_20250908_150030.png‎
1.45 MB
@@ -0,0 +1,61 @@
+# Ad-Use
+
+Automatically generate Instagram ads from any landing page using browser agents and Google's Nano Banana 🍌 image generation model.
+
+> [!CAUTION]
+> This demo requires browser-use v0.7.4+.
+
+## Features
+
+1. Agent visits your target website
+2. Captures brand name, tagline, and key selling points
+3. Takes a clean screenshot for design reference
+4. Creates a scroll-stopping Instagram ad with 🍌
+
+## Setup
+
+Make sure the newest version of browser-use is installed (with screenshot functionality):
+```bash
+pip install -U browser-use
+```
+
+Get a Gemini API key from [Google AI Studio](https://makersuite.google.com/app/apikey) and export it:
+```bash
+export GOOGLE_API_KEY='your-google-api-key-here'
+```
+
+## Normal Usage
+
+```bash
+# Basic - Generate ad from any website
+python ad_generator.py https://www.apple.com/iphone-16-pro/
+
+# Debug Mode - See the browser in action
+python ad_generator.py https://www.apple.com/iphone-16-pro/ --debug
+```
+
+## Programmatic Usage
+```python
+import asyncio
+from ad_generator import create_ad_from_landing_page
+
+async def main():
+    results = await create_ad_from_landing_page(
+        url="https://your-landing-page.com",
+        debug=False
+    )
+    print(f"Generated ads: {results}")
+
+asyncio.run(main())
+```
+
+## Output
+
+Generated files are saved in the `output/` directory:
+- **Ad image** (`ad_<timestamp>.png`) - The generated ad from Gemini 2.5 Flash Image
+- **Analysis file** (`analysis_<timestamp>.txt`) - The source URL, the browser-use analysis, and the prompt used for generation
+- **Landing page screenshot** (`landing_page_<timestamp>.png`) - Captured for design reference
+
+## Source Code
+
+Full implementation: [https://github.com/browser-use/browser-use/tree/main/examples/apps/ad-use](https://github.com/browser-use/browser-use/tree/main/examples/apps/ad-use) 
@@ -0,0 +1,220 @@
+import asyncio
+import argparse
+import logging
+import os
+import subprocess
+import sys
+from datetime import datetime
+from pathlib import Path
+from typing import Dict
+
+def setup_environment(debug: bool):
+    if not debug:
+        os.environ['BROWSER_USE_SETUP_LOGGING'] = 'false'
+        os.environ['BROWSER_USE_LOGGING_LEVEL'] = 'critical'
+        logging.getLogger().setLevel(logging.CRITICAL)
+    else:
+        os.environ['BROWSER_USE_SETUP_LOGGING'] = 'true'
+        os.environ['BROWSER_USE_LOGGING_LEVEL'] = 'info'
+
+parser = argparse.ArgumentParser(description='Generate ads from landing pages using browser-use + 🍌')
+parser.add_argument('url', nargs='?', help='Landing page URL to analyze')
+parser.add_argument('--debug', action='store_true', default=False, help='Enable debug mode (show browser, verbose logs)')
+args = parser.parse_args()
+setup_environment(args.debug)
+
+from PIL import Image
+from google import genai
+from browser_use import Agent, BrowserSession
+from browser_use.llm.google import ChatGoogle
+import aiofiles
+
+# Gemini API key read from the GOOGLE_API_KEY environment variable (None when unset).
+GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")
+
+class LandingPageAnalyzer:
+    def __init__(self, debug: bool = False):
+        self.debug = debug
+        self.llm = ChatGoogle(
+            model="gemini-2.0-flash-exp",
+            api_key=GOOGLE_API_KEY
+        )
+        self.output_dir = Path("output")
+        self.output_dir.mkdir(exist_ok=True)
+        
+    async def analyze_landing_page(self, url: str) -> Dict:
+        browser_session = BrowserSession(
+            headless=not self.debug,  # headless=False only when debug=True
+            disable_security=True
+        )
+        
+        agent = Agent(
+            task=f"""Go to {url} and quickly extract key brand information for Instagram ad creation.
+
+Steps:
+1. Navigate to the website
+2. From the initial view, extract ONLY these essentials:
+   - Brand/Product name
+   - Main tagline or value proposition (one sentence)
+   - Primary call-to-action text
+   - Any visible pricing or special offer
+3. Scroll down half a page, twice (0.5 pages each) to check for any key info
+4. Done - keep it simple and focused on the brand
+
+Return ONLY the key brand info, not page structure details.""",
+            llm=self.llm,
+            browser_session=browser_session,
+            max_actions_per_step=2,
+            step_timeout=30,
+            use_thinking=False,
+            vision_detail_level='high',
+        )
+        
+        screenshot_path = None
+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+        
+        # Take screenshot after page fully loads
+        async def screenshot_callback(agent_instance):
+            nonlocal screenshot_path
+            import asyncio
+            await asyncio.sleep(4)
+            screenshot_path = self.output_dir / f"landing_page_{timestamp}.png"
+            active_session = agent_instance.browser_session
+            screenshot_data = await active_session.take_screenshot(path=str(screenshot_path), full_page=False)
+        
+        import asyncio
+        screenshot_task = asyncio.create_task(screenshot_callback(agent))
+        
+        history = await agent.run()
+        
+        try:
+            await screenshot_task
+        except Exception as e:
+            print(f"Screenshot task failed: {e}")
+        
+        analysis = history.final_result()
+        if not analysis:
+            analysis = "No analysis content extracted"
+        
+        return {
+            'url': url,
+            'analysis': analysis,
+            'screenshot_path': screenshot_path,
+            'timestamp': timestamp
+        }
+
+class AdGenerator:
+    def __init__(self, api_key: str = GOOGLE_API_KEY):
+        self.client = genai.Client(api_key=api_key)
+        self.output_dir = Path("output")
+        self.output_dir.mkdir(exist_ok=True)
+
+    def create_ad_prompt(self, browser_analysis: str) -> str:
+        prompt = f"""Create an Instagram ad for this brand:
+
+{browser_analysis}
+
+Create a vibrant, eye-catching Instagram ad image with:
+- Try to use the colors and style of the logo or brand, else:
+- Bold, modern gradient background with bright colors
+- Large, playful sans-serif text with the product/service name from the analysis
+- Trendy design elements: geometric shapes, sparkles, emojis
+- Fun bubbles or badges for any pricing or special offers mentioned
+- Call-to-action button with text from the analysis
+- Emphasizes the key value proposition from the analysis
+- Uses visual elements that match the brand personality
+- Square format (1:1 ratio)
+- Use color psychology to drive action
+
+Style: Modern Instagram advertisement, (1:1), scroll-stopping, professional but playful, conversion-focused"""
+        return prompt
+
+    async def generate_ad_image(self, prompt: str, screenshot_path: Path = None) -> bytes:
+        try:
+            contents = [prompt]
+            
+            if screenshot_path and screenshot_path.exists():
+                screenshot_prompt = f"\n\nHere is the actual landing page screenshot to reference for design inspiration, colors, layout, and visual style:"
+                text_part=prompt+screenshot_prompt
+                img=Image.open(screenshot_path)
+                w,h=img.size
+                img=img.crop(((w-min(w,h))//2,(h-min(w,h))//2,(w+min(w,h))//2,(h+min(w,h))//2))
+                contents=[text_part,img]
+            
+            response = self.client.models.generate_content(
+                model="gemini-2.5-flash-image-preview",
+                contents=contents
+            )
+            
+            for part in response.candidates[0].content.parts:
+                if hasattr(part, 'inline_data') and part.inline_data:
+                    return part.inline_data.data
+                    
+        except Exception as e:
+            print(f"❌ Image generation failed: {e}")
+            
+    async def save_results(self, ad_image: bytes, prompt: str, analysis: str, url: str, timestamp: str) -> str:
+        image_path = self.output_dir / f"ad_{timestamp}.png"
+        with open(image_path, 'wb') as f:
+            f.write(ad_image)
+        
+        analysis_path = self.output_dir / f"analysis_{timestamp}.txt"
+        async with aiofiles.open(analysis_path, 'w', encoding='utf-8') as f:
+            await f.write(f"URL: {url}\n\n")
+            await f.write("BROWSER-USE ANALYSIS:\n")
+            await f.write(analysis)
+            await f.write("\n\nGENERATED PROMPT:\n")
+            await f.write(prompt)
+        
+        return str(image_path)
+
+def open_image(image_path: str):
+    """Open image with default system viewer"""
+    try:
+        if sys.platform.startswith('darwin'):  
+            # macOS
+            subprocess.run(['open', image_path], check=True)
+        elif sys.platform.startswith('win'):  
+            # Windows
+            os.startfile(image_path)
+        else:  
+            # Linux
+            subprocess.run(['xdg-open', image_path], check=True)
+    except Exception as e:
+        print(f"❌ Could not open image: {e}")
+
+async def create_ad_from_landing_page(url: str, debug: bool = False):
+    analyzer = LandingPageAnalyzer(debug=debug)
+    generator = AdGenerator()
+    
+    try:
+        print(f"🚀 Analyzing {url}...")
+        page_data = await analyzer.analyze_landing_page(url)
+        
+        prompt = generator.create_ad_prompt(page_data['analysis'])
+        ad_image = await generator.generate_ad_image(prompt, page_data.get('screenshot_path'))
+        result_path = await generator.save_results(
+            ad_image, 
+            prompt, 
+            page_data['analysis'], 
+            url, 
+            page_data['timestamp']
+        )
+        
+        print(f"🎨 Generated ad: {result_path}")
+        if page_data.get('screenshot_path'):
+            print(f"📸 Page screenshot: {page_data['screenshot_path']}")
+        open_image(result_path)
+        
+        return result_path
+        
+    except Exception as e:
+        print(f"❌ Error: {e}")
+        raise
+
+
+if __name__ == "__main__":
+    url = args.url
+    if not url:
+        url = input("🔗 Enter URL: ").strip() or "https://www.apple.com/iphone-16-pro/"
+    
+    asyncio.run(create_ad_from_landing_page(url, debug=args.debug))