
Commit 9f36969

Major fixes to how we retrieve data from the API through the SDK's providers
1 parent 8a206c4 commit 9f36969

28 files changed: +3714 -340 lines

lastcheck.md

Lines changed: 400 additions & 0 deletions
Large diffs are not rendered by default.

src/brightdata/scrapers/amazon/scraper.py

Lines changed: 6 additions & 17 deletions

@@ -43,9 +43,9 @@ class AmazonScraper(BaseWebScraper):
     """

     # Amazon dataset IDs
-    DATASET_ID = "gd_l7q7dkf244hwxbl93"  # Amazon Products
-    DATASET_ID_REVIEWS = "gd_l1vq6tkpl34p7mq7c"  # Amazon Reviews
-    DATASET_ID_SELLERS = "gd_lwjkkolem8c4o7j3s"  # Amazon Sellers
+    DATASET_ID = "gd_l7q7dkf244hwjntr0"  # Amazon Products
+    DATASET_ID_REVIEWS = "gd_le8e811kzy4ggddlq"  # Amazon Reviews
+    DATASET_ID_SELLERS = "gd_lhotzucw1etoe5iw1k"  # Amazon Sellers

     PLATFORM_NAME = "amazon"
     MIN_POLL_TIMEOUT = DEFAULT_TIMEOUT_MEDIUM  # Amazon scrapes can take longer

@@ -150,21 +150,10 @@ async def reviews_async(
         else:
             validate_url_list(url)

-        # Build custom payload with review filters
+        # Build payload - Amazon Reviews dataset only accepts URL
+        # Note: pastDays, keyWord, numOfReviews are not supported by the API
         url_list = [url] if isinstance(url, str) else url
-        payload = []
-
-        for u in url_list:
-            item: Dict[str, Any] = {"url": u}
-
-            if pastDays is not None:
-                item["pastDays"] = pastDays
-            if keyWord is not None:
-                item["keyWord"] = keyWord
-            if numOfReviews is not None:
-                item["numOfReviews"] = numOfReviews
-
-            payload.append(item)
+        payload = [{"url": u} for u in url_list]

         # Use reviews dataset with standard async workflow
         is_single = isinstance(url, str)
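
What reviews_async() now sends, as a standalone sketch (the helper name below is illustrative; the logic mirrors the diff): only the URL survives into the payload.

from typing import Any, Dict, List, Union

def build_reviews_payload(url: Union[str, List[str]]) -> List[Dict[str, Any]]:
    """Stand-in for the simplified payload build: URL only, no filter keys."""
    url_list = [url] if isinstance(url, str) else url
    return [{"url": u} for u in url_list]

# build_reviews_payload("https://www.amazon.com/dp/B0CRMZHDG8")
#   -> [{'url': 'https://www.amazon.com/dp/B0CRMZHDG8'}]
# pastDays, keyWord and numOfReviews are still accepted by reviews_async()
# for compatibility, but they are no longer forwarded to the Reviews dataset.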

src/brightdata/scrapers/api_client.py

Lines changed: 2 additions & 2 deletions

@@ -65,9 +65,9 @@ async def trigger(
             "dataset_id": dataset_id,
             "include_errors": str(include_errors).lower(),
         }
-
+
         if sdk_function:
-            payload = [{**item, "sdk_function": sdk_function} for item in payload]
+            params["sdk_function"] = sdk_function

         async with self.engine.post_to_url(
             self.TRIGGER_URL,
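
Illustrative before/after of the trigger request shape (standalone sketch, not the SDK's actual request code; the sdk_function value "products" is hypothetical):

payload = [{"url": "https://www.amazon.com/dp/B0CRMZHDG8"}]

# Before: the marker was injected into every payload item
body_before = [{**item, "sdk_function": "products"} for item in payload]

# After: the payload stays untouched and the marker travels as a query parameter
params_after = {
    "dataset_id": "gd_l7q7dkf244hwjntr0",
    "include_errors": "true",
    "sdk_function": "products",
}
# i.e. POST TRIGGER_URL?dataset_id=...&include_errors=true&sdk_function=products
# with the unmodified payload as the JSON body.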

src/brightdata/scrapers/chatgpt/scraper.py

Lines changed: 7 additions & 5 deletions

@@ -81,13 +81,14 @@ async def prompt_async(
         if not prompt or not isinstance(prompt, str):
             raise ValidationError("Prompt must be a non-empty string")

-        # Build payload
+        # Build payload - ChatGPT scraper requires url field pointing to ChatGPT
         payload = [{
+            "url": "https://chatgpt.com/",
             "prompt": prompt,
             "country": country.upper(),
             "web_search": web_search,
         }]
-
+
         if additional_prompt:
             payload[0]["additional_prompt"] = additional_prompt

@@ -158,18 +159,19 @@ async def prompts_async(
         if not prompts or not isinstance(prompts, list):
             raise ValidationError("Prompts must be a non-empty list")

-        # Build batch payload
+        # Build batch payload - ChatGPT scraper requires url field
         payload = []
         for i, prompt in enumerate(prompts):
             item = {
+                "url": "https://chatgpt.com/",
                 "prompt": prompt,
                 "country": countries[i].upper() if countries and i < len(countries) else "US",
                 "web_search": web_searches[i] if web_searches and i < len(web_searches) else False,
             }
-
+
             if additional_prompts and i < len(additional_prompts):
                 item["additional_prompt"] = additional_prompts[i]
-
+
             payload.append(item)

         # Execute workflow
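
A sketch of the payload prompt_async() now builds (prompt text and country are illustrative); the key change is the mandatory "url" entry pointing at ChatGPT:

payload = [{
    "url": "https://chatgpt.com/",   # required by the ChatGPT dataset
    "prompt": "Summarize this week's AI news",
    "country": "US",
    "web_search": False,
}]
# prompts_async() builds the same shape once per prompt and adds an
# "additional_prompt" key only when one is supplied.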

src/brightdata/scrapers/instagram/search.py

Lines changed: 1 addition & 1 deletion

@@ -115,7 +115,6 @@ async def posts_async(
             end_date=end_date,
             post_type=post_type,
             timeout=timeout,
-            sdk_function="posts",
         )

     def posts(

@@ -216,6 +215,7 @@ async def _discover_with_params(
         end_date: Optional[str] = None,
         post_type: Optional[str] = None,
         timeout: int = DEFAULT_TIMEOUT_MEDIUM,
+        sdk_function: Optional[str] = None,
     ) -> Union[ScrapeResult, List[ScrapeResult]]:
         """
         Discover content with additional parameters using standard async workflow.
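
Condensed view of the signature change, as a stripped-down stand-in rather than the full method:

from typing import Optional

# Before: posts_async() hard-coded sdk_function="posts" when delegating.
# After: the delegate accepts it as an optional keyword and posts_async() omits it.
async def _discover_with_params(
    end_date: Optional[str] = None,
    post_type: Optional[str] = None,
    timeout: int = 240,                  # DEFAULT_TIMEOUT_MEDIUM in the SDK
    sdk_function: Optional[str] = None,  # newly added, defaults to None
) -> None:
    ...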

src/brightdata/scrapers/linkedin/scraper.py

Lines changed: 4 additions & 4 deletions

@@ -53,10 +53,10 @@ class LinkedInScraper(BaseWebScraper):
     """

     # LinkedIn dataset IDs
-    DATASET_ID = "gd_l1oojb10z2jye29kh"  # People Profiles
-    DATASET_ID_COMPANIES = "gd_lhkq90okie75oj8mo"  # Companies
-    DATASET_ID_JOBS = "gd_lj4v2v5oqpp3qb79j"  # Jobs
-    DATASET_ID_POSTS = "gd_lwae11111pwxp6c4ea"  # Posts
+    DATASET_ID = "gd_l1viktl72bvl7bjuj0"  # People Profiles
+    DATASET_ID_COMPANIES = "gd_l1vikfnt1wgvvqz95w"  # Companies
+    DATASET_ID_JOBS = "gd_lpfll7v5hcqtkxl6l"  # Jobs
+    DATASET_ID_POSTS = "gd_lyy3tktm25m4avu764"  # Posts

     PLATFORM_NAME = "linkedin"
     MIN_POLL_TIMEOUT = DEFAULT_TIMEOUT_SHORT
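
For quick reference, the refreshed LinkedIn dataset IDs in one place (assembled from this diff, not pulled from the SDK):

LINKEDIN_DATASET_IDS = {
    "people_profiles": "gd_l1viktl72bvl7bjuj0",
    "companies": "gd_l1vikfnt1wgvvqz95w",
    "jobs": "gd_lpfll7v5hcqtkxl6l",
    "posts": "gd_lyy3tktm25m4avu764",
}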

src/brightdata/scrapers/linkedin/search.py

Lines changed: 9 additions & 5 deletions

@@ -39,9 +39,10 @@ class LinkedInSearchScraper:
     """

     # Dataset IDs for different LinkedIn types
-    DATASET_ID_POSTS = "gd_lwae11111pwxp6c4ea"
-    DATASET_ID_PROFILES = "gd_l1oojb10z2jye29kh"
-    DATASET_ID_JOBS = "gd_lj4v2v5oqpp3qb79j"
+    DATASET_ID_POSTS = "gd_lyy3tktm25m4avu764"
+    DATASET_ID_PROFILES = "gd_l1viktl72bvl7bjuj0"
+    DATASET_ID_JOBS = "gd_lpfll7v5hcqtkxl6l"  # URL-based job scraping
+    DATASET_ID_JOBS_DISCOVERY = "gd_m487ihp32jtc4ujg45"  # Keyword/location discovery

     def __init__(self, bearer_token: str, engine: Optional[AsyncEngine] = None):
         """

@@ -288,10 +289,13 @@ async def jobs_async(
                 item["locationRadius"] = location_radii[i]

             payload.append(item)
-
+
+        # Use discovery dataset if searching by keyword/location, otherwise URL-based
+        dataset_id = self.DATASET_ID_JOBS_DISCOVERY if (keyword or location) else self.DATASET_ID_JOBS
+
         return await self._execute_search(
             payload=payload,
-            dataset_id=self.DATASET_ID_JOBS,
+            dataset_id=dataset_id,
             timeout=timeout
         )
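
The routing logic added to jobs_async(), isolated as a runnable sketch (the function name is illustrative; the constants and the condition come from the diff):

DATASET_ID_JOBS = "gd_lpfll7v5hcqtkxl6l"             # URL-based job scraping
DATASET_ID_JOBS_DISCOVERY = "gd_m487ihp32jtc4ujg45"  # keyword/location discovery

def pick_jobs_dataset(keyword=None, location=None, url=None):
    """Keyword or location searches route to the discovery dataset."""
    return DATASET_ID_JOBS_DISCOVERY if (keyword or location) else DATASET_ID_JOBS

assert pick_jobs_dataset(keyword="python developer") == DATASET_ID_JOBS_DISCOVERY
assert pick_jobs_dataset(url="https://www.linkedin.com/jobs/view/123") == DATASET_ID_JOBS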

tests/enes/amazon.py

Lines changed: 66 additions & 58 deletions

@@ -24,39 +24,43 @@ async def test_amazon_products():
     client = BrightDataClient()

     async with client.engine:
-        print("\n🛒 Testing Amazon product scraping...")
-        print("📍 Product URL: https://www.amazon.com/dp/B0CRMZHDG8")
-
-        try:
-            result = await client.scrape.amazon.products_async(
-                url="https://www.amazon.com/dp/B0CRMZHDG8",
-                timeout=240
-            )
-
-            print(f"\n✅ API call succeeded")
-            print(f"⏱️ Elapsed: {result.elapsed_ms():.2f}ms" if result.elapsed_ms() else "")
-
-            print(f"\n📊 Result analysis:")
-            print(f"   - result.success: {result.success}")
-            print(f"   - result.data type: {type(result.data)}")
-
-            if result.data:
-                print(f"\n✅ Got product data:")
-                if isinstance(result.data, dict):
-                    print(f"   - Title: {result.data.get('title', 'N/A')}")
-                    print(f"   - Price: {result.data.get('price', 'N/A')}")
-                    print(f"   - ASIN: {result.data.get('asin', 'N/A')}")
-                    print(f"   - Rating: {result.data.get('rating', 'N/A')}")
-                    print(f"   - Review Count: {result.data.get('reviews_count', 'N/A')}")
-                else:
-                    print(f"   Data: {result.data}")
-            else:
-                print(f"\n❌ No product data returned")
-
-        except Exception as e:
-            print(f"\n❌ Error: {e}")
-            import traceback
-            traceback.print_exc()
+        scraper = client.scrape.amazon
+        async with scraper.engine:
+            print("\n🛒 Testing Amazon product scraping...")
+            print("📍 Product URL: https://www.amazon.com/dp/B0CRMZHDG8")
+
+            try:
+                result = await scraper.products_async(
+                    url="https://www.amazon.com/dp/B0CRMZHDG8",
+                    timeout=240
+                )
+
+                print(f"\n✅ API call succeeded")
+                print(f"⏱️ Elapsed: {result.elapsed_ms():.2f}ms" if result.elapsed_ms() else "")
+
+                print(f"\n📊 Result analysis:")
+                print(f"   - result.success: {result.success}")
+                print(f"   - result.data type: {type(result.data)}")
+                print(f"   - result.status: {result.status if hasattr(result, 'status') else 'N/A'}")
+                print(f"   - result.error: {result.error if hasattr(result, 'error') else 'N/A'}")
+
+                if result.data:
+                    print(f"\n✅ Got product data:")
+                    if isinstance(result.data, dict):
+                        print(f"   - Title: {result.data.get('title', 'N/A')}")
+                        print(f"   - Price: {result.data.get('price', 'N/A')}")
+                        print(f"   - ASIN: {result.data.get('asin', 'N/A')}")
+                        print(f"   - Rating: {result.data.get('rating', 'N/A')}")
+                        print(f"   - Review Count: {result.data.get('reviews_count', 'N/A')}")
+                    else:
+                        print(f"   Data: {result.data}")
+                else:
+                    print(f"\n❌ No product data returned")
+
+            except Exception as e:
+                print(f"\n❌ Error: {e}")
+                import traceback
+                traceback.print_exc()


 async def test_amazon_reviews():

@@ -69,45 +73,49 @@ async def test_amazon_reviews():
     client = BrightDataClient()

     async with client.engine:
-        print("\n📝 Testing Amazon reviews scraping...")
-        print("📍 Product URL: https://www.amazon.com/dp/B0CRMZHDG8")
-        print("📋 Parameters: pastDays=30, numOfReviews=10")
-
-        try:
-            result = await client.scrape.amazon.reviews_async(
-                url="https://www.amazon.com/dp/B0CRMZHDG8",
-                pastDays=30,
-                numOfReviews=10,
-                timeout=240
-            )
-
-            print(f"\n✅ API call succeeded")
-            print(f"⏱️ Elapsed: {result.elapsed_ms():.2f}ms" if result.elapsed_ms() else "")
-
-            print(f"\n📊 Result analysis:")
-            print(f"   - result.success: {result.success}")
-            print(f"   - result.data type: {type(result.data)}")
-
-            if result.data:
-                if isinstance(result.data, list):
-                    print(f"\n✅ Got {len(result.data)} reviews:")
-                    for i, review in enumerate(result.data[:3], 1):
-                        print(f"\n   Review {i}:")
-                        print(f"   - Rating: {review.get('rating', 'N/A')}")
-                        print(f"   - Title: {review.get('title', 'N/A')[:60]}...")
-                        print(f"   - Author: {review.get('author', 'N/A')}")
-                elif isinstance(result.data, dict):
-                    reviews = result.data.get('reviews', [])
-                    print(f"\n✅ Got {len(reviews)} reviews")
-                else:
-                    print(f"   Data: {result.data}")
-            else:
-                print(f"\n❌ No reviews data returned")
-
-        except Exception as e:
-            print(f"\n❌ Error: {e}")
-            import traceback
-            traceback.print_exc()
+        scraper = client.scrape.amazon
+        async with scraper.engine:
+            print("\n📝 Testing Amazon reviews scraping...")
+            print("📍 Product URL: https://www.amazon.com/dp/B0CRMZHDG8")
+            print("📋 Parameters: pastDays=30, numOfReviews=10")
+
+            try:
+                result = await scraper.reviews_async(
+                    url="https://www.amazon.com/dp/B0CRMZHDG8",
+                    pastDays=30,
+                    numOfReviews=10,
+                    timeout=240
+                )
+
+                print(f"\n✅ API call succeeded")
+                print(f"⏱️ Elapsed: {result.elapsed_ms():.2f}ms" if result.elapsed_ms() else "")
+
+                print(f"\n📊 Result analysis:")
+                print(f"   - result.success: {result.success}")
+                print(f"   - result.data type: {type(result.data)}")
+                print(f"   - result.status: {result.status if hasattr(result, 'status') else 'N/A'}")
+                print(f"   - result.error: {result.error if hasattr(result, 'error') else 'N/A'}")
+
+                if result.data:
+                    if isinstance(result.data, list):
+                        print(f"\n✅ Got {len(result.data)} reviews:")
+                        for i, review in enumerate(result.data[:3], 1):
+                            print(f"\n   Review {i}:")
+                            print(f"   - Rating: {review.get('rating', 'N/A')}")
+                            print(f"   - Title: {review.get('title', 'N/A')[:60]}...")
+                            print(f"   - Author: {review.get('author', 'N/A')}")
+                    elif isinstance(result.data, dict):
+                        reviews = result.data.get('reviews', [])
+                        print(f"\n✅ Got {len(reviews)} reviews")
+                    else:
+                        print(f"   Data: {result.data}")
+                else:
+                    print(f"\n❌ No reviews data returned")
+
+            except Exception as e:
+                print(f"\n❌ Error: {e}")
+                import traceback
+                traceback.print_exc()


 if __name__ == "__main__":
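
The access pattern the updated tests rely on, as a minimal standalone sketch (import path assumed): the scraper is bound once and its own engine context is entered inside the client engine context.

import asyncio
from brightdata import BrightDataClient  # assumed import path

async def main():
    client = BrightDataClient()
    async with client.engine:
        scraper = client.scrape.amazon
        async with scraper.engine:  # nested engine context used by the tests
            result = await scraper.products_async(
                url="https://www.amazon.com/dp/B0CRMZHDG8",
                timeout=240,
            )
            print(result.success, type(result.data))

asyncio.run(main())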
