# Scraper definition for vod.newsensations.com.
# Three URL-driven xPath scrapers are declared below:
#   - groupByURL     -> movieScraper      (pages under /dvds)
#   - sceneByURL     -> sceneScraper      (pages under /scenes)
#   - performerByURL -> performerScraper  (pages under /models)
name: "NewSensationsVOD"
groupByURL:
  - action: scrapeXPath
    url:
      - vod.newsensations.com/dvds
    scraper: movieScraper
sceneByURL:
  - action: scrapeXPath
    url:
      - vod.newsensations.com/scenes
    scraper: sceneScraper
performerByURL:
  - action: scrapeXPath
    url:
      - vod.newsensations.com/models
    scraper: performerScraper

xPathScrapers:
  sceneScraper:
    scene:
      Title: //div[@class="title_bar"]/span
      Date:
        # Only the first "cell update_date" div is used.
        selector: //div[@class="cell update_date"][1]
        postProcess:
          # Go reference layout: month/day/four-digit year.
          - parseDate: 01/02/2006
      Details: //span[@class="update_description"]
      Performers:
        Name: //div[@class="gallery_info"]/span[@class="update_models"]/a/text()
      Tags:
        Name: //div[@class="gallery_info"]/span[@class="update_tags"]/a/text()
      Image:
        selector: //meta[@property="og:image"]/@content
        postProcess:
          # Swap the "-2x" marker in the og:image URL for "-4x"
          # (presumably a larger rendition of the same image - confirm).
          - replace:
              - regex: "-2x"
                with: "-4x"
      Studio:
        Name:
          fixed: NewSensations
      # NOTE(review): nesting was reconstructed from a flattened paste; this URL
      # is placed on the scene, not under Studio - confirm against the original.
      URL: //div[contains(@id,"packageinfo")][1]/@data-redirect
  movieScraper:
    group:
      Name: /html/head/title
      Date:
        selector: //div[@class="cell dvd_info"]/span[@class="update_date"]/text()
        postProcess:
          # Go reference layout: month/day/four-digit year.
          - parseDate: 01/02/2006
      Studio:
        Name: //div[@class="dvd_details_overview"]/span[@class="update_date"]/a/text()
      Synopsis:
        selector: //div[@class="dvd_description dvd_info"]/text()
      URL: //div[@class="cell_top cell_thumb"]/a/@href
      FrontImage: //div[@class="cell_top cell_thumb"]/a/img/@src0_3x
      Director:
        selector: //div[@class="dvd_extra_fields"]/div[contains(text(), "Director")]/text()
        postProcess:
          # Strip the label together with the whitespace that follows it, so the
          # remaining name does not start with a stray space.
          - replace:
              - regex: 'Director:\s*'
                with: ""
      Tags:
        Name: //div[@class="update_tags dvd_info"]/a/text()
  performerScraper:
    performer:
      Name: //span[@class="title_bar_hilite"]/text()
      # Measurements is currently disabled. The regex is quoted because an
      # unquoted ": " inside a plain scalar is not valid YAML.
      # Measurements:
      #   selector: //div[@class="model_bio"]/text()[12]
      #   postProcess:
      #     - replace:
      #         - regex: 'Measurements: \s+'
      #           with: ""
      Height:
        # Positional selector: the 11th text node of the model_bio div.
        selector: //div[@class="model_bio"]/text()[11]
        postProcess:
          # Keep only the three-digit centimetre value. The pattern is anchored
          # and consumes everything before and after the number, so no leading
          # label or trailing characters survive the replacement.
          - replace:
              - regex: '^.*?(\d{3})\s*cm.*$'
                with: "$1"
      # Birthdate is currently disabled.
      # Birthdate:
      #   selector: //div[@class="model_bio"]/text()[13]
      #   postProcess:
      #     - replace:
      #         - regex: \s{2,}
      #           with: ""
      #         - regex: Birthday:\xc2\xa0
      #           with: ""
      #     - parseDate: January 2, 2006
# Last Updated December 6, 2025