# Scraper definition. `name` is the label of this configuration; the
# remaining top-level keys map URL patterns to the XPath scrapers defined
# under `xPathScrapers`.
name: AdultEmpireCash
# Sites ("Brands") from https://www.adultempirecash.com
# Scene lookups by URL. Each list entry names an action, the scraper (a key
# under `xPathScrapers`) that handles it, and the URL patterns it applies to.
sceneByURL:
  # Regular (non-VR) brand sites, all handled by `sceneScraper`.
  - action: scrapeXPath
    scraper: sceneScraper
    url:
      - blackmassivecocks.com/
      - braziliantransgirls.com/
      - bruthasinc.com/
      - concoxxxion.com/
      - elegantangel.com/
      - forbiddenfruitsfilms.com/
      - hornyhousehold.com/
      - hotwifefun.com/
      - hotwivescheating.com/
      - jayspov.net/
      - jodiwest.com/
      - kingsoffetish.com/
      - latinoguysporn.com/
      - lethalhardcore.com/
      - pornstarstroker.com/  # aggregator site?
      - reaganfoxx.com/
      - severesexfilms.com/
      - smutfactor.com/
      - spankmonster.com/
      - stephousexxx.com/
      - thirdworldxxx.com/
      - transationalfantasies.com/
      - wcpclub.com/
      - westcoastproductions.com/
      - data18.empirestores.co/

  # VR Sites
  # These use a separate scraper (`vrSceneScraper`) with its own selectors.
  - action: scrapeXPath
    scraper: vrSceneScraper
    url:
      - lethalhardcorevr.com/
      - whorecraftvr.com/

# Movie lookups by URL, all handled by `movieScraper` (a key under
# `xPathScrapers`). Commented-out hosts are candidates left disabled by the
# original author because they appear to publish scenes as movies.
movieByURL:
  - action: scrapeXPath
    scraper: movieScraper
    url:
      - braziliantransgirls.com/
      # - bangmytransass.com/ # Scenes published as movies?
      # - blacktranswhackers.com/ # Scenes published as movies?
      - concoxxxion.com/
      - elegantangel.com/
      - filthykings.com/
      - forbiddenfruitsfilms.com/
      - lethalhardcore.com/
      - severesexfilms.com/
      # - shemalestrokers.com/ # Scenes published as movies?
      - thirdworldxxx.com/
      - transationalfantasies.com/
      - wcpclub.com/
      - westcoastproductions.com/
      - data18.empirestores.co/

# XPath scraper definitions referenced by the `scraper:` values in
# `sceneByURL` / `movieByURL`. Each field is either a bare XPath selector or
# a mapping with `selector` plus optional `concat` / `postProcess` steps.
xPathScrapers:
  # Scenes on the regular brand sites.
  sceneScraper:
    scene:
      Title: //h1[@class="description"]/text()
      Date:
        # First "release-date" div holds the date text.
        selector: //div[@class="release-date"][1]/text()
        postProcess:
          # Layout string for dates shaped like "Mar 19, 2024"
          # (presumably a Go reference-time layout; confirm with the consumer).
          - parseDate: Jan 02, 2006
      Details:
        # All text nodes of the synopsis, joined with a blank line between them.
        selector: //div[@class="synopsis"]//text()
        concat: "\n\n"
      Tags:
        # Union of the "tags" and "categories" link texts.
        Name: //div[@class="tags"]/a/text()|//div[@class="categories"]/a/text()
      Performers:
        Name: //div[@class="video-performer"]/a//text()
      Studio:
        Name:
          selector: //div[@class="studio"]/span[contains(text(),"Studio:")]/following-sibling::*
          postProcess:
            # Override studio name only when needed
            - map:
                Jay Rock Clips: Jay's POV
            - replace:
                # 'Jane Doe Clips' => 'Jane Doe'
                - regex: \sClips$
                  # Explicit empty string: drop the matched suffix.
                  with: ""
      Image: //link[@rel="image_src"]/@href
      Movies:
        Name: //h1[@class="description"]/following-sibling::p/a/text()
      Director:
        selector: //div[@class="director"]/text()
        postProcess:
          - replace:
              # Collapse runs of whitespace to a single space ...
              - regex: \s{2,}
                with: " "
              # ... then remove the space left in front of commas.
              - regex: " ,"
                with: ","
      Code:
        selector: //meta[@name="og:url"]/@content
        postProcess:
          - replace:
              # Keep only the leading numeric path segment of the URL.
              - regex: ^https?://[^/]+/(\d+)/.+
                with: $1
              # If the value is still a URL (no numeric segment matched),
              # blank it rather than storing the URL as the code.
              - regex: ^http.*
                with: ""

  # Movies on the regular brand sites.
  movieScraper:
    movie:
      Name: //h1[@class="description"]/text()
      Date:
        selector: //div[@class="release-date"][1]/text()
        postProcess:
          # Same layout as the scene date (e.g. "Mar 19, 2024").
          - parseDate: Jan 02, 2006
      Synopsis:
        selector: //div[@class="synopsis"]//text()
        concat: "\n\n"
      Director: //div[@class="director"]/a/text()
      Duration:
        # Second "release-date" div is used for the running time.
        selector: //div[@class="release-date"][2]/text()
        postProcess:
          - replace:
              # e.g. "1 hrs. 30 mins." -> "1:30 mins." -> "1:30:00"
              - regex: " hrs. "
                with: ":"
              - regex: " mins."
                with: ":00"
      Studio:
        Name:
          selector: //div[@class="studio"]/a
          postProcess:
            - replace:
                # 'Jane Doe Clips' => 'Jane Doe'
                - regex: \sClips$
                  # Explicit empty string: drop the matched suffix.
                  with: ""
      FrontImage: //link[@rel="image_src"]/@href
      BackImage: //div[@class="carousel-item"]/img/@data-src

  # Scenes on the VR sites, which use a different page layout.
  vrSceneScraper:
    common:
      # Shared prefix substituted wherever `$content` appears below.
      $content: //div[@class="item-page-details"]
    scene:
      Title: $content//h1
      Details:
        selector: $content//div[@id="synopsis-full"]
        concat: "\n\n"
      Performers:
        Name:
          selector: $content//span[@class="overlay-inner"]//small
          postProcess:
            - replace:
                # Strip the surrounding parentheses: "(Name)" -> "Name".
                - regex: \((.+)\)
                  with: $1
      Image:
        selector: //link[@rel="image_src"]/@href
        postProcess:
          - replace:
              # Take the digits that precede "h" in the last path segment and
              # build the large product image URL from them.
              - regex: ^.+/(\d+)h.+$
                with: https://imgs1cdn.adultempire.com/product/${1}_lg.jpg
      Studio:
        Name: //meta[@name="og:site_name"]/@content
# Last Updated March 19, 2024