82 lines
2.5 KiB
YAML
82 lines
2.5 KiB
YAML
# Display name of this scraper.
name: "Combat Zone"

# Scene pages: any URL containing one of the fragments below is scraped
# with the XPath rules defined under xPathScrapers.sceneScraper.
sceneByURL:
  - scraper: sceneScraper
    action: scrapeXPath
    url:
      - "tour.blackmarketxxx.com/trailers/"
      - "tour.combatzonexxx.com/trailers/"
      - "tour.fillyfilms.com/trailers/"
      - "tour.smashpictures.com/trailers/"
|
|
|
|
# Movie pages: URLs containing the fragment below are scraped with the
# XPath rules defined under xPathScrapers.movieScraper.
movieByURL:
  - scraper: movieScraper
    action: scrapeXPath
    url:
      - "combatzone.us/distributor/"
|
|
|
|
xPathScrapers:
  # Rules for the scene pages matched by sceneByURL.
  sceneScraper:
    scene:
      Title: '//div[contains(@class, "title")]/h2'
      Date:
        # The selected text node carries an "Added:" label in front of the
        # date; strip the label, then parse the remainder.
        selector: '//div[@class="info"]/p/text()[contains(., "Added:")]'
        postProcess:
          - replace:
              - regex: '^Added:\s+'
                with: ""
          - parseDate: January 2, 2006
      Details: '//div[@class="description"]/p'
      Tags:
        Name: '//ul[@class="tags"]//a'
      Performers:
        Name: '//div[@class="info"]//a[contains(@href, "/models/")]'
      Image:
        # The regex "^" matches the empty string at the start of the value,
        # so the host below is prepended to whatever @src contains.
        # NOTE(review): presumably @src is always a site-relative path - confirm.
        selector: '//div[@id="fakeplayer"]//img/@src'
        postProcess:
          - replace:
              - regex: '^'
                with: https://tour.combatzonexxx.com
      Studio:
        Name:
          # Search for the scene by its title in order to get the correct
          # studio: the title is turned into a search URL, the search result
          # page is scraped for the site badge, and the badge abbreviation is
          # mapped to the full studio name.
          selector: '//div[contains(@class, "title")]/h2'
          postProcess:
            - replace:
                # Percent-encode characters that would otherwise change the
                # structure of the query string ("#" would turn the rest of
                # the URL, including the cat[] filter, into a fragment; "&"
                # would end the qall value; a literal "+" would read as a
                # space). "%" is handled first so that the escapes inserted
                # by the following rules are not escaped a second time.
                - regex: '%'
                  with: '%25'
                - regex: '&'
                  with: '%26'
                - regex: '#'
                  with: '%23'
                - regex: '\+'
                  with: '%2B'
                # Each whitespace character becomes "+" in the query value.
                - regex: '\s'
                  with: '+'
                # Wrap the encoded title in the advanced-search URL.
                - regex: '^(.+)$'
                  with: 'https://tour.combatzonexxx.com/search.php?st=advanced&qall=$1&cat[]=5'
            - subScraper: '//i[@class="site_badge"]/text()'
            # Badge abbreviation -> studio name.
            - map:
                BM: Black Market XXX
                CZ: Combat Zone XXX
                FF: Filly Films
                SP: Smash Pictures

  # Rules for the movie pages matched by movieByURL.
  movieScraper:
    movie:
      Name: //h1
      Date:
        selector: '//p[span[contains(text(), "Release Date:")]]/text()[2]'
        postProcess:
          - parseDate: January 2, 2006
      Synopsis: '//p[span[contains(text(), "Synopsis:")]]/text()[2]'
      Director: '//p[span[contains(text(), "Director:")]]/text()[2]'
      FrontImage:
        selector: '//img[starts-with(@src, "/distributor/cvr/") and contains(@alt, "front cover")]/@src'
        # Rewrites "/<path>-sf.jpg" or "/<path>-sb.jpg" to an absolute URL on
        # www.combatzone.us with "-s" replaced by "-l".
        # NOTE(review): presumably small -> large cover variant - confirm.
        # Anchored so BackImage can reuse the identical rule.
        postProcess: &coverToLarge
          - replace:
              - regex: '^/(.+)-s([fb]\.jpg)$'
                with: 'https://www.combatzone.us/$1-l$2'
      BackImage:
        selector: '//img[starts-with(@src, "/distributor/cvr/") and contains(@alt, "back cover")]/@src'
        postProcess: *coverToLarge
      Studio:
        Name: '//p[span[contains(text(), "Studio:")]]/text()[2]'
|
|
|
|
# Last Updated November 17, 2020
|