78 lines
2.8 KiB
YAML
78 lines
2.8 KiB
YAML
name: TitanMen

# Scene pages: URLs matching titanmen.com are scraped with the XPath
# scraper named `sceneScraper` (defined under `xPathScrapers`).
sceneByURL:
  - action: scrapeXPath
    url:
      - titanmen.com
    scraper: sceneScraper
|
|
# Movie pages: URLs matching titanmen.com are scraped with the XPath
# scraper named `movieScraper` (defined under `xPathScrapers`).
movieByURL:
  - action: scrapeXPath
    url:
      - titanmen.com
    scraper: movieScraper
|
|
xPathScrapers:
  # Field selectors for a single scene page.
  sceneScraper:
    common:
      # Shared prefix: the scene detail container. `$details` is substituted
      # into the selectors below wherever it appears.
      $details: //div[contains(@class, "scene-page-detail")]
    scene:
      Title: //h1[@class="scene-header-title"]
      Details:
        # Text nodes of the paragraphs in the first matching column, joined
        # with a blank line between them.
        selector: //div[@class="col span_6_of_12"][1]/p/text()
        concat: "\n\n"
      Director: $details//strong[starts-with(text(), "Director")]/following-sibling::a
      Code: //div[@class="rating_box"]/@data-id
      Date:
        selector: $details//strong[starts-with(text(), "Released")]/following-sibling::text()
        postProcess:
          # Presumably a Go-style reference layout, i.e. dates such as
          # "Mar 5, 2021" - confirm against the live page.
          - parseDate: Jan 2, 2006
      Studio:
        Name:
          # The studio is not read from the scene page itself: take the
          # "Movie Title" link, prefix it with the site root, then read the
          # "Studio" link from that movie page via the subScraper selector.
          selector: $details//strong[starts-with(text(), "Movie Title")]/following-sibling::a/@href
          postProcess:
            - replace:
                # NOTE(review): `^` prepends the site root to every href; if
                # the hrefs already begin with "/", the result contains "//".
                # Verify against the page markup.
                - regex: ^
                  with: https://www.titanmen.com/
            - subScraper: //div[contains(@class, "movie-page-detail")]//strong[starts-with(text(), "Studio")]/following-sibling::a
            - map:
                # Rename the scraped value "Rough" to "TitanMen Rough".
                Rough: TitanMen Rough
      Performers:
        Name: $details//strong[starts-with(text(), "Starring")]/following-sibling::a/text()
        URL:
          selector: $details//strong[starts-with(text(), "Starring")]/following-sibling::a/@href
          postProcess:
            - replace:
                # Same site-root prefixing as for the studio link above.
                - regex: ^
                  with: https://www.titanmen.com/
      Movies:
        Name: $details//strong[starts-with(text(), "Movie")]/following-sibling::a
        URL:
          selector: $details//strong[starts-with(text(), "Movie")]/following-sibling::a/@href
          postProcess:
            - replace:
                # Same site-root prefixing as for the studio link above.
                - regex: ^
                  with: https://www.titanmen.com/
      Tags:
        Name: $details//strong[starts-with(text(), "Categories")]/following-sibling::a
      Image:
        # Select the <script> whose text mentions "scene-image-<data-id>"
        # (data-id taken from the rating box), then keep only the quoted
        # value that follows `image:`.
        selector: //script[contains(text(), concat("scene-image-", //div[@class="rating_box"]/@data-id))]/text()
        postProcess:
          - replace:
              - regex: .*image:\s*"([^"]+).*
                with: $1
  # Field selectors for a single movie page.
  movieScraper:
    movie:
      Name:
        selector: //div[@class="col span_9_of_12"]/h1/text()
      Synopsis:
        # Text nodes of the first paragraph, joined with a blank line.
        selector: //div[@class="col span_9_of_12"]/p[1]/text()
        concat: "\n\n"
      Date:
        # NOTE(review): positional - relies on the release date being the
        # third <p> of the column; confirm against the page markup.
        selector: //div[@class="col span_9_of_12"]/p[3]/text()
        postProcess:
          - parseDate: Jan 2, 2006
      Studio:
        Name: //div[contains(@class, "movie-page-detail")]//strong[starts-with(text(), "Studio")]/following-sibling::a
      Director: //div[contains(@class, "movie-page-detail")]//strong[starts-with(text(), "Director")]/following-sibling::a
      FrontImage: //div[contains(@class, "box-cover")]//img/@src
|
|
# Last Updated January 07, 2024
|
|
|