97 lines
2.7 KiB
YAML
Executable File
97 lines
2.7 KiB
YAML
Executable File
name: TheMovieDB
|
|
|
|
movieByURL:
|
|
- action: scrapeXPath
|
|
url:
|
|
- themoviedb.org
|
|
scraper: movieScraper
|
|
sceneByURL:
|
|
- action: scrapeXPath
|
|
url:
|
|
- themoviedb.org
|
|
scraper: sceneScraper
|
|
|
|
xPathScrapers:
|
|
movieScraper:
|
|
movie:
|
|
Name: (//h2/a)[1]
|
|
Director: //div[@class='header_info']/ol[@class='people no_image']/li[@class='profile']/p[1]/a
|
|
Duration:
|
|
selector: //span[@class='runtime']
|
|
postProcess:
|
|
- replace:
|
|
- regex: "h "
|
|
with: ":"
|
|
- regex: "m"
|
|
with: ":00"
|
|
Date:
|
|
selector: //span[@class='release']
|
|
postProcess:
|
|
- replace:
|
|
- regex: \(.*$
|
|
with:
|
|
- parseDate: 01/02/2006
|
|
Synopsis: //div[@class='header_info']/div[@class='overview']/p
|
|
URL: //meta[@name='og:url']/@content
|
|
FrontImage:
|
|
selector: (//img[@class='poster']/@src)[1]
|
|
postProcess:
|
|
- replace:
|
|
- regex: w300
|
|
with: w600
|
|
- replace:
|
|
- regex: h450
|
|
with: h900
|
|
sceneScraper:
|
|
scene:
|
|
Title: (//h2/a)[1]
|
|
Details: //div[@class='header_info']/div[@class='overview']/p
|
|
Director: //div[@class='header_info']/ol[@class='people no_image']/li[@class='profile']/p[1]/a
|
|
Date:
|
|
selector: //span[@class='release']
|
|
postProcess:
|
|
- replace:
|
|
- regex: \(.*$
|
|
with:
|
|
- parseDate: 01/02/2006
|
|
Studio:
|
|
Name: //a[@label="Studio"]/text()
|
|
Movies:
|
|
Name: (//h2/a)[1]
|
|
URL: //link[@rel="canonical"]/@href
|
|
Director: //div[@class='header_info']/ol[@class='people no_image']/li[@class='profile']/p[1]/a
|
|
Duration:
|
|
selector: //small[contains(text(), "Length")]/following-sibling::text()
|
|
postProcess:
|
|
- replace:
|
|
- regex: " hrs. "
|
|
with: ":"
|
|
- regex: " mins."
|
|
with: ":00"
|
|
Date:
|
|
selector: //span[@class='release']
|
|
postProcess:
|
|
- replace:
|
|
- regex: \(.*$
|
|
with:
|
|
- parseDate: 01/02/2006
|
|
Synopsis: //div[@class='header_info']/div[@class='overview']/p
|
|
FrontImage:
|
|
selector: (//img[@class='poster']/@src)[1]
|
|
postProcess:
|
|
- replace:
|
|
- regex: w300
|
|
with: w600
|
|
- replace:
|
|
- regex: h450
|
|
with: h900
|
|
Performers:
|
|
Name: //ol[@class='people scroller']/li[@class='card']/p[1]
|
|
URL: //meta[@name='og:url']/@content
|
|
|
|
driver:
|
|
headers:
|
|
- Key: "User-Agent"
|
|
Value: stash-scraper/1.0.0
|
|
# Last Updated March 11, 2024
|