68 lines
2.0 KiB
YAML
68 lines
2.0 KiB
YAML
name: DartTechStudios
|
|
sceneByURL:
|
|
- action: scrapeXPath
|
|
url:
|
|
- darttechstudios.com/Media.php
|
|
scraper: sceneScraper
|
|
|
|
sceneByFragment:
|
|
action: scrapeXPath
|
|
queryURL: https://www.darttechstudios.com/Media.php?ID={filename}
|
|
queryURLReplace:
|
|
filename:
|
|
# the filename of the file downloaded from the site is the ID with an mp4 extension
|
|
- regex: (.*).mp4 # support filenames in the form 12345_performer_other_data.mp4
|
|
with: $1
|
|
scraper: sceneScraper
|
|
|
|
xPathScrapers:
|
|
sceneScraper:
|
|
scene:
|
|
Title:
|
|
selector: &titledateSelector //font[@size="+1"]/b/text()
|
|
postProcess:
|
|
- replace:
|
|
- regex: ([^-]+).*
|
|
with: $1
|
|
Date:
|
|
selector: *titledateSelector
|
|
postProcess:
|
|
- replace:
|
|
- regex: .*([0-9]{2}/[0-9]{2}/[0-9]{4})
|
|
with: $1
|
|
- parseDate: 01/02/2006
|
|
Performers:
|
|
Name: //div[@class="item2"]/a[contains(@href, '/Videos.php?Model=')]
|
|
Tags:
|
|
Name: //div[@class="item2"]/a[contains(@href, '/Videos.php?Fetish=')]
|
|
Details:
|
|
selector: //div[@class="item2"]/text()
|
|
concat: "\n\n"
|
|
postProcess:
|
|
- replace:
|
|
- regex: "\n\n,"
|
|
with: ""
|
|
Image:
|
|
#selector: //div[@class="galleryEntry_UpdatePage"][1]//img/@src
|
|
selector: &imgSelector //img[@alt="Main Image"]/@src
|
|
postProcess:
|
|
- replace:
|
|
- regex: (.*)
|
|
with: https://www.darttechstudios.com$1
|
|
Code:
|
|
selector: *imgSelector
|
|
postProcess:
|
|
- replace:
|
|
- regex: &codeRegex /Content/[0-9]{4}_(.*)/Main.jpg
|
|
with: $1
|
|
URL:
|
|
selector: *imgSelector
|
|
postProcess:
|
|
- replace:
|
|
- regex: *codeRegex
|
|
with: https://www.darttechstudios.com/Media.php?ID=$1
|
|
Studio:
|
|
Name:
|
|
fixed: Dart_Tech Studios
|
|
# Last Updated October 08, 2023
|