stash
This commit is contained in:
@@ -0,0 +1,66 @@
|
||||
# XPath-based scraper definition for woodmancastingx.com.
# Three entry points are declared; two of them load a scene page and hand it
# to `sceneScraper`, the third runs a site search and hands the result list
# to `sceneSearch`.
name: Woodman Casting X

# Scrape a scene directly from a page URL containing the listed host.
sceneByURL:
  - action: scrapeXPath
    url:
      - woodmancastingx.com
    scraper: sceneScraper

# Free-text search: `{}` in queryURL is the placeholder for the search term.
sceneByName:
  action: scrapeXPath
  queryURL: 'https://www.woodmancastingx.com/search?query={}'
  scraper: sceneSearch

# Re-scrape from a fragment: the fragment's own URL is used as the page to load.
sceneByQueryFragment:
  action: scrapeXPath
  queryURL: '{url}'
  scraper: sceneScraper

xPathScrapers:
  # Field extraction for a single scene page.
  sceneScraper:
    scene:
      Title: '//h1'
      Details: '//p[@class="description"]'
      Date:
        # Text of the paragraph whose <span> reads "Published".
        selector: '//p[span="Published"]/text()'
        postProcess:
          # Drop everything up to and including the last ": " so only the
          # date itself remains, then parse it with the layout below.
          - replace:
              - regex: '^.*: '
                with: ''
          - parseDate: 2006-01-02
      Performers:
        Name: '//a[@class="girl_item"]/span[@class="name"]'
        URL:
          selector: '//a[@class="girl_item"]/@href'
          # Anchored as `pp` and reused below via `*pp`: turns a link that
          # starts with "/" into an absolute URL on the site.
          postProcess: &pp
            - replace:
                - regex: '^/'
                  with: 'https://www.woodmancastingx.com/'
      Studio:
        Name:
          selector: '//div[@id="breadcrumb"]'
          postProcess:
            # The section named after the first ">" of the breadcrumb text
            # decides which studio name replaces the whole string.
            - replace:
                - regex: '^[^>]*> (Casting|Sthuf).*$'
                  with: 'Woodman Casting X'
                - regex: '^[^>]*> (Scenes|Backstage|Live).*$'
                  with: 'Pierre Woodman'
      Tags:
        Name: '//a[@class="tag"]'
      Image:
        # Taken from a <script> whose text contains 'image': the regex keeps
        # only the double-quoted value that follows `image:`.
        selector: "//script[contains(.,'image')]"
        postProcess:
          - replace:
              - regex: '^.*image:\s+"([^"]+)".*$'
                with: '$1'
      URL:
        selector: '//meta[@property="og:url"]/@content'
        postProcess: *pp

  # Field extraction for the search results page.
  sceneSearch:
    common:
      # Shared prefix: each scene link inside the results container.
      $res: '//div[contains(@class,("items container"))]/a[@class="item scene"]'
    scene:
      Title: '$res/img/@alt'
      Image: '$res/img/@src'
      URL:
        selector: '$res/@href'
        postProcess: *pp
# Last Updated May 30, 2023
|
||||
Reference in New Issue
Block a user