# Stash XPath scraper definition for XXXPawn scene pages.
# Matches scene URLs on either site domain and extracts title, date,
# details, studio, cover image and tags via the XPath selectors below.
name: "XXXPawn"

sceneByURL:
  - action: scrapeXPath
    # URL fragments this scraper is offered for.
    url:
      - xxxpawn.com
      - xxxpawn.xxx
    scraper: sceneScraper

xPathScrapers:
  sceneScraper:
    scene:
      # Title is taken from the <h1>, or from an <h2> inside div#content.
      Title: //h1/text()|//div[@id="content"]//h2/text()

      Date:
        # Start from the page's canonical URL ...
        selector: //link[@rel="canonical"]/@href
        postProcess:
          # ... rewrite it to https://xxxpawn.xxx/<slug>, where <slug> is the
          # first path segment after ".xxx/" or ".com/video<digits>/" ...
          - replace:
              - regex: .+(?:\.xxx|\.com\/video\d+)\/([\w-]+)(?:.+|)
                with: https://xxxpawn.xxx/$1
          # ... then scrape the date text from the rewritten URL's page.
          - subScraper:
              selector: //div[@id="title-single"]/span/text()
              postProcess:
                # Drop the word characters trailing the day number and the
                # comma (e.g. "November 8th, 2020" -> "November 8 2020") so
                # the text matches the parseDate layout below.
                - replace:
                    - regex: (\w+\s)(\d+)\w+,(\s\d{4})
                      with: $1$2$3
                # Go reference-time layout: full month name, day, 4-digit year.
                - parseDate: January 2 2006

      Details:
        # Description text may live in any of these three elements;
        # all matching text nodes are joined with the concat separator.
        selector: //p[@class="videoDetail"]/text()|//p[@class="more"]/text()|//span[@class="morecontent"]/span/text()
        concat: ''

      Studio:
        Name:
          # The selector result itself is discarded: the regex matches the
          # whole canonical URL and replaces it with the constant studio name.
          selector: //link[@rel="canonical"]/@href
          postProcess:
            - replace:
                - regex: .+
                  with: 'XXXPawn'

      Image:
        # Same canonical-URL rewrite as for Date, then read the <video>
        # poster attribute from the rewritten URL's page.
        selector: //link[@rel="canonical"]/@href
        postProcess:
          - replace:
              - regex: .+(?:\.xxx|\.com\/video\d+)\/([\w-]+)(?:.+|)
                with: https://xxxpawn.xxx/$1
          - subScraper:
              selector: //video/@poster

      Tags:
        Name:
          # Keywords meta content is a single string; split it into tags
          # on ", ".
          selector: //meta[@http-equiv="keywords"]/@content
          split: ', '

# Last Updated November 08, 2020