# File: compose-projects-arr/stash/config/scrapers/community/Spizoo/Spizoo.yml
# Last change: Christoph Califice, 0a5f88d75a ("stash"), 2025-10-10 09:50:30 -03:00
# 82 lines, 2.8 KiB, YAML

# Name of this scraper definition.
name: Spizoo
# Scrape a scene from its page URL. One entry: every URL pattern listed
# under `url` is handled by the `sceneScraper` XPath definition found
# under `xPathScrapers`.
sceneByURL:
  - action: scrapeXPath
    # Site URL patterns covered by this scraper (all use the /updates/ path).
    url:
      - creamher.com/updates/
      - drdaddypov.com/updates/
      - firstclasspov.com/updates/
      - mrluckypov.com/updates/
      - mrluckyraw.com/updates/
      - mrluckyvip.com/updates/
      - rawattack.com/updates/
      - realsensual.com/updates/
      - spizoo.com/updates/
      - vlogxxx.com/updates/
    scraper: sceneScraper
# Search for scenes by name: the spizoo.com search page is fetched and its
# results are parsed with the `sceneSearch` XPath definition.
# NOTE(review): `{}` is presumably the placeholder for the search text -
# confirm against the Stash scraper documentation.
sceneByName:
  action: scrapeXPath
  queryURL: "https://www.spizoo.com/search.php?query={}"
  scraper: sceneSearch
# Scrape a scene from a query fragment: the fragment's `url` field is used
# as the page to fetch, and that page is parsed with `sceneScraper`.
sceneByQueryFragment:
  action: scrapeXPath
  queryURL: "{url}"
  scraper: sceneScraper
# XPath scraper definitions referenced by the `scraper:` keys above.
xPathScrapers:
  # Parses the search-results page requested by sceneByName.
  sceneSearch:
    common:
      # One result entry on the search page.
      $row: //div[@class="model-update row"]
    scene:
      Title: $row//h3
      # The link is taken from the parent element of the <h3> title.
      URL: $row//h3/../@href
      Image: $row//img/@src
      Details: $row//p[contains(@class, "model-update-description")]

  # Parses a single scene page (used by sceneByURL and sceneByQueryFragment).
  sceneScraper:
    common:
      # The sites use different ids / classes for the same page sections, so
      # each shared selector is a union of the known variants.
      $scene_info: //section[@id="trailer-data" or @id="sceneInfo" or @id="scene-info" or @id="des-scene"]
      $video_section: (//section[@id="trailer-video" or @id="scene" or @id="scene-video"] | //div[contains(@class, "videoHolder")])
    scene:
      Title:
        selector: //div[@class="title" or @class="row"]//h1 | //h2[contains(@class, "titular")] | //title
        postProcess:
          # RawAttack titles have a trailing dash and space; strip it.
          - replace:
              - regex: \s\-\s*$
                with: ""
      Date:
        selector: $scene_info//p[@class="date"]
        postProcess:
          # Layout string quoted so no YAML parser can type it as a date.
          - parseDate: "2006-01-02"
      Details: $scene_info//p
      Performers:
        Name: $scene_info//a[contains(@href,"/model")]/@title
      Tags:
        Name: $scene_info//a[contains(@href,"/categories")] | //div[contains(@class, "categories-holder")]/a
      Studio:
        Name:
          # Scenes on Spizoo can have an <i id="site"> element with the studio
          # name, others we get from the base URL.
          selector: //i[@id="site"]/@value | //base/@href
          postProcess:
            # Reduce a URL to the part between the optional "www." and ".com".
            - replace:
                - regex: https?://(?:www\.)?(.*)(?:\.com)(?:/.*)?
                  with: $1
            # Translate that domain key into the studio's display name.
            - map:
                creamher: Cream Her
                drdaddypov: Dr. Daddy POV
                firstclasspov: First Class POV
                mrluckypov: Mr. LuckyPOV
                mrluckyraw: Mr. LuckyRaw
                mrluckyvip: Mr. LuckyVIP
                rawattack: RawAttack
                realsensual: Real Sensual
                spizoo: Spizoo
                vlogxxx: Vlog XXX
      Image:
        selector: $video_section//video/@poster | //img[contains(@class, "update_thumb") or contains(@class, "trailer-thumb")]/@src
        postProcess:
          - replace:
              # Remove any resizing parameters (imgq / imgw / imgh) for the
              # image, we want the original.
              - regex: "[?&]img(?:q|w|h)=[^&]+"
                with: ""
# Last Updated February 26, 2024