This commit is contained in:
Christoph Califice
2025-10-09 20:05:31 -03:00
parent ed22ef22bc
commit 0a5f88d75a
1442 changed files with 101562 additions and 0 deletions

View File

@@ -0,0 +1,134 @@
name: Raunchy Bastards
sceneByURL:
- action: scrapeXPath
url:
- boundjocks.com/scene/
- boyshalfwayhouse.com/scene/
- coltstudiogroup.com/scene/
- daddycarl.com/scene/
- hotoldermale.com/scene/
- monstercub.com/scene/
- naturalbornbreeders.com/scene/
- older4me.com/scene/
- raunchybastards.com/scene/
- stockydudes.com/scene/
- toplatindaddies.com/scene/
scraper: oldStyleSite
- action: scrapeXPath
url:
- blackboyaddictionz.com/scene/
- blacksondaddies.com/scene/
- myfirstdaddy.com/scene/
- playdaddy.com/scene/
scraper: newStyleSite
xPathScrapers:
oldStyleSite:
common:
$scene: //div[contains(@class, "sceneContainer")]
scene:
Title: $scene/div[@class="sceneTitle"]
Code:
selector: $scene//div[contains(@class, "sceneImgBig")]/@id
postProcess:
- replace:
- regex: \D*
with: $1
Date:
selector: $scene//span[contains(@class, "sceneDetails")]
postProcess: &ppDate
- replace:
# https://regex101.com/r/rsjbb6/3
- regex: ^(?:Details:\s*)?(\w{3}\s*\d{1,2}),\s*(\d{4}).*?$
with: $1, $2
- parseDate: Jan 2, 2006
# All of this can be replaced once scrapers get access to the URL they are scraping
Studio:
Name:
selector: &image >
$scene//video/@poster
| $scene//div[contains(@class, "sceneImgBig")]/img/@src
| //div[contains(@style, "background-image")]/@style
| //*[contains(@class, "videoTrailer") or contains(@class, "bgScene")]//@srcset
postProcess: &studioNameFromURL
- replace:
- regex: ^(?:https:\/\/[\w\.]*?)([^.]+)\.com.*$
with: $1
- map:
blackboyaddictionz: Black Boy Addictionz
blacksondaddies: Blacks on Daddies
boundjocks: Bound Jocks
boyshalfwayhouse: Boys Halfway House
coltstudiogroup: Colt Studio Group
daddycarl: Daddy Carl
hotoldermale: Hot Older Male
monstercub: Monster Cub
myfirstdaddy: My First Daddy
naturalbornbreeders: Natural Born Breeders
older4me: Older4Me
playdaddy: Play Daddy
raunchybastards: Raunchy Bastards
stockydudees: Stocky dudes
toplatindaddies: Top Latin Daddies
URL:
selector: *image
postProcess:
- replace:
- regex: ^(?:https:\/\/[\w\.]*?)([^.]+)\.com.*$
with: https://$1.com
Performers:
Name: >
$scene//div[contains(@class, "scenePerformers")]/a
| $scene//div[@class="scenePerf"]/span[@class="perfName"]
URL: >
$scene//div[contains(@class, "scenePerformers")]/a/@href
| $scene//div[@class="scenePerf"]/@data-href
Tags:
Name: $scene//a[@class="sceneTagsLnk"]/text()
Details:
selector: $scene//div[contains(@class, "sceneDescription")]/text()
concat: "\n\n"
Image:
selector: *image
postProcess:
- replace:
- regex: .*url\("(.*)"\).*
with: $1
- regex: \s*2x$
with:
newStyleSite:
common:
$details: //div[contains(@class, "container_styled_1")]
scene:
Title: //h2[@class="main_title"]
Code:
selector: //link[@rel="canonical"]/@href
postProcess:
- replace:
- regex: \D*
with: $1
# All of this can be replaced once scrapers get access to the URL they are scraping
Studio:
Name:
selector: //link[@rel="canonical"]/@href
postProcess: *studioNameFromURL
URL:
selector: //link[@rel="canonical"]/@href
postProcess:
- replace:
- regex: ^(?:https:\/\/[\w\.]*?)([^.]+)\.com.*$
with: https://$1.com
Performers:
Name: $details//span[contains(@class, "perfImage")]/a
URL: $details//span[contains(@class, "perfImage")]/a/@href
Details:
selector: $details//p/text()
concat: "\n\n"
Date:
selector: ($details//h5[contains(text(), "Details")]/text())[1]
postProcess: *ppDate
Image:
selector: //meta[@property="og:image"]/@content
Tags:
Name: $details//h5[contains(., "Categories")]/a/text()
# Last Updated September 22, 2023

View File

@@ -0,0 +1,9 @@
id: AdultSiteRunner
name: Raunchy Bastards
metadata: {}
version: 0b5e6be
date: "2023-09-22 04:12:45"
requires: []
source_repository: https://stashapp.github.io/CommunityScrapers/stable/index.yml
files:
- AdultSiteRunner.yml