This commit is contained in:
Christoph Califice
2025-10-09 20:05:31 -03:00
parent ed22ef22bc
commit 0a5f88d75a
1442 changed files with 101562 additions and 0 deletions

View File

@@ -0,0 +1,161 @@
name: JavDB
sceneByFragment:
action: scrapeXPath
queryURL: https://javdb.com/search?q={filename}&f=all
queryURLReplace:
filename:
- regex: \..+$
with: ""
scraper: sceneQueryScraper
sceneByURL:
- action: scrapeXPath
url:
- javdb.com/v/
- javdb36.com/v/
scraper: sceneScraper
queryURL: "{url}"
queryURLReplace:
url:
- regex: javdb\.com
with: "javdb.com"
sceneByName:
action: scrapeXPath
queryURL: https://javdb.com/search?q={}
scraper: sceneSearch
sceneByQueryFragment:
action: scrapeXPath
queryURL: "{url}"
scraper: sceneScraper
movieByURL:
- action: scrapeXPath
url:
- javdb.com/v/
- javdb36.com/v/
scraper: movieScraper
queryURL: "{url}"
queryURLReplace:
url:
- regex: javdb\.com
with: "javdb.com"
xPathScrapers:
sceneSearch:
common:
$videoItem: //div[starts-with(@class, 'movie-list')]/div[@class="item"]
scene:
Title: $videoItem/a/div[@class="video-title"]
URL:
selector: $videoItem/a[@class="box"]/@href
postProcess:
- replace:
- regex: ^
with: "https://javdb.com"
Image:
selector: $videoItem//img/@src
postProcess:
- replace:
- regex: (http:|https:)
with:
- regex: ^
with: "https:"
sceneQueryScraper:
common:
$videoItem: //div[starts-with(@class, 'movie-list')]/div[@class="item"]
scene:
Title: $videoItem/a/div[@class="video-title"]/text()
URL:
selector: $videoItem/a[@class="box"]/@href
postProcess:
- replace:
- regex: ^
with: "https://javdb.com"
# If you don't support cookie you can use this regex.
# - regex: $
# with: "?locale=en"
sceneScraper:
scene:
Title:
selector: //strong[text()='ID:']/../span
concat: "|"
postProcess:
- replace:
- regex: \|
with: ""
Date: //strong[text()='Released Date:']/../span/text()
Details:
selector: //strong[@class="current-title"]/text()
Director: //strong[text()='Director:']/../span/a/text()
Tags:
Name: //strong[text()='Tags:']/../span/a/text()
Performers:
Name: //strong[text()='Actor(s):']/../span/a/text()
Studio:
Name:
selector: //strong[text()='Maker:']/../span/a/text()|//strong[text()='Publisher:']/../span/a/text()
Image: //img[@class="video-cover"]/@src
URL: //link[@rel="canonical"]/@href
movieScraper:
movie:
Name:
selector: //strong[text()='ID:']/../span
concat: "|"
postProcess:
- replace:
- regex: \|
with: ""
Director: //strong[text()='Director:']/../span/a/text()
Duration:
selector: //strong[text()='Duration:']/../span/text()
postProcess:
- replace:
- regex: \D
with: ""
Date: //strong[text()='Released Date:']/../span/text()
Synopsis:
selector: //h2[@class="title is-4"]/strong/text()
postProcess:
- replace:
- regex: (.*?\s)(.+)
with: $2
Studio:
Name:
selector: //strong[text()='Maker:']/../span/a/text()|//strong[text()='Publisher:']/../span/a/text()
FrontImage:
selector: //img[@class="video-cover"]/@src
URL: //link[@rel="canonical"]/@href
driver:
cookies:
- CookieURL: "https://javdb.com"
Cookies:
- Name: "locale"
Domain: "javdb.com"
Value: "en"
Path: "/"
# Access to certain titles requires a javdb account
# Uncomment the below replacing the Value part
#- Name: "_jdb_session"
# Value: "Add here the actual value from your cookies"
# Path: "/"
# Domain: "javdb.com"
#- Name: "remember_me_token"
# Value: "Add here the actual value from your cookies"
# Path: "/"
# Domain: "javdb.com"
- CookieURL: "https://javdb36.com"
Cookies:
- Name: "locale"
Domain: "javdb36.com"
Value: "en"
Path: "/"
# Access to certain titles requires a javdb account
# Uncomment the below replacing the Value part
#- Name: "_jdb_session"
# Value: "Add here the actual value from your cookies"
# Path: "/"
# Domain: "javdb36.com"
#- Name: "remember_me_token"
# Value: "Add here the actual value from your cookies"
# Path: "/"
# Domain: "javdb36.com"
# Last Updated January 21, 2024