This commit is contained in:
Christoph Califice
2025-10-09 20:05:31 -03:00
parent ed22ef22bc
commit 0a5f88d75a
1442 changed files with 101562 additions and 0 deletions

View File

@@ -0,0 +1,395 @@
name: "Staxus"
sceneByURL:
- action: scrapeXPath
url:
- staxus.com/trial/
scraper: sceneScraper
performerByURL:
- action: scrapeXPath
url:
- staxus.com/trial/
scraper: performerScraper
xPathScrapers:
sceneScraper:
common:
$script: //script[@type="application/ld+json"]
$info: //div[@class="text"]
scene:
Title:
selector: //div[@class="video-descr__title"]//h2
postProcess:
- replace:
- regex: " HD"
with: ""
Date:
selector: $script/text()
postProcess:
- replace:
- regex: .*"(\d{4}-\d{2}-\d{2})".*
with: $1
- parseDate: 2006-01-02
Code:
selector: //script[@type="application/ld+json"]
postProcess:
- replace:
- regex: .+id\=(\d+)".+
with: $1
Director:
selector: //div[@class='video-details'][contains(strong,"Director:")]/text()
Tags:
Name: //p/a[@href[contains(., "category.php")]]/text()
Performers:
Name:
selector: //div[@class="video-descr__model-item"]/p/a/text()
Details:
selector: //div[@class="video-descr__content"]/p/text()
concat: "\n"
Image:
selector: //div[contains(@class, "player-wrapper")]/@style
postProcess:
- replace:
- regex: .*'(.*)'.*
with: https:$1
Studio:
Name:
fixed: Staxus
performerScraper:
performer:
Name: //div[@class="model-header-details"]/h4/text()
Gender:
fixed: Male
Height:
selector: //p[@class="flex-item"]/b[text()="Height:"]/following-sibling::span[1]/text()
postProcess:
- replace:
- regex: "cm.*"
with: ""
- regex: '^.*/(\s)?'
with: ""
Measurements:
selector: //p[@class="flex-item"]/b[text()="Cock size:"]/following-sibling::span[1]/text()
postProcess:
- replace:
- regex: "cm.*"
with: ""
- regex: '^.*/(\s)?'
with: ""
Birthdate:
selector: //p[@class="flex-item"]/b[text()="Date of birth:"]/following-sibling::span[1]/text()
postProcess:
- replace:
- regex: '(\d+)\S+\s+([a-zA-Z]+)\D+(\d+)'
with: "$1 $2 $3"
- parseDate: 2 January 2006
Country:
selector: //p[@class="flex-item"]/b[text()="Ethnicity:"]/following-sibling::span[1]/text()
postProcess:
- map:
# https://en.wikipedia.org/wiki/List_of_adjectival_and_demonymic_forms_for_countries_and_nations
"Abkhaz": "Abkhazia"
"Abkhazian": "Abkhazia"
"Afghan": "Afghanistan"
"Albanian": "Albania"
"Algerian": "Algeria"
"American Samoan": "American Samoa"
"American": "United States of America"
"Andorran": "Andorra"
"Angolan": "Angola"
"Anguillan": "Anguilla"
"Antarctic": "Antarctica"
"Antiguan": "Antigua and Barbuda"
"Argentine": "Argentina"
"Argentinian": "Argentina"
"Armenian": "Armenia"
"Aruban": "Aruba"
"Australian": "Australia"
"Austrian": "Austria"
"Azerbaijani": "Azerbaijan"
"Azeri": "Azerbaijan"
"Bahamian": "Bahamas"
"Bahraini": "Bahrain"
"Bangladeshi": "Bangladesh"
"Barbadian": "Barbados"
"Barbudan": "Antigua and Barbuda"
"Basotho": "Lesotho"
"Belarusian": "Belarus"
"Belgian": "Belgium"
"Belizean": "Belize"
"Beninese": "Benin"
"Beninois": "Benin"
"Bermudan": "Bermuda"
"Bermudian": "Bermuda"
"Bhutanese": "Bhutan"
"BIOT": "British Indian Ocean Territory"
"Bissau-Guinean": "Guinea-Bissau"
"Bolivian": "Bolivia"
"Bonaire": "Bonaire"
"Bonairean": "Bonaire"
"Bosnian": "Bosnia and Herzegovina"
"Botswanan": "Botswana"
"Bouvet Island": "Bouvet Island"
"Brazilian": "Brazil"
"British Virgin Island": "Virgin Islands, British"
"British": "United Kingdom"
"Bruneian": "Brunei"
"Bulgarian": "Bulgaria"
"Burkinabé": "Burkina Faso"
"Burmese": "Burma"
"Burundian": "Burundi"
"Cabo Verdean": "Cabo Verde"
"Cambodian": "Cambodia"
"Cameroonian": "Cameroon"
"Canadian": "Canada"
"Cantonese": "Hong Kong"
"Caymanian": "Cayman Islands"
"Central African": "Central African Republic"
"Chadian": "Chad"
"Channel Island": "Guernsey"
"Chilean": "Chile"
"Chinese": "China"
"Christmas Island": "Christmas Island"
"Cocos Island": "Cocos (Keeling) Islands"
"Colombian": "Colombia"
"Comoran": "Comoros"
"Comorian": "Comoros"
"Congolese": "Congo"
"Cook Island": "Cook Islands"
"Costa Rican": "Costa Rica"
"Croatian": "Croatia"
"Cuban": "Cuba"
"Curaçaoan": "Curaçao"
"Cypriot": "Cyprus"
"Czech": "Czech Republic"
"Danish": "Denmark"
"Djiboutian": "Djibouti"
"Dominican": "Dominica"
"Dutch": "Netherlands"
"Ecuadorian": "Ecuador"
"Egyptian": "Egypt"
"Emirati": "United Arab Emirates"
"Emiri": "United Arab Emirates"
"Emirian": "United Arab Emirates"
"English people": "England"
"English": "England"
"Equatoguinean": "Equatorial Guinea"
"Equatorial Guinean": "Equatorial Guinea"
"Eritrean": "Eritrea"
"Estonian": "Estonia"
"Ethiopian": "Ethiopia"
"European": "European Union"
"Falkland Island": "Falkland Islands"
"Faroese": "Faroe Islands"
"Fijian": "Fiji"
"Filipino": "Philippines"
"Finnish": "Finland"
"Formosan": "Taiwan"
"French Guianese": "French Guiana"
"French Polynesian": "French Polynesia"
"French Southern Territories": "French Southern Territories"
"French": "France"
"Futunan": "Wallis and Futuna"
"Gabonese": "Gabon"
"Gambian": "Gambia"
"Georgian": "Georgia"
"German": "Germany"
"Ghanaian": "Ghana"
"Gibraltar": "Gibraltar"
"Greek": "Greece"
"Greenlandic": "Greenland"
"Grenadian": "Grenada"
"Guadeloupe": "Guadeloupe"
"Guamanian": "Guam"
"Guatemalan": "Guatemala"
"Guinean": "Guinea"
"Guyanese": "Guyana"
"Haitian": "Haiti"
"Heard Island": "Heard Island and McDonald Islands"
"Hellenic": "Greece"
"Herzegovinian": "Bosnia and Herzegovina"
"Honduran": "Honduras"
"Hong Kong": "Hong Kong"
"Hong Konger": "Hong Kong"
"Hungarian": "Hungary"
"Icelandic": "Iceland"
"Indian": "India"
"Indonesian": "Indonesia"
"Iranian": "Iran"
"Iraqi": "Iraq"
"Irish": "Ireland"
"Israeli": "Israel"
"Israelite": "Israel"
"Italian": "Italy"
"Ivorian": "Ivory Coast"
"Jamaican": "Jamaica"
"Jan Mayen": "Jan Mayen"
"Japanese": "Japan"
"Jordanian": "Jordan"
"Kazakh": "Kazakhstan"
"Kazakhstani": "Kazakhstan"
"Kenyan": "Kenya"
"Kirghiz": "Kyrgyzstan"
"Kirgiz": "Kyrgyzstan"
"Kiribati": "Kiribati"
"Korean": "South Korea"
"Kosovan": "Kosovo"
"Kosovar": "Kosovo"
"Kuwaiti": "Kuwait"
"Kyrgyz": "Kyrgyzstan"
"Kyrgyzstani": "Kyrgyzstan"
"Lao": "Lao People's Democratic Republic"
"Laotian": "Lao People's Democratic Republic"
"Latvian": "Latvia"
"Lebanese": "Lebanon"
"Lettish": "Latvia"
"Liberian": "Liberia"
"Libyan": "Libya"
"Liechtensteiner": "Liechtenstein"
"Lithuanian": "Lithuania"
"Luxembourg": "Luxembourg"
"Luxembourgish": "Luxembourg"
"Macanese": "Macau"
"Macedonian": "North Macedonia"
"Magyar": "Hungary"
"Mahoran": "Mayotte"
"Malagasy": "Madagascar"
"Malawian": "Malawi"
"Malaysian": "Malaysia"
"Maldivian": "Maldives"
"Malian": "Mali"
"Malinese": "Mali"
"Maltese": "Malta"
"Manx": "Isle of Man"
"Marshallese": "Marshall Islands"
"Martinican": "Martinique"
"Martiniquais": "Martinique"
"Mauritanian": "Mauritania"
"Mauritian": "Mauritius"
"McDonald Islands": "Heard Island and McDonald Islands"
"Mexican": "Mexico"
"Moldovan": "Moldova"
"Monacan": "Monaco"
"Mongolian": "Mongolia"
"Montenegrin": "Montenegro"
"Montserratian": "Montserrat"
"Monégasque": "Monaco"
"Moroccan": "Morocco"
"Motswana": "Botswana"
"Mozambican": "Mozambique"
"Myanma": "Myanmar"
"Namibian": "Namibia"
"Nauruan": "Nauru"
"Nepalese": "Nepal"
"Nepali": "Nepal"
"Netherlandic": "Netherlands"
"New Caledonian": "New Caledonia"
"New Zealand": "New Zealand"
"Ni-Vanuatu": "Vanuatu"
"Nicaraguan": "Nicaragua"
"Nigerian": "Nigeria"
"Nigerien": "Niger"
"Niuean": "Niue"
"Norfolk Island": "Norfolk Island"
"Northern Irish": "Northern Ireland"
"Northern Marianan": "Northern Mariana Islands"
"Norwegian": "Norway"
"Omani": "Oman"
"Pakistani": "Pakistan"
"Palauan": "Palau"
"Palestinian": "Palestine"
"Panamanian": "Panama"
"Papua New Guinean": "Papua New Guinea"
"Papuan": "Papua New Guinea"
"Paraguayan": "Paraguay"
"Persian": "Iran"
"Peruvian": "Peru"
"Philippine": "Philippines"
"Pitcairn Island": "Pitcairn Islands"
"Polish": "Poland"
"Portuguese": "Portugal"
"Puerto Rican": "Puerto Rico"
"Qatari": "Qatar"
"Romanian": "Romania"
"Russian": "Russia"
"Rwandan": "Rwanda"
"Saba": "Saba"
"Saban": "Saba"
"Sahraouian": "Western Sahara"
"Sahrawi": "Western Sahara"
"Sahrawian": "Western Sahara"
"Salvadoran": "El Salvador"
"Sammarinese": "San Marino"
"Samoan": "Samoa"
"Saudi Arabian": "Saudi Arabia"
"Saudi": "Saudi Arabia"
"Scottish": "Scotland"
"Senegalese": "Senegal"
"Serbian": "Serbia"
"Seychellois": "Seychelles"
"Sierra Leonean": "Sierra Leone"
"Singapore": "Singapore"
"Singaporean": "Singapore"
"Slovak": "Slovakia"
"Slovene": "Slovenia"
"Slovenian": "Slovenia"
"Solomon Island": "Solomon Islands"
"Somali": "Somalia"
"Somalilander": "Somaliland"
"South African": "South Africa"
"South Georgia Island": "South Georgia and the South Sandwich Islands"
"South Ossetian": "South Ossetia"
"South Sandwich Island": "South Georgia and the South Sandwich Islands"
"South Sudanese": "South Sudan"
"Spanish": "Spain"
"Sri Lankan": "Sri Lanka"
"Sudanese": "Sudan"
"Surinamese": "Suriname"
"Svalbard resident": "Svalbard"
"Swati": "Eswatini"
"Swazi": "Eswatini"
"Swedish": "Sweden"
"Swiss": "Switzerland"
"Syrian": "Syrian Arab Republic"
"Taiwanese": "Taiwan"
"Tajikistani": "Tajikistan"
"Tanzanian": "Tanzania"
"Thai": "Thailand"
"Timorese": "Timor-Leste"
"Tobagonian": "Trinidad and Tobago"
"Togolese": "Togo"
"Tokelauan": "Tokelau"
"Tongan": "Tonga"
"Trinidadian": "Trinidad and Tobago"
"Tunisian": "Tunisia"
"Turkish": "Turkey"
"Turkmen": "Turkmenistan"
"Turks and Caicos Island": "Turks and Caicos Islands"
"Tuvaluan": "Tuvalu"
"Ugandan": "Uganda"
"Ukrainian": "Ukraine"
"Uruguayan": "Uruguay"
"Uzbek": "Uzbekistan"
"Uzbekistani": "Uzbekistan"
"Vanuatuan": "Vanuatu"
"Vatican": "Vatican City State"
"Venezuelan": "Venezuela"
"Vietnamese": "Vietnam"
"Wallis and Futuna": "Wallis and Futuna"
"Wallisian": "Wallis and Futuna"
"Welsh": "Wales"
"Yemeni": "Yemen"
"Zambian": "Zambia"
"Zimbabwean": "Zimbabwe"
"Åland Island": "Åland Islands"
Image:
selector: //div[@class="item active"]/img/@src
postProcess:
- replace:
- regex: ^
with: "https:"
Details:
selector: //div[@class="video-descr__section col-md-12"]//p[2]/text()
# Last Updated December 23, 2022