modify scripts

This commit is contained in:
2025-11-14 13:32:18 +08:00
parent 1848510b65
commit f189dcfaca
4 changed files with 238 additions and 0 deletions

View File

@@ -0,0 +1,110 @@
# Display name of this scraper.
name: Javbus

# Scene lookup by file name: the file name is rewritten by the rules below and
# substituted into queryURL; the fetched page is parsed by sceneScraper.
sceneByFragment:
  action: scrapeXPath
  queryURL: 'https://www.javbus.com/{filename}'
  queryURLReplace:
    filename:
      # Remove a "-JG<digit>" marker.
      - regex: '-JG\d'
        with: ''
      # Keep only capture group 2: letters/hyphens followed by digits.
      - regex: '(.*[^a-zA-Z0-9])*([a-zA-Z-]+\d+)(.+)'
        with: '$2'
  scraper: sceneScraper
# Scene lookup by URL: URLs on any of the listed hosts are parsed by
# sceneScraper.
sceneByURL:
  - action: scrapeXPath
    url:
      - 'https://www.javbus.com'
      - 'https://www.seejav.bid'
      - 'https://www.cdnbus.lol'
      - 'https://www.dmmbus.lol'
      - 'https://www.seedmm.cfd'
    scraper: sceneScraper
# Scene search by name: the query replaces "{}" in the search URL and the
# result list is parsed by sceneSearch.
sceneByName:
  action: scrapeXPath
  queryURL: 'https://www.javbus.com/search/{}&type=&parent=ce'
  scraper: sceneSearch

# Follow-up for a chosen search result: its URL is fetched as-is and parsed by
# sceneScraper.
sceneByQueryFragment:
  action: scrapeXPath
  queryURL: '{url}'
  scraper: sceneScraper
# Performer lookup by URL: URLs on any of the listed hosts are parsed by
# performerScraper.
performerByURL:
  - action: scrapeXPath
    url:
      - 'https://www.javbus.com'
      - 'https://www.seejav.bid'
      - 'https://www.cdnbus.lol'
      - 'https://www.dmmbus.lol'
      - 'https://www.seedmm.cfd'
    scraper: performerScraper

# Performer search by name: the query replaces "{}" in the search URL and the
# result list is parsed by performerSearch.
performerByName:
  action: scrapeXPath
  queryURL: 'https://www.javbus.com/searchstar/{}&type=&parent=ce'
  scraper: performerSearch
# XPath extraction rules; each entry is referenced by name from the `scraper`
# key of the actions in this file.
xPathScrapers:
  # Search-result list for performers: display name and link per hit.
  performerSearch:
    performer:
      Name: //span[@class="mleft"]
      URL: //*[@id="waterfall"]/div/a/@href

  # Single performer page.
  performerScraper:
    performer:
      Name: //*[@id="waterfall"]/div[1]/div/div[2]/span
      Birthdate:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '生日')]
        postProcess:
          - replace:
              # Drop everything up to and including the first space.
              # The replacement is an explicit empty string rather than a bare
              # `with:` key, which YAML parses as null.
              - regex: '^(.*? ){1}'
                with: ''
      Height:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '身高')]
        postProcess:
          - replace:
              # Same prefix removal as Birthdate.
              - regex: '^(.*? ){1}'
                with: ''
      # Measurements: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '胸圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '腰圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '臀圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '罩杯')]
      Image:
        selector: //*[@id="waterfall"]/div[1]/div/div[1]/img/@src
        postProcess:
          - replace:
              # Prepend the site root to the extracted src value.
              - regex: '^'
                with: 'https://www.javbus.com'

  # Search-result list for scenes: title and link per hit.
  sceneSearch:
    scene:
      Title: //div[@class="photo-info"]/span
      URL: //*[@id="waterfall"]/div/a/@href

  # Single scene page. Most fields are read from the "col-md-3 info" panel by
  # locating the label span and taking a sibling node.
  sceneScraper:
    scene:
      Title:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '識別碼')]/../span[2]/text()
      URL:
        selector: /html/head/link[@hreflang="zh"]/@href
      Date:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '發行日期')]/../text()
      Details:
        selector: //div[@class="container"]/h3/text()
        postProcess:
          - replace:
              # Drop everything up to and including the first space.
              - regex: '^(.*? ){1}'
                with: ''
      Tags:
        Name: //div[@class="col-md-3 info"]//span[@class="genre"]/label/a/text()
      Performers:
        Name: //div[@class="star-name"]/a
      # Uses the same label-span pattern as Studio below. The previous selector
      # (//div[@id='video_director']/table/...) addressed a layout that no
      # other rule in this scraper relies on.
      # NOTE(review): label text '導演' is assumed - confirm against a live page.
      Director: //div[@class="col-md-3 info"]//span[contains(text(), '導演')]/../a/text()
      Image:
        selector: //div[@class="row movie"]/div[@class="col-md-9 screencap"]/a[@class="bigImage"]/img/@src
        postProcess:
          - replace:
              # Prepend the site root to the extracted src value.
              - regex: '^'
                with: 'https://www.javbus.com'
      Studio:
        Name: //div[@class="col-md-3 info"]//span[contains(text(), '發行商')]/../a/text()
# HTTP request headers sent with every fetch made by this scraper.
driver:
  headers:
    - Key: User-Agent
      Value: 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/138.0.0.0 Safari/537.36'
    - Key: Accept-Language
      Value: zh-cn
# Last Updated Aug 01, 2025

View File

@@ -0,0 +1,9 @@
# Manifest for the Javbus scraper: identity, version stamp, origin index and
# the files that belong to it.
id: JavBus
name: Javbus
metadata: {}
# Quoted so the hash-like value is always read as a string.
version: 'b4672ccf'
date: '2025-08-01 16:01:27'
requires: []
source_repository: 'https://stashapp.github.io/CommunityScrapers/stable/index.yml'
files:
  - JavBus.yml

View File

@@ -0,0 +1,110 @@
# Display name of this scraper.
name: Javbus_en

# Scene lookup by file name: the file name is rewritten by the rules below and
# substituted into queryURL (under /en); the fetched page is parsed by
# sceneScraper.
sceneByFragment:
  action: scrapeXPath
  queryURL: 'https://www.javbus.com/en/{filename}'
  queryURLReplace:
    filename:
      # Remove a "-JG<digit>" marker.
      - regex: '-JG\d'
        with: ''
      # Keep only capture group 2: letters/hyphens followed by digits.
      - regex: '(.*[^a-zA-Z0-9])*([a-zA-Z-]+\d+)(.+)'
        with: '$2'
  scraper: sceneScraper
# Scene lookup by URL: URLs starting with any of the listed prefixes are parsed
# by sceneScraper. Only the first entry carries the /en path.
sceneByURL:
  - action: scrapeXPath
    url:
      - 'https://www.javbus.com/en'
      - 'https://www.seejav.bid'
      - 'https://www.cdnbus.lol'
      - 'https://www.dmmbus.lol'
      - 'https://www.seedmm.cfd'
    scraper: sceneScraper
# Scene search by name: the query replaces "{}" in the /en search URL and the
# result list is parsed by sceneSearch.
sceneByName:
  action: scrapeXPath
  queryURL: 'https://www.javbus.com/en/search/{}&type=&parent=ce'
  scraper: sceneSearch

# Follow-up for a chosen search result: its URL is fetched as-is and parsed by
# sceneScraper.
sceneByQueryFragment:
  action: scrapeXPath
  queryURL: '{url}'
  scraper: sceneScraper
# Performer lookup by URL: URLs starting with any of the listed prefixes are
# parsed by performerScraper. Only the first entry carries the /en path.
performerByURL:
  - action: scrapeXPath
    url:
      - 'https://www.javbus.com/en'
      - 'https://www.seejav.bid'
      - 'https://www.cdnbus.lol'
      - 'https://www.dmmbus.lol'
      - 'https://www.seedmm.cfd'
    scraper: performerScraper

# Performer search by name: the query replaces "{}" in the /en search URL and
# the result list is parsed by performerSearch.
performerByName:
  action: scrapeXPath
  queryURL: 'https://www.javbus.com/en/searchstar/{}&type=&parent=ce'
  scraper: performerSearch
# XPath extraction rules; each entry is referenced by name from the `scraper`
# key of the actions in this file.
#
# NOTE(review): pages are requested under /en, so their field labels are
# presumably English. Every label predicate below therefore accepts either the
# original Chinese text or an English equivalent; the English spellings are
# assumed and should be confirmed against a live /en page.
xPathScrapers:
  # Search-result list for performers: display name and link per hit.
  performerSearch:
    performer:
      Name: //span[@class="mleft"]
      URL: //*[@id="waterfall"]/div/a/@href

  # Single performer page.
  performerScraper:
    performer:
      Name: //*[@id="waterfall"]/div[1]/div/div[2]/span
      Birthdate:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '生日') or contains(text(), 'Birthday')]
        postProcess:
          - replace:
              # Drop everything up to and including the first space.
              # The replacement is an explicit empty string rather than a bare
              # `with:` key, which YAML parses as null.
              - regex: '^(.*? ){1}'
                with: ''
      Height:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '身高') or contains(text(), 'Height')]
        postProcess:
          - replace:
              # Same prefix removal as Birthdate.
              - regex: '^(.*? ){1}'
                with: ''
      # Measurements: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '胸圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '腰圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '臀圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '罩杯')]
      Image:
        selector: //*[@id="waterfall"]/div[1]/div/div[1]/img/@src
        postProcess:
          - replace:
              # Prepend the site root, not the /en section: the value is glued
              # directly in front of the extracted src, so an "/en" suffix here
              # would push a root-relative image path under /en/.
              - regex: '^'
                with: 'https://www.javbus.com'

  # Search-result list for scenes: title and link per hit.
  sceneSearch:
    scene:
      Title: //div[@class="photo-info"]/span
      URL: //*[@id="waterfall"]/div/a/@href

  # Single scene page. Most fields are read from the "col-md-3 info" panel by
  # locating the label span and taking a sibling node.
  sceneScraper:
    scene:
      Title:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '識別碼') or contains(text(), 'ID:')]/../span[2]/text()
      URL:
        # NOTE(review): this returns the hreflang="zh" alternate link even
        # though the scraper targets /en - confirm that is intended.
        selector: /html/head/link[@hreflang="zh"]/@href
      Date:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '發行日期') or contains(text(), 'Release Date')]/../text()
      Details:
        selector: //div[@class="container"]/h3/text()
        postProcess:
          - replace:
              # Drop everything up to and including the first space.
              - regex: '^(.*? ){1}'
                with: ''
      Tags:
        Name: //div[@class="col-md-3 info"]//span[@class="genre"]/label/a/text()
      Performers:
        Name: //div[@class="star-name"]/a
      # Uses the same label-span pattern as Studio below. The previous selector
      # (//div[@id='video_director']/table/...) addressed a layout that no
      # other rule in this scraper relies on.
      Director: //div[@class="col-md-3 info"]//span[contains(text(), '導演') or contains(text(), 'Director')]/../a/text()
      Image:
        selector: //div[@class="row movie"]/div[@class="col-md-9 screencap"]/a[@class="bigImage"]/img/@src
        postProcess:
          - replace:
              # Prepend the site root, not the /en section (see the performer
              # Image rule: the prefix is concatenated verbatim).
              - regex: '^'
                with: 'https://www.javbus.com'
      Studio:
        Name: //div[@class="col-md-3 info"]//span[contains(text(), '發行商') or contains(text(), 'Label')]/../a/text()
# HTTP request headers sent with every fetch made by this scraper.
# NOTE(review): Accept-Language is zh-cn although the URLs above target /en -
# confirm this is intentional.
driver:
  headers:
    - Key: User-Agent
      Value: 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/138.0.0.0 Safari/537.36'
    - Key: Accept-Language
      Value: zh-cn
# Last Updated Aug 01, 2025

View File

@@ -0,0 +1,9 @@
# Manifest for the Javbus_en scraper: identity, version stamp, origin index and
# the files that belong to it.
id: JavBus_en
name: Javbus_en
metadata: {}
# Quoted so the hash-like value is always read as a string.
version: 'b4672ccf'
date: '2025-08-01 16:01:27'
requires: []
source_repository: 'https://stashapp.github.io/CommunityScrapers/stable/index.yml'
files:
  - JavBus_en.yml