modify scripts
This commit is contained in:
110
docker/stash/scripts/scrapers/JavBus/JavBus.yml
Normal file
110
docker/stash/scripts/scrapers/JavBus/JavBus.yml
Normal file
@ -0,0 +1,110 @@
|
|||||||
|
# Stash XPath scraper definition for javbus.com (default-language pages).
name: Javbus

# Look a scene up from its file name.
sceneByFragment:
  action: scrapeXPath
  queryURL: https://www.javbus.com/{filename}
  queryURLReplace:
    filename:
      # Drop a "-JG<digit>" marker from the file name.
      - regex: -JG\d
        with: ""
      # Keep only the second capture group: a run of letters/hyphens
      # followed by digits; everything before and after it is discarded.
      - regex: (.*[^a-zA-Z0-9])*([a-zA-Z-]+\d+)(.+)
        with: $2
  scraper: sceneScraper
sceneByURL:
  - action: scrapeXPath
    url:
      - https://www.javbus.com
      - https://www.seejav.bid
      - https://www.cdnbus.lol
      - https://www.dmmbus.lol
      - https://www.seedmm.cfd
    scraper: sceneScraper
sceneByName:
  action: scrapeXPath
  queryURL: https://www.javbus.com/search/{}&type=&parent=ce
  scraper: sceneSearch
sceneByQueryFragment:
  action: scrapeXPath
  queryURL: "{url}"
  scraper: sceneScraper

performerByURL:
  - action: scrapeXPath
    url:
      - https://www.javbus.com
      - https://www.seejav.bid
      - https://www.cdnbus.lol
      - https://www.dmmbus.lol
      - https://www.seedmm.cfd
    scraper: performerScraper
performerByName:
  action: scrapeXPath
  queryURL: https://www.javbus.com/searchstar/{}&type=&parent=ce
  scraper: performerSearch

xPathScrapers:
  performerSearch:
    performer:
      Name: //span[@class="mleft"]
      URL: //*[@id="waterfall"]/div/a/@href
  performerScraper:
    performer:
      Name: //*[@id="waterfall"]/div[1]/div/div[2]/span
      Birthdate:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '生日')]
        postProcess:
          - replace:
              # Remove everything up to and including the first space.
              - regex: ^(.*? ){1}
                with: ""
      Height:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '身高')]
        postProcess:
          - replace:
              # Remove everything up to and including the first space.
              - regex: ^(.*? ){1}
                with: ""
      # Measurements: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '胸圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '腰圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '臀圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '罩杯')]
      Image:
        selector: //*[@id="waterfall"]/div[1]/div/div[1]/img/@src
        postProcess:
          - replace:
              # Prepend the site origin to the scraped @src value.
              - regex: ^
                with: https://www.javbus.com

  sceneSearch:
    scene:
      Title: //div[@class="photo-info"]/span
      URL: //*[@id="waterfall"]/div/a/@href
  sceneScraper:
    scene:
      Title:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '識別碼')]/../span[2]/text()
      URL:
        selector: /html/head/link[@hreflang="zh"]/@href
      Date:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '發行日期')]/../text()
      Details:
        selector: //div[@class="container"]/h3/text()
        postProcess:
          - replace:
              # Remove everything up to and including the first space.
              - regex: ^(.*? ){1}
                with: ""
      Tags:
        Name: //div[@class="col-md-3 info"]//span[@class="genre"]/label/a/text()
      Performers:
        Name: //div[@class="star-name"]/a
      # Follows the same "label span -> sibling link" shape as Studio below.
      # The previous selector was rooted at div[@id='video_director'], an id
      # no other selector in this file relies on.
      # NOTE(review): the '導演' label text is assumed - confirm against a live page.
      Director: //div[@class="col-md-3 info"]//span[contains(text(), '導演')]/../a/text()
      Image:
        selector: //div[@class="row movie"]/div[@class="col-md-9 screencap"]/a[@class="bigImage"]/img/@src
        postProcess:
          - replace:
              # Prepend the site origin to the scraped @src value.
              - regex: ^
                with: https://www.javbus.com
      Studio:
        Name: //div[@class="col-md-3 info"]//span[contains(text(), '發行商')]/../a/text()

# HTTP headers configured for the scraper driver.
driver:
  headers:
    - Key: User-Agent
      Value: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/138.0.0.0 Safari/537.36
    - Key: Accept-Language
      Value: zh-cn
# Last Updated Aug 01, 2025
|
||||||
9
docker/stash/scripts/scrapers/JavBus/manifest
Normal file
9
docker/stash/scripts/scrapers/JavBus/manifest
Normal file
@ -0,0 +1,9 @@
|
|||||||
|
# Package manifest for the JavBus scraper.
id: JavBus
name: Javbus
metadata: {}
version: b4672ccf
date: "2025-08-01 16:01:27"
requires: []
source_repository: https://stashapp.github.io/CommunityScrapers/stable/index.yml
# Files that belong to this package.
files:
  - JavBus.yml
|
||||||
110
docker/stash/scripts/scrapers/JavBus_en/JavBus_en.yml
Normal file
110
docker/stash/scripts/scrapers/JavBus_en/JavBus_en.yml
Normal file
@ -0,0 +1,110 @@
|
|||||||
|
# Stash XPath scraper definition for the /en section of javbus.com.
# NOTE(review): several selectors below match Chinese label text ('生日',
# '身高', '識別碼', '發行日期', '發行商') and the URL selector reads the
# hreflang="zh" link, while the queries target /en pages - confirm these
# still match the markup served there.
name: Javbus_en

# Look a scene up from its file name.
sceneByFragment:
  action: scrapeXPath
  queryURL: https://www.javbus.com/en/{filename}
  queryURLReplace:
    filename:
      # Drop a "-JG<digit>" marker from the file name.
      - regex: -JG\d
        with: ""
      # Keep only the second capture group: a run of letters/hyphens
      # followed by digits; everything before and after it is discarded.
      - regex: (.*[^a-zA-Z0-9])*([a-zA-Z-]+\d+)(.+)
        with: $2
  scraper: sceneScraper
sceneByURL:
  - action: scrapeXPath
    url:
      - https://www.javbus.com/en
      - https://www.seejav.bid
      - https://www.cdnbus.lol
      - https://www.dmmbus.lol
      - https://www.seedmm.cfd
    scraper: sceneScraper
sceneByName:
  action: scrapeXPath
  queryURL: https://www.javbus.com/en/search/{}&type=&parent=ce
  scraper: sceneSearch
sceneByQueryFragment:
  action: scrapeXPath
  queryURL: "{url}"
  scraper: sceneScraper

performerByURL:
  - action: scrapeXPath
    url:
      - https://www.javbus.com/en
      - https://www.seejav.bid
      - https://www.cdnbus.lol
      - https://www.dmmbus.lol
      - https://www.seedmm.cfd
    scraper: performerScraper
performerByName:
  action: scrapeXPath
  queryURL: https://www.javbus.com/en/searchstar/{}&type=&parent=ce
  scraper: performerSearch

xPathScrapers:
  performerSearch:
    performer:
      Name: //span[@class="mleft"]
      URL: //*[@id="waterfall"]/div/a/@href
  performerScraper:
    performer:
      Name: //*[@id="waterfall"]/div[1]/div/div[2]/span
      Birthdate:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '生日')]
        postProcess:
          - replace:
              # Remove everything up to and including the first space.
              - regex: ^(.*? ){1}
                with: ""
      Height:
        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '身高')]
        postProcess:
          - replace:
              # Remove everything up to and including the first space.
              - regex: ^(.*? ){1}
                with: ""
      # Measurements: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '胸圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '腰圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '臀圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '罩杯')]
      Image:
        selector: //*[@id="waterfall"]/div[1]/div/div[1]/img/@src
        postProcess:
          - replace:
              # Prepend the site origin, not the /en section: a root-relative
              # path resolves against the origin, so an "/en" prefix would
              # point at a different location.
              # NOTE(review): assumes @src is root-relative - confirm.
              - regex: ^
                with: https://www.javbus.com

  sceneSearch:
    scene:
      Title: //div[@class="photo-info"]/span
      URL: //*[@id="waterfall"]/div/a/@href
  sceneScraper:
    scene:
      Title:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '識別碼')]/../span[2]/text()
      URL:
        selector: /html/head/link[@hreflang="zh"]/@href
      Date:
        selector: //div[@class="col-md-3 info"]//span[contains(text(), '發行日期')]/../text()
      Details:
        selector: //div[@class="container"]/h3/text()
        postProcess:
          - replace:
              # Remove everything up to and including the first space.
              - regex: ^(.*? ){1}
                with: ""
      Tags:
        Name: //div[@class="col-md-3 info"]//span[@class="genre"]/label/a/text()
      Performers:
        Name: //div[@class="star-name"]/a
      # NOTE(review): rooted at div[@id='video_director'], unlike every other
      # scene selector here (all rooted at div[@class="col-md-3 info"]) -
      # verify this id exists on the target pages.
      Director: //div[@id='video_director']/table/tbody/tr/td[@class="text"]/span/a/text()
      Image:
        selector: //div[@class="row movie"]/div[@class="col-md-9 screencap"]/a[@class="bigImage"]/img/@src
        postProcess:
          - replace:
              # Prepend the site origin, not the /en section: a root-relative
              # path resolves against the origin, so an "/en" prefix would
              # point at a different location.
              # NOTE(review): assumes @src is root-relative - confirm.
              - regex: ^
                with: https://www.javbus.com
      Studio:
        Name: //div[@class="col-md-3 info"]//span[contains(text(), '發行商')]/../a/text()

# HTTP headers configured for the scraper driver.
driver:
  headers:
    - Key: User-Agent
      Value: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/138.0.0.0 Safari/537.36
    - Key: Accept-Language
      Value: zh-cn
# Last Updated Aug 01, 2025
|
||||||
9
docker/stash/scripts/scrapers/JavBus_en/manifest
Normal file
9
docker/stash/scripts/scrapers/JavBus_en/manifest
Normal file
@ -0,0 +1,9 @@
|
|||||||
|
# Package manifest for the JavBus_en scraper.
id: JavBus_en
name: Javbus_en
metadata: {}
version: b4672ccf
date: "2025-08-01 16:01:27"
requires: []
source_repository: https://stashapp.github.io/CommunityScrapers/stable/index.yml
# Files that belong to this package.
files:
  - JavBus_en.yml
|
||||||
Reference in New Issue
Block a user