From f189dcfaca7e868308d2bf2701f2c63af5757543 Mon Sep 17 00:00:00 2001
From: sophon
Date: Fri, 14 Nov 2025 13:32:18 +0800
Subject: [PATCH] modify scripts

---
 .../stash/scripts/scrapers/JavBus/JavBus.yml  | 120 +++++++++++++++++
 docker/stash/scripts/scrapers/JavBus/manifest |   9 ++
 .../scripts/scrapers/JavBus_en/JavBus_en.yml  | 123 ++++++++++++++++++
 .../stash/scripts/scrapers/JavBus_en/manifest |   9 ++
 4 files changed, 261 insertions(+)
 create mode 100644 docker/stash/scripts/scrapers/JavBus/JavBus.yml
 create mode 100644 docker/stash/scripts/scrapers/JavBus/manifest
 create mode 100644 docker/stash/scripts/scrapers/JavBus_en/JavBus_en.yml
 create mode 100644 docker/stash/scripts/scrapers/JavBus_en/manifest

diff --git a/docker/stash/scripts/scrapers/JavBus/JavBus.yml b/docker/stash/scripts/scrapers/JavBus/JavBus.yml
new file mode 100644
index 0000000..d5bb2a2
--- /dev/null
+++ b/docker/stash/scripts/scrapers/JavBus/JavBus.yml
@@ -0,0 +1,120 @@
+# Stash XPath scraper for JavBus: scenes by filename, URL or name, and
+# performers by URL or name. The selectors below match Chinese field labels,
+# and the driver section sends Accept-Language: zh-cn.
+name: Javbus
+sceneByFragment:
+  action: scrapeXPath
+  queryURL: https://www.javbus.com/{filename}
+  queryURLReplace:
+    filename:
+      # Remove any "-JG<digit>" marker, then keep only capture group 2 (letters
+      # or dashes followed by digits), dropping the text around it.
+      - regex: -JG\d
+        with: ""
+      - regex: (.*[^a-zA-Z0-9])*([a-zA-Z-]+\d+)(.+)
+        with: $2
+  scraper: sceneScraper
+sceneByURL:
+  - action: scrapeXPath
+    url:
+      - https://www.javbus.com
+      - https://www.seejav.bid
+      - https://www.cdnbus.lol
+      - https://www.dmmbus.lol
+      - https://www.seedmm.cfd
+    scraper: sceneScraper
+sceneByName:
+  action: scrapeXPath
+  queryURL: https://www.javbus.com/search/{}&type=&parent=ce
+  scraper: sceneSearch
+sceneByQueryFragment:
+  action: scrapeXPath
+  queryURL: "{url}"
+  scraper: sceneScraper
+
+performerByURL:
+  - action: scrapeXPath
+    url:
+      - https://www.javbus.com
+      - https://www.seejav.bid
+      - https://www.cdnbus.lol
+      - https://www.dmmbus.lol
+      - https://www.seedmm.cfd
+    scraper: performerScraper
+performerByName:
+  action: scrapeXPath
+  queryURL: https://www.javbus.com/searchstar/{}&type=&parent=ce
+  scraper: performerSearch
+
+xPathScrapers:
+  performerSearch:
+    performer:
+      Name: //span[@class="mleft"]
+      URL: //*[@id="waterfall"]/div/a/@href
+  performerScraper:
+    performer:
+      Name: //*[@id="waterfall"]/div[1]/div/div[2]/span
+      Birthdate:
+        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '生日')]
+        postProcess:
+          - replace:
+              # Strip everything up to and including the first space.
+              - regex: ^(.*? ){1}
+                with: ""
+      Height:
+        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '身高')]
+        postProcess:
+          - replace:
+              # Strip everything up to and including the first space.
+              - regex: ^(.*? ){1}
+                with: ""
+      # Measurements: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '胸圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '腰圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '臀圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '罩杯')]
+      Image:
+        selector: //*[@id="waterfall"]/div[1]/div/div[1]/img/@src
+        postProcess:
+          - replace:
+              # Prefix the site origin; assumes src is site-relative - TODO confirm.
+              - regex: ^
+                with: https://www.javbus.com
+
+  sceneSearch:
+    scene:
+      Title: //div[@class="photo-info"]/span
+      URL: //*[@id="waterfall"]/div/a/@href
+  sceneScraper:
+    scene:
+      Title:
+        selector: //div[@class="col-md-3 info"]//span[contains(text(), '識別碼')]/../span[2]/text()
+      URL:
+        selector: /html/head/link[@hreflang="zh"]/@href
+      Date:
+        selector: //div[@class="col-md-3 info"]//span[contains(text(), '發行日期')]/../text()
+      Details:
+        selector: //div[@class="container"]/h3/text()
+        postProcess:
+          - replace:
+              # Strip everything up to and including the first space.
+              - regex: ^(.*? ){1}
+                with: ""
+      Tags:
+        Name: //div[@class="col-md-3 info"]//span[@class="genre"]/label/a/text()
+      Performers:
+        Name: //div[@class="star-name"]/a
+      Director: //div[@id='video_director']/table/tbody/tr/td[@class="text"]/span/a/text()
+      Image:
+        selector: //div[@class="row movie"]/div[@class="col-md-9 screencap"]/a[@class="bigImage"]/img/@src
+        postProcess:
+          - replace:
+              # Prefix the site origin; assumes src is site-relative - TODO confirm.
+              - regex: ^
+                with: https://www.javbus.com
+      Studio:
+        Name: //div[@class="col-md-3 info"]//span[contains(text(), '發行商')]/../a/text()
+
+driver:
+  headers:
+    - Key: User-Agent
+      Value: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/138.0.0.0 Safari/537.36
+    - Key: Accept-Language
+      Value: zh-cn
+# Last Updated Aug 01, 2025
diff --git a/docker/stash/scripts/scrapers/JavBus/manifest b/docker/stash/scripts/scrapers/JavBus/manifest
new file mode 100644
index 0000000..fc3a93d
--- /dev/null
+++ b/docker/stash/scripts/scrapers/JavBus/manifest
@@ -0,0 +1,9 @@
+id: JavBus
+name: Javbus
+metadata: {}
+version: b4672ccf
+date: "2025-08-01 16:01:27"
+requires: []
+source_repository: https://stashapp.github.io/CommunityScrapers/stable/index.yml
+files:
+- JavBus.yml
diff --git a/docker/stash/scripts/scrapers/JavBus_en/JavBus_en.yml b/docker/stash/scripts/scrapers/JavBus_en/JavBus_en.yml
new file mode 100644
index 0000000..122e4cd
--- /dev/null
+++ b/docker/stash/scripts/scrapers/JavBus_en/JavBus_en.yml
@@ -0,0 +1,123 @@
+# Stash XPath scraper for JavBus using the /en URLs: scenes by filename, URL
+# or name, and performers by URL or name.
+# NOTE(review): the selectors still match Chinese field labels and the driver
+# sends Accept-Language: zh-cn; confirm this works against the /en pages.
+name: Javbus_en
+sceneByFragment:
+  action: scrapeXPath
+  queryURL: https://www.javbus.com/en/{filename}
+  queryURLReplace:
+    filename:
+      # Remove any "-JG<digit>" marker, then keep only capture group 2 (letters
+      # or dashes followed by digits), dropping the text around it.
+      - regex: -JG\d
+        with: ""
+      - regex: (.*[^a-zA-Z0-9])*([a-zA-Z-]+\d+)(.+)
+        with: $2
+  scraper: sceneScraper
+sceneByURL:
+  - action: scrapeXPath
+    url:
+      - https://www.javbus.com/en
+      - https://www.seejav.bid
+      - https://www.cdnbus.lol
+      - https://www.dmmbus.lol
+      - https://www.seedmm.cfd
+    scraper: sceneScraper
+sceneByName:
+  action: scrapeXPath
+  queryURL: https://www.javbus.com/en/search/{}&type=&parent=ce
+  scraper: sceneSearch
+sceneByQueryFragment:
+  action: scrapeXPath
+  queryURL: "{url}"
+  scraper: sceneScraper
+
+performerByURL:
+  - action: scrapeXPath
+    url:
+      - https://www.javbus.com/en
+      - https://www.seejav.bid
+      - https://www.cdnbus.lol
+      - https://www.dmmbus.lol
+      - https://www.seedmm.cfd
+    scraper: performerScraper
+performerByName:
+  action: scrapeXPath
+  queryURL: https://www.javbus.com/en/searchstar/{}&type=&parent=ce
+  scraper: performerSearch
+
+xPathScrapers:
+  performerSearch:
+    performer:
+      Name: //span[@class="mleft"]
+      URL: //*[@id="waterfall"]/div/a/@href
+  performerScraper:
+    performer:
+      Name: //*[@id="waterfall"]/div[1]/div/div[2]/span
+      Birthdate:
+        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '生日')]
+        postProcess:
+          - replace:
+              # Strip everything up to and including the first space.
+              - regex: ^(.*? ){1}
+                with: ""
+      Height:
+        selector: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '身高')]
+        postProcess:
+          - replace:
+              # Strip everything up to and including the first space.
+              - regex: ^(.*? ){1}
+                with: ""
+      # Measurements: //*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '胸圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '腰圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '臀圍')]//*[@id="waterfall"]/div[1]/div/div[2]/p[contains(text(), '罩杯')]
+      Image:
+        selector: //*[@id="waterfall"]/div[1]/div/div[1]/img/@src
+        postProcess:
+          - replace:
+              # Prefix the site origin plus /en to the scraped src value.
+              # NOTE(review): JavBus.yml prefixes only the origin; confirm /en.
+              - regex: ^
+                with: https://www.javbus.com/en
+
+  sceneSearch:
+    scene:
+      Title: //div[@class="photo-info"]/span
+      URL: //*[@id="waterfall"]/div/a/@href
+  sceneScraper:
+    scene:
+      Title:
+        selector: //div[@class="col-md-3 info"]//span[contains(text(), '識別碼')]/../span[2]/text()
+      URL:
+        selector: /html/head/link[@hreflang="zh"]/@href
+      Date:
+        selector: //div[@class="col-md-3 info"]//span[contains(text(), '發行日期')]/../text()
+      Details:
+        selector: //div[@class="container"]/h3/text()
+        postProcess:
+          - replace:
+              # Strip everything up to and including the first space.
+              - regex: ^(.*? ){1}
+                with: ""
+      Tags:
+        Name: //div[@class="col-md-3 info"]//span[@class="genre"]/label/a/text()
+      Performers:
+        Name: //div[@class="star-name"]/a
+      Director: //div[@id='video_director']/table/tbody/tr/td[@class="text"]/span/a/text()
+      Image:
+        selector: //div[@class="row movie"]/div[@class="col-md-9 screencap"]/a[@class="bigImage"]/img/@src
+        postProcess:
+          - replace:
+              # Prefix the site origin plus /en to the scraped src value.
+              # NOTE(review): JavBus.yml prefixes only the origin; confirm /en.
+              - regex: ^
+                with: https://www.javbus.com/en
+      Studio:
+        Name: //div[@class="col-md-3 info"]//span[contains(text(), '發行商')]/../a/text()
+
+driver:
+  headers:
+    - Key: User-Agent
+      Value: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/138.0.0.0 Safari/537.36
+    - Key: Accept-Language
+      Value: zh-cn
+# Last Updated Aug 01, 2025
diff --git a/docker/stash/scripts/scrapers/JavBus_en/manifest b/docker/stash/scripts/scrapers/JavBus_en/manifest
new file mode 100644
index 0000000..62c4646
--- /dev/null
+++ b/docker/stash/scripts/scrapers/JavBus_en/manifest
@@ -0,0 +1,9 @@
+id: JavBus_en
+name: Javbus_en
+metadata: {}
+version: b4672ccf
+date: "2025-08-01 16:01:27"
+requires: []
+source_repository: https://stashapp.github.io/CommunityScrapers/stable/index.yml
+files:
+- JavBus_en.yml