modify scripts

This commit is contained in:
2025-07-26 19:13:40 +08:00
parent 228566a6f3
commit 7e1b905afe

View File

@ -169,7 +169,7 @@ class JavbusSpiderSpider(BaseSpider):
movies_cnt = titles.get('movies_cnt', 0)
if not self.need_update_actor(href=actor_url, movies_cnt=movies_cnt):
self.crawler.stats.inc_value(f"{self.name}/actor_done")
self.logger.info(f"actor ({actor_name}) up to date. skipping... url: {actor_url}")
self.logger.info(f"actor ({actor_name}) up to date. movies cnt: {movies_cnt} skipping... url: {actor_url}")
return None
# 需要更新了,先翻页
@ -275,7 +275,9 @@ class JavbusSpiderSpider(BaseSpider):
if href == '':
return
if is_valid_url(href):
# 只有en和ja需要手动补齐一下zh
langs_url = generate_multilang_urls(href)
langs_url['zh'] = href
for lang, next_url in langs_url.items():
if not self._can_request(next_url):
continue
@ -328,6 +330,7 @@ class JavbusSpiderSpider(BaseSpider):
name_key = f"{lang}_name" if lang !='zh' else 'name'
if name_key in item.fields:
item[name_key] = title_meta.get('title')
self.logger.debug(f"movies list ({prefix}) title: {title_meta}")
if not response.meta.get('from_cache'):
yield item