modify scripts
This commit is contained in:
@ -90,8 +90,8 @@ class PornboxSpider(BaseSpider):
|
|||||||
|
|
||||||
self.logger.info(f"url: {response.url}, total: {total_pages}, items: {len(data.get('items', []))}")
|
self.logger.info(f"url: {response.url}, total: {total_pages}, items: {len(data.get('items', []))}")
|
||||||
|
|
||||||
|
'''
|
||||||
# 由于 item 中不包含页码信息,我们需要从 spider 的属性中获取
|
# 由于 item 中不包含页码信息,我们需要从 spider 的属性中获取
|
||||||
# 注意:这种方法依赖于 spider 中保存了当前页码
|
|
||||||
json_dir = './pbox'
|
json_dir = './pbox'
|
||||||
os.makedirs(json_dir, exist_ok=True)
|
os.makedirs(json_dir, exist_ok=True)
|
||||||
file_path = os.path.join(json_dir, f"{current_page}.json")
|
file_path = os.path.join(json_dir, f"{current_page}.json")
|
||||||
@ -100,6 +100,7 @@ class PornboxSpider(BaseSpider):
|
|||||||
with open(file_path, 'w', encoding='utf-8') as f:
|
with open(file_path, 'w', encoding='utf-8') as f:
|
||||||
pass
|
pass
|
||||||
#json.dump(data, f, ensure_ascii=False, indent=2)
|
#json.dump(data, f, ensure_ascii=False, indent=2)
|
||||||
|
'''
|
||||||
|
|
||||||
# 处理每个工作室项目
|
# 处理每个工作室项目
|
||||||
for item in data.get('items', []):
|
for item in data.get('items', []):
|
||||||
|
|||||||
Reference in New Issue
Block a user