规范下面这段代码格式# Define your item pipelines here # # Don't forget to add your pipeline to the ITEM_PIPELINES setting # See: https://docs.scrapy.org/en/latest/topics/item-pipeline.html # useful for handling different item types with a single interface import openpyxl from itemadapter import ItemAdapter class TaobaospiderPipeline: def __init__(self): self.wb = openpyxl.Workbook() # 创建工作簿 self.ws = self.wb.active # 拿到默认激活的工作表 self.ws.title = 'TaoBaoData' # 工作表名称 self.ws.append(('标题','价格','销量','店铺名称','店铺地址')) # 表头 def close_spider(self, spider): # 爬虫停止运行的时候执行该方法,钩子函数,自己执行不需要调用 self.wb.save('淘宝商品数据.xlsx') def process_item(self, item, spider): title = item.get('title', '') # 如果字典中的title值为空的话,就把''(空值)赋给title变量,写法一 price = item.get('price') or 0 # 如果字典中的title值为空的话,就把''(空值)赋给title变量,写法二 deal_count = item.get('deal_count', '') shop = item.get('shop', '') location = item.get('location', '') self.ws.append((title, price, deal_count, shop, location)) # return item
时间: 2023-12-29 17:02:27 浏览: 158
# Define your item pipelines here
# Don't forget to add your pipeline to the ITEM_PIPELINES setting
# See: https://docs.scrapy.org/en/latest/topics/item-pipeline.html
# useful for handling different item types with a single interface
import openpyxl
from itemadapter import ItemAdapter
class TaobaoSpiderPipeline:
    """Scrapy item pipeline that collects scraped items into an Excel workbook.

    Each processed item becomes one row of an in-memory openpyxl worksheet;
    the workbook is written to disk once, when the spider is closed.
    """

    def __init__(self):
        """Create the workbook, name its active sheet and write the header row."""
        self.wb = openpyxl.Workbook()  # new in-memory workbook
        self.ws = self.wb.active  # the default active worksheet
        self.ws.title = 'TaoBaoData'  # worksheet name
        # Header row: title, price, sales volume, shop name, shop address.
        self.ws.append(('标题', '价格', '销量', '店铺名称', '店铺地址'))

    def close_spider(self, spider):
        """Save the workbook to disk.

        This is a hook that runs when the spider stops; it is invoked by the
        framework and is not meant to be called manually.

        Args:
            spider: The spider being closed (unused).
        """
        # Relative path, so the file lands in the process's working directory.
        self.wb.save('淘宝商品数据.xlsx')

    def process_item(self, item, spider):
        """Append one item to the worksheet as a row and pass the item on.

        Args:
            item: Mapping-like object exposing ``get``; the keys read are
                ``title``, ``price``, ``deal_count``, ``shop`` and
                ``location``.
            spider: The spider that produced the item (unused).

        Returns:
            The same ``item`` object, unchanged.
        """
        # Style 1: the default '' is used only when the key is missing.
        title = item.get('title', '')
        # Style 2: fall back to 0 when the key is missing OR its value is
        # falsy (None, '', 0, ...).
        price = item.get('price') or 0
        deal_count = item.get('deal_count', '')
        shop = item.get('shop', '')
        location = item.get('location', '')
        self.ws.append((title, price, deal_count, shop, location))
        return item
阅读全文