目的:把提取到的内容封装成 item 进行结构化输出,item 的用法类似于字典

编写 items.py 文件

class JobBoleArticleItem(scrapy.Item):
    """Container for the scraped article fields.

    Declares four fields: ``title``, ``date``, ``praise_num`` and
    ``content``. Values are read and written with dict-style access,
    e.g. ``item["title"] = ...``.
    """

    # A Field accepts a value of any data type.
    title = scrapy.Field()
    date = scrapy.Field()
    praise_num = scrapy.Field()
    content = scrapy.Field()

 爬虫文件中引入item类

from Redbacktest.items import JobBoleArticleItem    #按需更改

实例化

    def parse_detail(self,response):
        """Build a JobBoleArticleItem for the given response.

        NOTE(review): the extraction of the field values from ``response``
        is not shown in this snippet -- presumably done elsewhere in the
        method body; confirm against the full spider.
        """
        # Start from an empty item; its fields are assigned afterwards.
        article_item = JobBoleArticleItem()

传值

        # Store each value under the item field of the same name.
        article_item["title"] = title
        article_item["date"] = date
        article_item['praise_num'] = praise_num
        article_item["content"] = content
       
        yield article_item  # hand the item over to the pipeline

 修改 settings.py 文件,启用 ITEM_PIPELINES 配置使 pipeline 生效

# Enabled item pipelines, mapping each pipeline's import path to its order
# value (per the Scrapy docs, lower values run first; customary range 0-1000).
ITEM_PIPELINES = {
    "Redbacktest.pipelines.RedbacktestPipeline": 300,
}

 pipeline调试

step6: item与pipeline

 

step6: item与pipeline

相关文章:

  • 2022-01-09
  • 2021-11-28
  • 2021-05-24
  • 2021-09-03
  • 2022-12-23
  • 2021-10-17
  • 2022-12-23
  • 2021-12-27
猜你喜欢
  • 2022-12-23
  • 2022-12-23
  • 2022-12-23
  • 2021-10-06
  • 2021-07-09
  • 2022-12-23
相关资源
相似解决方案