items.py 677 B

123456789101112131415161718192021222324252627
  1. # -*- coding: utf-8 -*-
  2. # Define here the models for your scraped items
  3. #
  4. # See documentation in:
  5. # https://docs.scrapy.org/en/latest/topics/items.html
  6. import scrapy
  7. class SpidernoticesItem(scrapy.Item):
  8. # define the fields for your item here like:
  9. # name = scrapy.Field()
  10. pass
  11. class NoticeItem(scrapy.Item):
  12. code = scrapy.Field() # 证券代码xxxxxx六位数字
  13. ann_date = scrapy.Field() # 公告日期
  14. ann_title = scrapy.Field()
  15. ann_type = scrapy.Field()
  16. href = scrapy.Field()
  17. href_md5 = scrapy.Field()
  18. content = scrapy.Field()
  19. content_source = scrapy.Field() # 公告内容来源,0 空,1 网页text, 2 pdf解析