You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
69 lines
1.4 KiB
Python
69 lines
1.4 KiB
Python
# Define here the models for your scraped items
|
|
#
|
|
# See documentation in:
|
|
# https://docs.scrapy.org/en/latest/topics/items.html
|
|
|
|
import scrapy
|
|
|
|
|
|
class ScienceArticlCnkiItem(scrapy.Item):
    """Item class that declares no fields.

    NOTE(review): this looks like the untouched stub that ships with a new
    Scrapy project; confirm whether anything still imports it.
    """
|
|
|
|
|
|
class AddItemBase(scrapy.Item):
    """Common base item declaring the ``third_id`` and ``updated_at`` fields.

    Other item classes in this module inherit from it to pick up both fields.
    """

    # Presumably the record identifier on the third-party (CNKI) side --
    # TODO confirm against the spiders that populate it.
    third_id = scrapy.Field()
    # Presumably the time the record was last refreshed -- TODO confirm.
    updated_at = scrapy.Field()
|
|
|
|
|
|
class ArticleItem(AddItemBase):
    """Article-level base item: the ``AddItemBase`` fields plus ``exported``."""

    # NOTE(review): name suggests an "already exported" marker; verify the
    # expected value type with the code that reads it.
    exported = scrapy.Field()
|
|
|
|
|
|
class CnkiArticleItem(ArticleItem):
    """CNKI article item."""

    # Table name attached to the item class; presumably consumed by a storage
    # pipeline elsewhere in the project -- TODO confirm.
    __tablename__ = 'data_cnki_article'

    # The three fields below are also declared on the parent classes
    # (ArticleItem / AddItemBase); they are re-declared here explicitly.
    third_id = scrapy.Field()
    exported = scrapy.Field()
    updated_at = scrapy.Field()
|
|
|
|
|
|
class CnkiIdRelationItem(AddItemBase):
    """Item tagged with the ``relation_school_cnki`` table name.

    Adds ``query_ids``, ``school_ids``, ``task_ids`` and ``year`` on top of
    the fields inherited from ``AddItemBase``.
    """

    # Presumably consumed by a storage pipeline to choose the destination
    # table -- TODO confirm.
    __tablename__ = 'relation_school_cnki'

    # NOTE(review): the plural names suggest collections of ids; verify the
    # actual value types with the spider that fills them.
    query_ids = scrapy.Field()
    school_ids = scrapy.Field()
    task_ids = scrapy.Field()
    year = scrapy.Field()
|
|
|
|
|
|
class CnkiArticleTodoIdItem(scrapy.Item):
    """Item tagged with the ``todo_ids_cnki`` table name.

    Derives directly from ``scrapy.Item`` (not from ``AddItemBase``), so it
    declares ``third_id`` itself and has no ``updated_at`` field.
    """

    # Presumably consumed by a storage pipeline to choose the destination
    # table -- TODO confirm.
    __tablename__ = 'todo_ids_cnki'

    third_id = scrapy.Field()
    db_code = scrapy.Field()
    state = scrapy.Field()
    # NOTE(review): `ti` and `v` are opaque abbreviations; their meaning is
    # not visible in this module -- document once confirmed.
    ti = scrapy.Field()
    v = scrapy.Field()
|
|
|
|
|
|
class ArticleCitedItem(AddItemBase):
    """Base item for citation data: the ``AddItemBase`` fields plus ``cited``."""

    # NOTE(review): presumably a citation count; verify with the populating
    # spider.
    cited = scrapy.Field()
|
|
|
|
|
|
class CnkiCitedNumberItem(ArticleCitedItem):
    """Item for the citation count of a published CNKI article."""

    # The docstring above must be the first statement in the class body;
    # placed after ``__tablename__`` it was a discarded string expression and
    # ``__doc__`` was never populated.

    # Presumably consumed by a storage pipeline to choose the destination
    # table -- TODO confirm.
    __tablename__ = 'relation_cited_number_cnki'

    # The three fields below are also declared on the parent classes
    # (ArticleCitedItem / AddItemBase); they are re-declared here explicitly.
    third_id = scrapy.Field()
    cited = scrapy.Field()
    updated_at = scrapy.Field()
|
|
|
|
|
|
class CnkiArticeSourceItem(scrapy.Item):
    """Item tagged with the ``relation_sourcetype_cnki`` table name.

    Declares ``third_id`` and ``source_types``.
    """

    # Presumably consumed by a storage pipeline to choose the destination
    # table -- TODO confirm.
    __tablename__ = 'relation_sourcetype_cnki'

    third_id = scrapy.Field()
    # NOTE(review): the plural name suggests a collection of source types;
    # verify the value type with the populating spider.
    source_types = scrapy.Field()
|