|
|
|
@ -17,10 +17,6 @@ if TYPE_CHECKING:
|
|
|
|
class CnkiCitedNumberSpider(scrapy.Spider):
|
|
|
|
class CnkiCitedNumberSpider(scrapy.Spider):
|
|
|
|
name = "cnki_cited_number"
|
|
|
|
name = "cnki_cited_number"
|
|
|
|
custom_settings = dict(
|
|
|
|
custom_settings = dict(
|
|
|
|
DEFAULT_REQUEST_HEADERS={
|
|
|
|
|
|
|
|
"Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8",
|
|
|
|
|
|
|
|
"Accept-Language": "en",
|
|
|
|
|
|
|
|
},
|
|
|
|
|
|
|
|
DOWNLOADER_MIDDLEWARES={
|
|
|
|
DOWNLOADER_MIDDLEWARES={
|
|
|
|
"science_article_cnki.middlewares.CnkiSearchHeadersDownloaderMiddleware": 540,
|
|
|
|
"science_article_cnki.middlewares.CnkiSearchHeadersDownloaderMiddleware": 540,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
@ -50,7 +46,8 @@ class CnkiCitedNumberSpider(scrapy.Spider):
|
|
|
|
query_body = model.adv_refine_search(**m)
|
|
|
|
query_body = model.adv_refine_search(**m)
|
|
|
|
search_param = model.adv_query_search(query_body, **m)
|
|
|
|
search_param = model.adv_query_search(query_body, **m)
|
|
|
|
yield scrapy.FormRequest(
|
|
|
|
yield scrapy.FormRequest(
|
|
|
|
url=config.CNKI_ADV_SEARCH_API, method="POST", formdata=search_param, meta=m
|
|
|
|
url=config.CNKI_ADV_SEARCH_API, method="POST",
|
|
|
|
|
|
|
|
formdata=search_param, meta=m
|
|
|
|
)
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
def parse(self, response, **kwargs):
|
|
|
|
def parse(self, response, **kwargs):
|
|
|
|
@ -84,7 +81,8 @@ class CnkiCitedNumberSpider(scrapy.Spider):
|
|
|
|
query_body = model.adv_refine_search(**meta_copy)
|
|
|
|
query_body = model.adv_refine_search(**meta_copy)
|
|
|
|
search_param = model.adv_query_search(query_body, **meta_copy)
|
|
|
|
search_param = model.adv_query_search(query_body, **meta_copy)
|
|
|
|
yield scrapy.FormRequest(
|
|
|
|
yield scrapy.FormRequest(
|
|
|
|
url=config.CNKI_ADV_SEARCH_API, method="POST", formdata=search_param,
|
|
|
|
url=config.CNKI_ADV_SEARCH_API, method="POST",
|
|
|
|
|
|
|
|
formdata=search_param,
|
|
|
|
meta=meta_copy
|
|
|
|
meta=meta_copy
|
|
|
|
)
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
|