wos:用科学平台的wos_raw_data当去重库

main
zhaoxiangpeng 3 weeks ago
parent 1bf0703dba
commit 9e0f6b8b55

@@ -195,7 +195,7 @@ class DupTodoBySciencePipeline(DupTodoPipeline):
settings = spider.settings
dup_uri = settings.get("MONGO_URI_SCIENCE")
cli = MongoClient(dup_uri)
-dup_db = cli.get_database("MONGO_DATABASE_SCIENCE")
+dup_db = cli.get_database(settings.get("MONGO_DATABASE_SCIENCE"))
self.dup_collection = dup_db.get_collection('wos_raw_data')
def is_exists(self, item, filter_key) -> bool:

Loading…
Cancel
Save