From f3f7696f44fd69f8b1b497e56a560b1cbb0fc97f Mon Sep 17 00:00:00 2001 From: "Moore.Huang" Date: Sun, 17 Jun 2018 11:27:09 +0800 Subject: [PATCH] =?UTF-8?q?Feature:=20=E4=B8=BAspider=5Fpost=E4=BB=BB?= =?UTF-8?q?=E5=8A=A1=E5=A2=9E=E5=8A=A0=E8=B0=83=E7=94=A8=E7=88=AC=E8=99=AB?= =?UTF-8?q?=E7=9A=84=E5=AE=9A=E5=88=B6=E4=BC=A0=E5=8F=82=E6=94=AF=E6=8C=81?= =?UTF-8?q?=EF=BC=8C=E4=BE=BF=E4=BA=8E=E5=90=8E=E5=8F=B0=E7=AE=A1=E7=90=86?= =?UTF-8?q?=E6=97=B6=E7=88=AC=E5=8F=96=E6=8C=87=E5=AE=9A=E6=97=A5=E6=9C=9F?= =?UTF-8?q?=E7=9A=84=E6=96=87=E7=AB=A0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- server/spiders/admin.py | 2 +- server/spiders/tasks.py | 10 ++++++---- 2 files changed, 7 insertions(+), 5 deletions(-) diff --git a/server/spiders/admin.py b/server/spiders/admin.py index f590bdd..37e7b90 100644 --- a/server/spiders/admin.py +++ b/server/spiders/admin.py @@ -25,7 +25,7 @@ def action_spider_post(self, request, queryset): c = (group( tasks.spider_post.s(spider.name) for spider in queryset )) - c.delay() + c.delay() # 测试时指定爬取日期: date='20180530' self.message_user( request, _('共触发 {num} 个爬虫源').format( diff --git a/server/spiders/tasks.py b/server/spiders/tasks.py index 4c2264f..f36b1db 100644 --- a/server/spiders/tasks.py +++ b/server/spiders/tasks.py @@ -13,7 +13,7 @@ @shared_task -def spider_post(spider_name): +def spider_post(spider_name, **kwargs): """ 爬取文章数据 """ @@ -24,14 +24,16 @@ def spider_post(spider_name): invoke_on_load=True, ) - def crawl(ext, *args): - rc = ext.obj.crawl() # 测试时指定爬取日期: date='20180507' + def crawl(ext, **kwargs): + log.info('[{name}]调用爬虫传参: {kwargs}'.format( + name=ext.name, kwargs=kwargs)) + rc = ext.obj.crawl(**kwargs) data = json.dumps(rc, ensure_ascii=False) log.debug('[{name}]爬取返回包:{pack}'.format( name=ext.name, pack=data)) return (ext.name, rc) - results = mgr.map(crawl) + results = mgr.map(crawl, **kwargs) log.debug('结果对象:{results}'.format( results=results))