From 1697e719ea4d10591dd2b0e199bdf19d738b815f Mon Sep 17 00:00:00 2001 From: Marvin Zhang Date: Thu, 6 Jun 2019 17:24:00 +0800 Subject: [PATCH] updated spiders --- crawlab/routes/spiders.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crawlab/routes/spiders.py b/crawlab/routes/spiders.py index 91ab8608..a0a902da 100644 --- a/crawlab/routes/spiders.py +++ b/crawlab/routes/spiders.py @@ -509,7 +509,7 @@ class SpiderApi(BaseApi): }, r.status_code # get html parse tree - sel = etree.HTML(r.content) + sel = etree.HTML(r.content.decode('utf-8')) # remove unnecessary tags unnecessary_tags = [