diff --git a/crawlab/routes/spiders.py b/crawlab/routes/spiders.py index 91ab8608..a0a902da 100644 --- a/crawlab/routes/spiders.py +++ b/crawlab/routes/spiders.py @@ -509,7 +509,7 @@ class SpiderApi(BaseApi): }, r.status_code # get html parse tree - sel = etree.HTML(r.content) + sel = etree.HTML(r.content.decode('utf-8')) # remove unnecessary tags unnecessary_tags = [