mirror of
https://github.com/crawlab-team/crawlab.git
synced 2026-01-22 17:31:03 +01:00
Added automatic field extraction functionality
This commit is contained in:
@@ -523,7 +523,7 @@ class SpiderApi(BaseApi):
|
||||
tags = []
|
||||
for tag in sel.iter():
|
||||
if tag.tag == 'a':
|
||||
if not tag.get('href').startswith('#') and not tag.get('href').startswith('javascript'):
|
||||
if tag.get('href') is not None and not tag.get('href').startswith('#') and not tag.get('href').startswith('javascript'):
|
||||
tags.append(tag)
|
||||
|
||||
return tags
|
||||
|
||||
Reference in New Issue
Block a user