Don't rescrape a story that already has text just because it is marked 'simple'.
This commit is contained in:
parent
ce9694b70c
commit
4e5dc65461
|
@ -134,9 +134,9 @@ def update_story(story, is_manual=False, urlref=None):
|
||||||
|
|
||||||
has_url = story.get('url') or False
|
has_url = story.get('url') or False
|
||||||
has_text = story.get('text') or False
|
has_text = story.get('text') or False
|
||||||
is_simple = story.get('scaper', '') == 'simple'
|
#is_simple = story.get('scaper', '') == 'simple'
|
||||||
|
|
||||||
if has_url and (not has_text or is_simple):
|
if has_url and not has_text:
|
||||||
if not get_content_type(story['url']).startswith('text/'):
|
if not get_content_type(story['url']).startswith('text/'):
|
||||||
logging.info('URL invalid file type / content type:')
|
logging.info('URL invalid file type / content type:')
|
||||||
logging.info(story['url'])
|
logging.info(story['url'])
|
||||||
|
|
|
@ -1 +1 @@
|
||||||
Subproject commit a51ea0e42391c8ab5e9b166754131bf3934cba40
|
Subproject commit 91c0a71ccd60bd2af7ce039d5159f3afa0cd3d64
|
Loading…
Reference in New Issue
Block a user