Remove get first image
This commit is contained in:
parent
850b30e353
commit
f1c846acd0
|
@ -56,19 +56,6 @@ def get_article(url):
|
||||||
logging.error('Problem getting article: {}'.format(str(e)))
|
logging.error('Problem getting article: {}'.format(str(e)))
|
||||||
return ''
|
return ''
|
||||||
|
|
||||||
def get_first_image(text):
|
|
||||||
soup = BeautifulSoup(text, features='html.parser')
|
|
||||||
|
|
||||||
try:
|
|
||||||
first_img = soup.find('img')
|
|
||||||
url = first_img['src']
|
|
||||||
headers = {'User-Agent': 'Twitterbot/1.0'}
|
|
||||||
length = requests.get(url, headers=headers, timeout=4).headers['content-length']
|
|
||||||
if int(length) > 1000000: raise
|
|
||||||
return url
|
|
||||||
except:
|
|
||||||
return ''
|
|
||||||
|
|
||||||
def get_content_type(url):
|
def get_content_type(url):
|
||||||
try:
|
try:
|
||||||
headers = {'User-Agent': 'Twitterbot/1.0'}
|
headers = {'User-Agent': 'Twitterbot/1.0'}
|
||||||
|
@ -130,8 +117,6 @@ def update_story(story, is_manual=False):
|
||||||
story['text'] = get_article(story['url'])
|
story['text'] = get_article(story['url'])
|
||||||
if not story['text']: return False
|
if not story['text']: return False
|
||||||
|
|
||||||
story['img'] = get_first_image(story['text'])
|
|
||||||
|
|
||||||
return True
|
return True
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
|
@ -147,7 +132,5 @@ if __name__ == '__main__':
|
||||||
|
|
||||||
a = get_article('https://blog.joinmastodon.org/2019/10/mastodon-3.0/')
|
a = get_article('https://blog.joinmastodon.org/2019/10/mastodon-3.0/')
|
||||||
print(a)
|
print(a)
|
||||||
u = get_first_image(a)
|
|
||||||
print(u)
|
|
||||||
|
|
||||||
print('done')
|
print('done')
|
||||||
|
|
Loading…
Reference in New Issue
Block a user