mirror of
https://gitlab.com/jeancf/twoot.git
synced 2024-11-23 20:11:11 +00:00
Added tolerance for ConnectionError when visiting linked page to extract picture
This commit is contained in:
parent
1b1faf2d59
commit
1ec03c7d81
15
twoot.py
15
twoot.py
|
@@ -219,12 +219,15 @@ def main(argv):
|
|||
m = re.search(r"http[^ \n\xa0]*", tweet_text)
|
||||
if m is not None:
|
||||
link_url = m.group(0)
|
||||
r = requests.get(link_url)
|
||||
if r.status_code == 200:
|
||||
# Matches the first instance of either twitter:image or twitter:image:src meta tag
|
||||
match = re.search(r'<meta name="twitter:image(?:|:src)" content="(.+?)".*?>', r.text)
|
||||
if match is not None:
|
||||
photos.append(match.group(1))
|
||||
try:
|
||||
r = requests.get(link_url)
|
||||
if r.status_code == 200:
|
||||
# Matches the first instance of either twitter:image or twitter:image:src meta tag
|
||||
match = re.search(r'<meta name="twitter:image(?:|:src)" content="(.+?)".*?>', r.text)
|
||||
if match is not None:
|
||||
photos.append(match.group(1))
|
||||
except ConnectionError:
|
||||
pass
|
||||
|
||||
# Add dictionary with content of tweet to list
|
||||
tweet = {
|
||||
|
|
Loading…
Reference in New Issue
Block a user