mirror of
https://github.com/ArchiveBox/ArchiveBox.git
synced 2025-05-13 14:44:29 -04:00
add timeout to title fetching
This commit is contained in:
parent
e1be96e597
commit
db0461ec4e
1 changed file with 1 addition and 1 deletion
|
@@ -234,7 +234,7 @@ def fetch_page_title(url, default=True):
|
|||
default = url
|
||||
|
||||
try:
|
||||
- html_content = urllib.request.urlopen(url).read().decode('utf-8')
|
||||
+ html_content = urllib.request.urlopen(url, timeout=10).read().decode('utf-8')
|
||||
|
||||
match = re.search('<title>(.*?)</title>', html_content)
|
||||
return match.group(1) if match else default or None
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue