Browse Source

fix fetch page title default

Nick Sweeting 7 years ago
parent
commit
d35c6cf8b5
1 changed file with 7 additions and 3 deletions
  1. 7 3
      archivebox/util.py

+ 7 - 3
archivebox/util.py

@@ -212,15 +212,19 @@ def download_url(url):
     return source_path
 
 
-def fetch_page_title(url, default=None):
+def fetch_page_title(url, default=True):
     """Attempt to guess a page's title by downloading the html"""
-    
+    if default is True:
+        default = url
+
     try:
         html_content = urllib.request.urlopen(url).read().decode('utf-8')
 
         match = re.search('<title>(.*?)</title>', html_content)
-        return match.group(1) if match else default
+        return match.group(1) if match else default or None
     except Exception:
+        if default is False:
+            raise
         return default