fetch page title during archiving process

This commit is contained in:
Nick Sweeting
2019-02-19 01:44:54 -05:00
parent bb5879a4f7
commit 5a7d00a639
5 changed files with 44 additions and 15 deletions

View File

@@ -57,7 +57,7 @@ def validate_links(links):
raise SystemExit(1)
for link in links:
-link['title'] = unescape(link['title'])
+link['title'] = unescape(link['title']) if link['title'] else None
link['latest'] = link.get('latest') or {}
latest = link['latest']
@@ -76,6 +76,9 @@ def validate_links(links):
if not latest.get('favicon'):
latest['favicon'] = None
+if not link['latest'].get('title'):
+link['latest']['title'] = link['title']
return list(links)
def new_links(all_links, existing_links):