1
0
Fork 0
mirror of synced 2024-06-24 17:10:21 +12:00

fix pinboard RSS parser

This commit is contained in:
Nick Sweeting 2019-03-19 18:44:22 -04:00
parent 61ec4971e9
commit f9a7c530b9
2 changed files with 5 additions and 5 deletions

View file

@@ -228,9 +228,9 @@ def parse_pinboard_rss_export(rss_file):
items = root.findall("{http://purl.org/rss/1.0/}item")
for item in items:
url = item.find("{http://purl.org/rss/1.0/}link").text
tags = item.find("{http://purl.org/dc/elements/1.1/}subject").text
title = item.find("{http://purl.org/rss/1.0/}title").text.strip()
ts_str = item.find("{http://purl.org/dc/elements/1.1/}date").text
tags = item.find("{http://purl.org/dc/elements/1.1/}subject").text if item.find("{http://purl.org/dc/elements/1.1/}subject") else None
title = item.find("{http://purl.org/rss/1.0/}title").text.strip() if item.find("{http://purl.org/rss/1.0/}title").text.strip() else None
ts_str = item.find("{http://purl.org/dc/elements/1.1/}date").text if item.find("{http://purl.org/dc/elements/1.1/}date").text else None
# = 🌈🌈🌈🌈
# = 🌈🌈🌈🌈
# = 🏆🏆🏆🏆
@@ -243,7 +243,7 @@ def parse_pinboard_rss_export(rss_file):
info = {
'url': url,
'timestamp': str(time.timestamp()),
'tags': tags,
'tags': tags or '',
'title': title or None,
'sources': [rss_file.name],
}

View file

@@ -413,7 +413,7 @@ def derived_link_info(link):
'is_archived': os.path.exists(os.path.join(
ARCHIVE_DIR,
link['timestamp'],
wget_output_path(link) or domain(url)
domain(url),
)),
'num_outputs': len([entry for entry in link['latest'].values() if entry]) if 'latest' in link else 0,
}