From a6921cc7bcfc867daf512ff0dfb56959b1969fc9 Mon Sep 17 00:00:00 2001 From: Remi Rampin Date: Thu, 20 Jul 2017 10:13:22 -0400 Subject: [PATCH 1/2] Add print statements to import_feed.py --- import_feed.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/import_feed.py b/import_feed.py index 2affb46..fcebd2a 100755 --- a/import_feed.py +++ b/import_feed.py @@ -15,7 +15,11 @@ def main(): req = requests.get('https://share.osf.io/api/v2/atom/?elasticQuery=%7B%22bool%22%3A%7B%22must%22%3A%7B%22query_string%22%3A%7B%22query%22%3A%22*%22%7D%7D%2C%22filter%22%3A%5B%7B%22term%22%3A%7B%22sources%22%3A%22LIS%20Scholarship%20Archive%22%7D%7D%2C%7B%22term%22%3A%7B%22types%22%3A%22preprint%22%7D%7D%5D%7D%7D') feed = feedparser.parse(req.content) + print("Downloaded feed, %d entries" % len(feed['entries'])) + for d in feed['entries']: + print("Title: %s" % d['title'].strip()) + # Generate file name url = urlparse(d['link']).path @@ -23,11 +27,13 @@ def main(): while non_slug_chars.match(slug[0]): slug = slug[1:] slug = non_slug_chars.sub('_', slug) + print("Filename: %s" % slug) file_name = 'scholarship/%s.html' % slug # Parse date date = dateutil.parser.parse(d['date']) + print("Date: %s" % date.strftime('%Y-%m-%d %H:%M:%S')) # Open output file with io.open(file_name, 'w', encoding='utf-8') as fp: @@ -50,6 +56,8 @@ def main(): link=d['link'].strip(), text=d['summary'].strip())) + print() + if __name__ == '__main__': main() From 2468abd1b721a9b9e2ea8a657712ced98decd12d Mon Sep 17 00:00:00 2001 From: Remi Rampin Date: Thu, 20 Jul 2017 10:13:34 -0400 Subject: [PATCH 2/2] Read published date from feed instead of updated --- import_feed.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/import_feed.py b/import_feed.py index fcebd2a..e46c3c3 100755 --- a/import_feed.py +++ b/import_feed.py @@ -32,7 +32,7 @@ def main(): file_name = 'scholarship/%s.html' % slug # Parse date - date = dateutil.parser.parse(d['date']) + date = dateutil.parser.parse(d['published']) print("Date: %s" % date.strftime('%Y-%m-%d %H:%M:%S')) # Open output file