From 33a6e74aa887c45f26511b577b5f62a4f3442213 Mon Sep 17 00:00:00 2001 From: Thomas Renger Date: Sat, 29 Feb 2020 16:13:13 +0100 Subject: [PATCH] Skip inactive bloggers Don't try to parse the feeds of bloggers with an "end:" date in the past. --- scan-feeds.py | 15 +++++++++++---- 1 file changed, 11 insertions(+), 4 deletions(-) diff --git a/scan-feeds.py b/scan-feeds.py index 644ea6d..2fef596 100755 --- a/scan-feeds.py +++ b/scan-feeds.py @@ -28,6 +28,7 @@ def parse_published(pub): return parse(pub).astimezone(tz.tzlocal()).replace(tzinfo=None) except: return parse(pub).replace(tzinfo=None) + def get_date(post): for k in ('published', 'created', 'updated'): if k in post: @@ -71,10 +72,16 @@ if len(sys.argv) > 1: parse_feeds(weeks, l[3]) else: for (username, u) in list(users.items()): - blogs = log.setdefault(username, {}) - for l in u['links']: - weeks = blogs.setdefault(l[0], []) - parse_feeds(weeks, l[3]) + print("User: ",u) + if 'end' in u: + enddate = datetime.datetime.strptime(u['end'],'%Y/%m/%d') + if enddate < datetime.datetime.now(): + print("User inactive") + continue + blogs = log.setdefault(username, {}) + for l in u['links']: + weeks = blogs.setdefault(l[0], []) + parse_feeds(weeks, l[3]) with open('out/report.yml', 'w') as f: yaml.safe_dump(log, f)