From 6114afb53f336c1ddf335becde7ea74d26b77423 Mon Sep 17 00:00:00 2001
From: Watchful1
Date: Sun, 7 Jan 2024 10:45:51 -0800
Subject: [PATCH] Fix last month of year

---
Reviewer notes (this section is not part of the commit message):

* build_month.py: `month` is a datetime (it is used with .replace(), .month,
  .year and, via minute_iterator, .strftime()), so the December check must
  test `month.month == 12`. Comparing the datetime itself to 12 is always
  False, which sends December to the else branch and raises ValueError from
  replace(month=13).
* The blob id on the build_month.py `index` line predates this correction.
* Whitespace was reconstructed: indentation inside the hunks is assumed to be
  tabs -- TODO confirm against the target files before applying.

 personal/combine/build_month.py         | 5 ++++-
 personal/diagnostic/comments_per_day.py | 4 ++--
 scripts/find_overlapping_users.py       | 6 ++----
 3 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/personal/combine/build_month.py b/personal/combine/build_month.py
index 663183d..88f005d 100644
--- a/personal/combine/build_month.py
+++ b/personal/combine/build_month.py
@@ -60,7 +60,10 @@ if __name__ == "__main__":
 	total_objects = 0
 	total_bytes = 0
 	minute_iterator = month
-	end_time = month.replace(month=month.month + 1)
+	if month.month == 12:
+		end_time = month.replace(year=month.year + 1, month=1)
+	else:
+		end_time = month.replace(month=month.month + 1)
 	while minute_iterator < end_time:
 		minute_file_path = os.path.join(args.input, args.type, minute_iterator.strftime('%y-%m-%d'), f"{prefix}_{minute_iterator.strftime('%y-%m-%d_%H-%M')}.zst")
 		for obj, line, _ in utils.read_obj_zst_meta(minute_file_path):
diff --git a/personal/diagnostic/comments_per_day.py b/personal/diagnostic/comments_per_day.py
index 797ba07..e07eee5 100644
--- a/personal/diagnostic/comments_per_day.py
+++ b/personal/diagnostic/comments_per_day.py
@@ -8,8 +8,8 @@ log = discord_logging.init_logging()
 if __name__ == "__main__":
 	day = None
 	day_comments = 0
-	for comment in utils.read_obj_zst(r"\\MYCLOUDPR4100\Public\reddit_final\wallstreetbets_comments.zst"):
-		created_day = datetime.utcfromtimestamp(int(comment['created_utc'])).strftime("%m/%d/%y")
+	for comment in utils.read_obj_zst(r"C:\Users\greg\Desktop\Drive\pushshift\haley0530\chatbots_submissions.zst"):
+		created_day = datetime.utcfromtimestamp(int(comment['created_utc'])).strftime("%y-%m-%d")
 		if day is None:
 			day = created_day
 		if day != created_day:
diff --git a/scripts/find_overlapping_users.py b/scripts/find_overlapping_users.py
index 5099557..5e472da 100644
--- a/scripts/find_overlapping_users.py
+++ b/scripts/find_overlapping_users.py
@@ -7,10 +7,8 @@ import zstandard
 import json
 
 input_files = [
-	r"\\MYCLOUDPR4100\Public\reddit\subreddits\PersonalFinanceCanada_comments.zst",
-	r"\\MYCLOUDPR4100\Public\reddit\subreddits\hacking_comments.zst",
-	r"\\MYCLOUDPR4100\Public\reddit\subreddits\alberta_comments.zst",
-	r"\\MYCLOUDPR4100\Public\reddit\subreddits\GothGirls_comments.zst",
+	r"\\MYCLOUDPR4100\Public\reddit\subreddits\srilanka_comments.zst",
+	r"\\MYCLOUDPR4100\Public\reddit\subreddits\Warthunder_comments.zst",
 ]
 ignored_users = ['[deleted]', 'automoderator']
 min_comments_per_sub = 1