From bda7a4c8d64bd4baef57bb4f4c112abce08f1cde Mon Sep 17 00:00:00 2001
From: Watchful1
Date: Fri, 21 Jun 2024 10:12:09 -0700
Subject: [PATCH] Print the full file name when it doesn't exist

---
 scripts/find_overlapping_users.py | 13 +++----------
 1 file changed, 3 insertions(+), 10 deletions(-)

diff --git a/scripts/find_overlapping_users.py b/scripts/find_overlapping_users.py
index efd8b03..d0e6803 100644
--- a/scripts/find_overlapping_users.py
+++ b/scripts/find_overlapping_users.py
@@ -14,15 +14,8 @@ import json
 # the script will look for both comments and submissions files for each subreddit
 folder = r"\\MYCLOUDPR4100\Public\reddit\subreddits23"
 subreddits = [
-	"aquarium",
-	"opiates",
-	"axolotls",
-	"piercing",
-	"titanfolk",
-	"AskOuija",
-	"piercing",
-	"DPH",
-	"dxm",
+	"JEENEETards",
+	"TwoXIndia",
 ]
 ignored_users = {'[deleted]', 'automoderator'}
 # this is a list of users to ignore when doing the comparison. Most popular bots post in many subreddits and aren't the person you're looking for
@@ -128,7 +121,7 @@ if __name__ == "__main__":
 		for file_type in ["submissions", "comments"]:
 			subreddit_file = os.path.join(folder, f"{subreddit}_{file_type}.zst")
 			if not os.path.exists(subreddit_file):
-				log.info(f"{file_type} for {subreddit} does not exist, skipping")
+				log.info(f"{file_type} for {subreddit} does not exist, skipping: {subreddit_file}")
 				continue
 			subreddit_exists = True
 			total_lines = get_commenters_from_file(subreddit_file, commenters, total_lines)