diff --git a/personal/diagnostic/count_subreddits_multiprocess.py b/personal/diagnostic/count_subreddits_multiprocess.py index dacd313..0a1e6ef 100644 --- a/personal/diagnostic/count_subreddits_multiprocess.py +++ b/personal/diagnostic/count_subreddits_multiprocess.py @@ -238,7 +238,7 @@ if __name__ == '__main__': # start the workers with multiprocessing.Pool(processes=min(args.processes, len(files_to_process))) as pool: workers = pool.starmap_async(process_file, [(file, queue, args.field) for file in files_to_process], chunksize=1, error_callback=log.info) - while not workers.ready(): + while not workers.ready() or not queue.empty(): # loop until the workers are all done, pulling in status messages as they are sent file_update = queue.get() if file_update.error_message is not None: diff --git a/personal/diagnostic/test_file.py b/personal/diagnostic/test_file.py index dfcb42e..21c546a 100644 --- a/personal/diagnostic/test_file.py +++ b/personal/diagnostic/test_file.py @@ -8,7 +8,7 @@ log = discord_logging.init_logging() if __name__ == "__main__": - input_path = r"\\MYCLOUDPR4100\Public\reddit\submissions\RS_2025-05.zst" + input_path = r"\\MYCLOUDPR4100\Public\reddit\comments\RC_2025-06.zst" input_file_paths = [] if os.path.isdir(input_path):