From 78c1814a60f4ffdfcbc57293c92ac1a386035d1e Mon Sep 17 00:00:00 2001 From: Watchful1 Date: Mon, 21 Aug 2023 21:45:58 -0700 Subject: [PATCH] Support empty filter --- scripts/filter_file.py | 29 +++++++++++++++-------------- 1 file changed, 15 insertions(+), 14 deletions(-) diff --git a/scripts/filter_file.py b/scripts/filter_file.py index c330e04..0c49073 100644 --- a/scripts/filter_file.py +++ b/scripts/filter_file.py @@ -7,7 +7,7 @@ from datetime import datetime import logging.handlers # put the path to the input file -input_file = r"\\MYCLOUDPR4100\Public\reddit\submissions\RS_2023-02.zst" +input_file = r"\\MYCLOUDPR4100\Public\reddit\subreddits\redditdev_submissions.zst" # put the name or path to the output file. The file extension from below will be added automatically output_file = r"\\MYCLOUDPR4100\Public\output" # the format to output in, pick from the following options @@ -233,19 +233,20 @@ if __name__ == "__main__": if created > to_date: continue - field_value = obj[field].lower() - matched = False - for value in values: - if exact_match: - if value == field_value: - matched = True - break - else: - if value in field_value: - matched = True - break - if not matched: - continue + if field is not None: + field_value = obj[field].lower() + matched = False + for value in values: + if exact_match: + if value == field_value: + matched = True + break + else: + if value in field_value: + matched = True + break + if not matched: + continue matched_lines += 1 if output_format == "zst":