mirror of
https://github.com/Watchful1/PushshiftDumps.git
synced 2025-07-25 07:35:24 -04:00
rte_mode
This commit is contained in:
parent
1dfdea9458
commit
2f3c3c8f88
3 changed files with 4 additions and 2 deletions
|
@ -188,7 +188,8 @@ def build_day(day_to_process, input_folders, output_folder, object_type, reddit)
|
|||
|
||||
discord_logging.flush_discord()
|
||||
if unmatched_field:
|
||||
log.info(f"Unmatched field, aborting")
|
||||
log.warning(f"Unmatched field, aborting")
|
||||
discord_logging.flush_discord()
|
||||
sys.exit(1)
|
||||
|
||||
minute_iterator += timedelta(minutes=1)
|
||||
|
|
|
@ -93,6 +93,7 @@ field_actions = {
|
|||
"report_reasons": FieldAction.SPECIAL_NO_OVERWRITE,
|
||||
"retrieved_on": FieldAction.SPECIAL,
|
||||
"retrieved_utc": FieldAction.SPECIAL,
|
||||
"rte_mode": FieldAction.OVERWRITE_NOT_NONE,
|
||||
"saved": FieldAction.SPECIAL_NO_OVERWRITE,
|
||||
"score": FieldAction.OVERWRITE_NOT_NONE,
|
||||
"score_hidden": FieldAction.OVERWRITE,
|
||||
|
|
|
@ -12,7 +12,7 @@ NEWLINE_ENCODED = "\n".encode('utf-8')
|
|||
|
||||
|
||||
if __name__ == "__main__":
|
||||
input_file = r"\\MYCLOUDPR4100\Public\RC_2023-06.zst"
|
||||
input_file = r"\\MYCLOUDPR4100\Public\RC_2023-08.zst"
|
||||
output_folder = r"\\MYCLOUDPR4100\Public\ingest\download"
|
||||
file_type = "comments" if "RC" in input_file else "submissions"
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue