mirror of
https://github.com/Watchful1/PushshiftDumps.git
synced 2025-07-24 15:15:24 -04:00
ad_supplementary_text_md
This commit is contained in:
parent
5405b8dc0d
commit
48906daaea
3 changed files with 3 additions and 3 deletions
|
@ -239,7 +239,7 @@ class ObjectDict:
|
|||
if minute_dict is None:
|
||||
range_string = ""
|
||||
else:
|
||||
range_string = f" - {len(minute_dict.obj_list)} ({minute_dict.max_id - minute_dict.min_id}) ({utils.base36encode(minute_dict.min_id)}-{utils.base36encode(minute_dict.max_id)})"
|
||||
range_string = f" - {len(minute_dict.obj_list)}({minute_dict.max_id - minute_dict.min_id}) ({utils.base36encode(minute_dict.min_id)}-{utils.base36encode(minute_dict.max_id)})"
|
||||
return count_string + range_string
|
||||
|
||||
def get_counts_string(self):
|
||||
|
|
|
@ -116,7 +116,7 @@ field_actions = {
|
|||
},
|
||||
ObjectType.SUBMISSION: {
|
||||
"ad_promoted_user_posts": FieldAction.OVERWRITE_NOT_NONE,
|
||||
"ad_supplementary_text_md": FieldAction.ALLOW,
|
||||
"ad_supplementary_text_md": FieldAction.OVERWRITE_NOT_NONE,
|
||||
"adserver_click_url": FieldAction.ALLOW_EMPTY,
|
||||
"adserver_imp_pixel": FieldAction.ALLOW_EMPTY,
|
||||
"all_awardings": FieldAction.OVERWRITE_NOT_NONE,
|
||||
|
|
|
@ -12,7 +12,7 @@ NEWLINE_ENCODED = "\n".encode('utf-8')
|
|||
|
||||
|
||||
if __name__ == "__main__":
|
||||
input_file = r"\\MYCLOUDPR4100\Public\RC_2023-05.zst"
|
||||
input_file = r"\\MYCLOUDPR4100\Public\RC_2023-06.zst"
|
||||
output_folder = r"\\MYCLOUDPR4100\Public\ingest\download"
|
||||
file_type = "comments" if "RC" in input_file else "submissions"
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue