mirror of
https://github.com/Watchful1/PushshiftDumps.git
synced 2025-07-25 15:45:19 -04:00
ad_supplementary_text_md
This commit is contained in:
parent
5405b8dc0d
commit
48906daaea
3 changed files with 3 additions and 3 deletions
|
@ -239,7 +239,7 @@ class ObjectDict:
|
||||||
if minute_dict is None:
|
if minute_dict is None:
|
||||||
range_string = ""
|
range_string = ""
|
||||||
else:
|
else:
|
||||||
range_string = f" - {len(minute_dict.obj_list)} ({minute_dict.max_id - minute_dict.min_id}) ({utils.base36encode(minute_dict.min_id)}-{utils.base36encode(minute_dict.max_id)})"
|
range_string = f" - {len(minute_dict.obj_list)}({minute_dict.max_id - minute_dict.min_id}) ({utils.base36encode(minute_dict.min_id)}-{utils.base36encode(minute_dict.max_id)})"
|
||||||
return count_string + range_string
|
return count_string + range_string
|
||||||
|
|
||||||
def get_counts_string(self):
|
def get_counts_string(self):
|
||||||
|
|
|
@ -116,7 +116,7 @@ field_actions = {
|
||||||
},
|
},
|
||||||
ObjectType.SUBMISSION: {
|
ObjectType.SUBMISSION: {
|
||||||
"ad_promoted_user_posts": FieldAction.OVERWRITE_NOT_NONE,
|
"ad_promoted_user_posts": FieldAction.OVERWRITE_NOT_NONE,
|
||||||
"ad_supplementary_text_md": FieldAction.ALLOW,
|
"ad_supplementary_text_md": FieldAction.OVERWRITE_NOT_NONE,
|
||||||
"adserver_click_url": FieldAction.ALLOW_EMPTY,
|
"adserver_click_url": FieldAction.ALLOW_EMPTY,
|
||||||
"adserver_imp_pixel": FieldAction.ALLOW_EMPTY,
|
"adserver_imp_pixel": FieldAction.ALLOW_EMPTY,
|
||||||
"all_awardings": FieldAction.OVERWRITE_NOT_NONE,
|
"all_awardings": FieldAction.OVERWRITE_NOT_NONE,
|
||||||
|
|
|
@ -12,7 +12,7 @@ NEWLINE_ENCODED = "\n".encode('utf-8')
|
||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
input_file = r"\\MYCLOUDPR4100\Public\RC_2023-05.zst"
|
input_file = r"\\MYCLOUDPR4100\Public\RC_2023-06.zst"
|
||||||
output_folder = r"\\MYCLOUDPR4100\Public\ingest\download"
|
output_folder = r"\\MYCLOUDPR4100\Public\ingest\download"
|
||||||
file_type = "comments" if "RC" in input_file else "submissions"
|
file_type = "comments" if "RC" in input_file else "submissions"
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue