mirror of
https://github.com/Watchful1/PushshiftDumps.git
synced 2025-07-23 06:40:47 -04:00
Add recompress file test script
This commit is contained in:
parent
c9b0d5280e
commit
4e140e218b
3 changed files with 70 additions and 5 deletions
|
@@ -7,8 +7,10 @@ import zstandard
|
|||
import json
|
||||
|
||||
input_files = [
|
||||
r"\\MYCLOUDPR4100\Public\reddit\subreddits\collapse_comments.zst",
|
||||
r"\\MYCLOUDPR4100\Public\reddit\subreddits\Slovakia_comments.zst",
|
||||
r"\\MYCLOUDPR4100\Public\reddit\subreddits\PersonalFinanceCanada_comments.zst",
|
||||
r"\\MYCLOUDPR4100\Public\reddit\subreddits\hacking_comments.zst",
|
||||
r"\\MYCLOUDPR4100\Public\reddit\subreddits\alberta_comments.zst",
|
||||
r"\\MYCLOUDPR4100\Public\reddit\subreddits\GothGirls_comments.zst",
|
||||
]
|
||||
ignored_users = ['[deleted]', 'automoderator']
|
||||
min_comments_per_sub = 1
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue