mirror of
https://github.com/Watchful1/PushshiftDumps.git
synced 2025-07-25 07:35:24 -04:00
Rename merge, add build_month.py
This commit is contained in:
parent
2f3c3c8f88
commit
aa4cc85334
5 changed files with 347 additions and 1 deletions
30
personal/move/rename_files.py
Normal file
30
personal/move/rename_files.py
Normal file
|
@ -0,0 +1,30 @@
|
|||
import os
|
||||
import discord_logging
|
||||
import re
|
||||
from datetime import datetime
|
||||
|
||||
# Shared logger for this script; progress is reported through log.info below.
log = discord_logging.init_logging()
|
||||
|
||||
|
||||
if __name__ == "__main__":
    # One-off maintenance script: for every ".zst" file found exactly one
    # directory level below parent_folder, replace "RC_" with "RS_" in the
    # file name and rename the file in place.
    parent_folder = r"\\MYCLOUDPR4100\Public\ingest\combined\submissions"

    # Collect (folder, file name) pairs first so that no directory is being
    # listed while its contents are renamed.
    files = []
    for folder_name in os.listdir(parent_folder):
        folder = os.path.join(parent_folder, folder_name)
        if not os.path.isdir(folder):
            # A stray file sitting next to the sub-folders would make
            # os.listdir(folder) raise and abort the whole run.
            continue
        for file in os.listdir(folder):
            if file.endswith(".zst"):
                files.append((folder, file))
    log.info(f"{parent_folder}: {len(files):,}")

    count_moved = 0
    for folder, old_file in files:
        old_path = os.path.join(folder, old_file)
        # str.replace swaps every "RC_" occurrence in the name; a name without
        # "RC_" is left unchanged, so the rename targets its own path.
        new_file = old_file.replace("RC_", "RS_")
        new_path = os.path.join(folder, new_file)

        os.rename(old_path, new_path)
        count_moved += 1
        # Emit a progress line every 100 files.
        if count_moved % 100 == 0:
            log.info(f"{count_moved:,}/{len(files):,}: {folder}")
    log.info(f"{count_moved:,}/{len(files):,}")
|
Loading…
Add table
Add a link
Reference in a new issue