mirror of
https://github.com/Watchful1/PushshiftDumps.git
synced 2025-07-26 16:15:37 -04:00
Reorganize
This commit is contained in:
parent
3700b21b81
commit
4f1d70d34a
19 changed files with 0 additions and 105 deletions
33
personal/diagnostic/compare_lines.py
Normal file
33
personal/diagnostic/compare_lines.py
Normal file
|
@@ -0,0 +1,33 @@
|
|||
import utils
|
||||
import discord_logging
|
||||
import os
|
||||
import sys
|
||||
from datetime import datetime
|
||||
|
||||
# Module-level logger; the script below reports mismatching lines and
# progress counts through log.info().
log = discord_logging.init_logging()
|
||||
|
||||
|
||||
def compare_lines(path_one, path_two, logger):
    """Compare two text files line by line and log every mismatch.

    Lines are compared after stripping trailing whitespace, so differences
    in line endings or trailing spaces are ignored. A file that ends before
    the other is treated as yielding empty lines for the remainder, which
    means every extra non-blank line in the longer file is reported.

    Args:
        path_one: Path of the first file.
        path_two: Path of the second file.
        logger: Object with an ``info(message)`` method used for reporting
            mismatches, progress every 100,000 lines, and the final total.

    Returns:
        A ``(total_lines, mismatches)`` tuple: the number of line positions
        compared and how many of them differed.

    Raises:
        OSError: If either file cannot be opened or read.
    """
    total_lines = 0
    mismatches = 0
    # ``with`` guarantees both handles are closed even if reading fails.
    with open(path_one, 'r') as file_one, open(path_two, 'r') as file_two:
        while True:
            raw_one = file_one.readline()
            raw_two = file_two.readline()
            # readline() returns "" only at end of file; a blank line is
            # "\n". Testing the raw value (before rstrip) keeps blank lines
            # from being mistaken for EOF, and requiring both files to be
            # exhausted ensures the longer file's tail is still checked.
            if not raw_one and not raw_two:
                break

            total_lines += 1
            line_one = raw_one.rstrip()
            line_two = raw_two.rstrip()
            if line_one != line_two:
                # Deliberately keep going so that every mismatch is
                # reported, not just the first one.
                mismatches += 1
                logger.info(f"lines not matching: {total_lines}")
                logger.info(line_one)
                logger.info(line_two)

            if total_lines % 100000 == 0:
                logger.info(f"{total_lines:,}")

    logger.info(f"{total_lines:,}")
    return total_lines, mismatches


if __name__ == "__main__":
    compare_lines(
        r"\\MYCLOUDPR4100\Public\reddit_final\RelationshipsOver35_comments_dump.txt",
        r"\\MYCLOUDPR4100\Public\reddit_final\RelationshipsOver35_comments_mongo.txt",
        log,
    )
|
Loading…
Add table
Add a link
Reference in a new issue