fix: don't rewrite the clean file if it already exists!

This commit is contained in:
Zach Nussbaum 2023-03-26 18:15:22 +00:00
parent eac7734cbf
commit dfee6963a1

View File

@@ -6,8 +6,10 @@ import jsonlines
import pandas as pd
prompt_generation_dir = "prompts-reponses"
prompt_generation_dir = "raw_data_sanity_cleaned_delobotomized"
for file in glob.glob(os.path.join(prompt_generation_dir, "*.jsonl")):
if "clean" in file:
continue
data = []
print(file)
with open(file) as f: