mirror of
https://github.com/nomic-ai/gpt4all.git
synced 2024-10-01 01:06:10 -04:00
fix: don't rewrite clean file if exists!
This commit is contained in:
parent
eac7734cbf
commit
dfee6963a1
4
clean.py
4
clean.py
@ -6,8 +6,10 @@ import jsonlines
|
||||
import pandas as pd
|
||||
|
||||
|
||||
prompt_generation_dir = "prompts-reponses"
|
||||
prompt_generation_dir = "raw_data_sanity_cleaned_delobotomized"
|
||||
for file in glob.glob(os.path.join(prompt_generation_dir, "*.jsonl")):
|
||||
if "clean" in file:
|
||||
continue
|
||||
data = []
|
||||
print(file)
|
||||
with open(file) as f:
|
||||
|
Loading…
Reference in New Issue
Block a user