mirror of
https://github.com/nomic-ai/gpt4all.git
synced 2025-09-26 23:45:12 +00:00
fix: don't rewrite clean file if exists!
This commit is contained in:
4
clean.py
4
clean.py
@@ -6,8 +6,10 @@ import jsonlines
|
||||
import pandas as pd
|
||||
|
||||
|
||||
prompt_generation_dir = "prompts-reponses"
|
||||
prompt_generation_dir = "raw_data_sanity_cleaned_delobotomized"
|
||||
for file in glob.glob(os.path.join(prompt_generation_dir, "*.jsonl")):
|
||||
if "clean" in file:
|
||||
continue
|
||||
data = []
|
||||
print(file)
|
||||
with open(file) as f:
|
||||
|
Reference in New Issue
Block a user