# NOTE: hosting-page status text captured with the script ("Spaces: Sleeping / Sleeping"); not part of the program.
import jsonlines
# Path to your dataset file
dataset_file = "data/train200.jsonl"
# Path to the output file
output_file = "data/firstStep_file.jsonl"


def extract_record(obj):
    """Return the ``{"text": ..., "label": ...}`` record for one JSONL object.

    The label is the first element of ``obj["accept"]``.

    Args:
        obj: A mapping read from the dataset; ``"text"`` and ``"accept"``
            are looked up with ``.get`` so either key may be absent.

    Returns:
        A dict with ``"text"`` and ``"label"`` keys, or ``None`` when the
        text is missing/empty or there is no truthy first accepted label
        (key absent, null, or an empty list).
    """
    text = obj.get("text")
    # `or []` treats a missing key, an explicit null and an empty list alike.
    # Indexing `[0]` directly raised IndexError/TypeError on such rows, which
    # the outer handler turned into an abort of the whole conversion.
    accepted = obj.get("accept") or []
    label = accepted[0] if accepted else None
    if text and label:
        return {"text": text, "label": label}
    return None


# Open the JSONL file and extract text and labels
try:
    with jsonlines.open(dataset_file) as reader, \
            jsonlines.open(output_file, mode='w') as writer:
        for obj in reader:
            record = extract_record(obj)
            if record is not None:
                writer.write(record)
            else:
                # Incomplete rows are skipped, not fatal.
                print("Warning: Text or label missing in the JSON object.")
    print("Processing completed. Output written to:", output_file)
except Exception as e:
    # Top-level boundary of the script: report the failure as a message
    # rather than letting a traceback escape.
    print("Error:", e)