igedi / utils /merge_jsons.py
Andrea Maldonado
directory structure
a451e02
raw
history blame
1.3 kB
import argparse
import json
import csv
import os
"""
Run using:
python merge_jsons.py path_to_your_json_directory output.csv
"""
def json_to_csv(json_dir, output_csv):
json_files = [os.path.join(json_dir, file) for file in os.listdir(json_dir) if file.endswith('.json')]
# Collect data from all JSON files
all_data = []
for json_file in json_files:
with open(json_file, 'r') as f:
data = json.load(f)
all_data.append(data)
# Extract the headers from the first JSON object
if all_data:
headers = {elem for s in [set(i) for i in [d.keys() for d in all_data]] for elem in s}
else:
raise ValueError("No data found in JSON files")
# Write data to CSV
with open(output_csv, 'w', newline='') as f:
writer = csv.DictWriter(f, fieldnames=headers)
writer.writeheader()
writer.writerows(all_data)
# Example usage
if __name__ == '__main__':
parser = argparse.ArgumentParser(description='Convert JSON files in a directory to a CSV file.')
parser.add_argument('json_dir', type=str, help='The directory containing JSON files')
parser.add_argument('output_csv', type=str, help='The output CSV file path')
args = parser.parse_args()
json_to_csv(args.json_dir, args.output_csv)