| import os | |
| import json | |
| def merge_json_files(folder_path, output_file): | |
| merged_data = [] | |
| # Iterate over all files in the folder | |
| for filename in os.listdir(folder_path): | |
| if filename.endswith(".jsonl"): | |
| file_path = os.path.join(folder_path, filename) | |
| print(file_path) | |
| with open(file_path) as f: | |
| data=[json.loads(line) for line in f] | |
| merged_data.extend(data) | |
| # Write the merged data to the output file | |
| with open(output_file, "w", encoding="utf-8") as out_f: | |
| json.dump(merged_data, out_f, indent=4, ensure_ascii=False) | |
| print(f"Merged {len(merged_data)} entries into {output_file}") | |
| # Example usage: | |
| merge_json_files("/home/gs4288/visual_pruning_kl/data/playground", "/home/gs4288/visual_pruning_kl/data/playground/merged.json") | |