"""Test the exact JSON structure from the file.

Reads the first few lines of a JSONL dataset and prints, for each record,
its top-level keys and a preview of the final-output text found under
'Output_Sections'.
"""
import json

DATASET_PATH = 'Quillan_finetune_full_dataset.jsonl'

# Keys inside 'Output_Sections' that are searched for the final output text.
# NOTE(review): the original list repeated 'Final output' three times; if
# distinct spellings were intended, add them here.
FINAL_OUTPUT_KEYS = ('Final output',)


def describe_record(line_number, data):
    """Print the keys of one parsed record and preview its final output.

    Args:
        line_number: 1-based line number of the record, used in messages.
        data: The parsed JSON object (a dict) for that line.
    """
    print(f"Line {line_number} keys:", list(data.keys()))

    # Check Output_Sections for Final output
    if 'Output_Sections' not in data:
        return
    output_sections = data['Output_Sections']
    if not isinstance(output_sections, dict):
        # Report the unexpected shape instead of failing on .keys().
        print(
            f"Line {line_number} Output_Sections is not a JSON object: "
            f"{type(output_sections).__name__}"
        )
        return
    print("Output_Sections keys:", list(output_sections.keys()))

    # Look for content in the known candidate keys; first match wins.
    for key in FINAL_OUTPUT_KEYS:
        if key in output_sections:
            content = str(output_sections[key])
            print(f"Found content in '{key}'")
            print(f"Content length: {len(content)}")
            print(f"Content preview: {content[:200]}...")
            break
    else:
        # No candidate key matched: show what is there to aid debugging.
        print("Available Output_Sections keys:", list(output_sections.keys()))


def inspect_dataset(path=DATASET_PATH, max_lines=3):
    """Print the structure of the first few records of a JSONL file.

    Blank lines are skipped. Scanning stops after the first non-blank line
    whose 1-based line number is at least ``max_lines``, whether or not that
    line parsed successfully.

    Args:
        path: Path of the JSONL file to read (UTF-8).
        max_lines: Line number at which scanning stops.

    Raises:
        OSError: If the file cannot be opened.
    """
    with open(path, 'r', encoding='utf-8') as f:
        for i, raw_line in enumerate(f, 1):
            line = raw_line.strip()
            if not line:
                continue
            try:
                data = json.loads(line)
            except json.JSONDecodeError as e:
                print(f"Line {i} JSON error: {e}")
            else:
                if isinstance(data, dict):
                    describe_record(i, data)
                else:
                    print(
                        f"Line {i} JSON error: expected a JSON object, "
                        f"got {type(data).__name__}"
                    )
            # Only check first few lines. This runs on the error path too,
            # so a malformed line cannot extend the scan to the whole file.
            if i >= max_lines:
                break


if __name__ == "__main__":
    inspect_dataset()