| { | |
| "parse_failure_count": 45, | |
| "total_failure_count": 74, | |
| "source_unavailable_failure_count": 29, | |
| "parse_failures_by_group": { | |
| "house_clerk_disclosures": 28, | |
| "house_cpf": 17 | |
| }, | |
| "parse_failures_by_reason": { | |
| "parse_failed": 45 | |
| }, | |
| "failure_reason_counts": { | |
| "parse_failed": 45, | |
| "source_unavailable": 29 | |
| }, | |
| "parse_failures_by_detail": { | |
| "ocr_text_unparseable": 28, | |
| "pdf_text_unparseable_after_ocr": 4, | |
| "pdf_text_unparseable": 13 | |
| }, | |
| "top_parse_failure_members": [ | |
| { | |
| "member_slug": "michael_t_mccaul", | |
| "count": 8 | |
| }, | |
| { | |
| "member_slug": "ro_khanna", | |
| "count": 6 | |
| }, | |
| { | |
| "member_slug": "harold_rogers", | |
| "count": 5 | |
| }, | |
| { | |
| "member_slug": "nicole_malliotakis", | |
| "count": 3 | |
| }, | |
| { | |
| "member_slug": "harriet_m_hageman", | |
| "count": 3 | |
| }, | |
| { | |
| "member_slug": "beth_van_duyne", | |
| "count": 3 | |
| }, | |
| { | |
| "member_slug": "keith_self", | |
| "count": 2 | |
| }, | |
| { | |
| "member_slug": "christopher_h_smith", | |
| "count": 2 | |
| }, | |
| { | |
| "member_slug": "ann_wagner", | |
| "count": 2 | |
| }, | |
| { | |
| "member_slug": "tony_wied", | |
| "count": 2 | |
| }, | |
| { | |
| "member_slug": "ken_calvert", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "byron_donalds", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "mike_ezell", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "charles_j_chuck_fleischmann", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "seth_moulton", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "mark_pocan", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "david_rouzer", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "michael_k_simpson", | |
| "count": 1 | |
| }, | |
| { | |
| "member_slug": "mike_thompson", | |
| "count": 1 | |
| } | |
| ], | |
| "source_unavailable_by_group": { | |
| "house_votes": 9, | |
| "lda_public_search": 1, | |
| "usaspending_public_site": 233 | |
| }, | |
| "partial_recovery_counts": { | |
| "reused_existing_raw_artifact": 50702, | |
| "pdf_parse_failed_but_page_context_preserved": 150, | |
| "page_supported_unresolved_request_recovered": 100, | |
| "ocr_candidate_ptr_rows_recovered": 11, | |
| "pdf_url_returned_html_but_recipient_recovered": 11, | |
| "usaspending_award_public_page": 14016, | |
| "recovered_public_award_pages_prelink:14016": 1 | |
| }, | |
| "guidance_signal_counts": { | |
| "house_cpf needs deterministic fallback or parser hardening": 84, | |
| "house_clerk_disclosures needs deterministic fallback or parser hardening": 28, | |
| "house_votes needs deterministic fallback or parser hardening": 9, | |
| "lda_public_search needs deterministic fallback or parser hardening": 2, | |
| "usaspending_public_site needs deterministic fallback or parser hardening": 1634 | |
| }, | |
| "house_cpf_filename_recovered_requests": 10, | |
| "house_cpf_unresolved_requests": 1866, | |
| "house_cpf_page_supported_requests": 3173 | |
| } |