Spaces:

ifgr003
/

ocr

Sleeping

App Files Community

Hanz Pillerva committed on May 2

Commit

5ee27ce

1 Parent(s): 7a4ffc1

update

Browse files

Files changed (2) hide show

app.py +0 -6
template_matcher.py +6 -2

app.py CHANGED Viewed

@@ -443,7 +443,6 @@ def _map_confidence_for_form(raw_confidence, form_hint):
         return {
             'registry_no':            p('registry_no'),
             'city_municipality':      p('city_municipality'),
-            'date_submitted':         p('registration_date'),
             'child_first':            p('name_first'),
             'child_middle':           p('name_middle'),
             'child_last':             p('name_last'),
@@ -463,11 +462,9 @@ def _map_confidence_for_form(raw_confidence, form_hint):
     if form_hint == '2A':
         # Keys must match what Form2A Val looks up:
         # registry → registry_no (via confidenceKeyMap)
-        # date_reg → date_submitted (via confidenceKeyMap)
         # all others are direct display-key lookups
         return {
             'registry_no':    p('registry_no'),
-            'date_submitted': p('registration_date'),
             'deceased_name':  p('deceased_name'),
             'sex':            p('sex'),
             'age':            p('age'),
@@ -694,7 +691,6 @@ def _map_template_output(raw: dict, form_hint: str) -> dict:
             'registry_no': g('registry_no'),
             'city_municipality': g('city_municipality'),
             'province': g('province'),
-            'date_submitted': g('registration_date'),
             'child_first': g('name_first'),
             'child_middle': g('name_middle'),
             'child_last': g('name_last'),
@@ -719,7 +715,6 @@ def _map_template_output(raw: dict, form_hint: str) -> dict:
             'registry_no': g('registry_no'),
             'city_municipality': g('city_municipality'),
             'province': g('province'),
-            'date_submitted': g('registration_date'),
             'deceased_first': g('deceased_name'),
             'sex': g('sex'),
             'age_years': g('age'),
@@ -735,7 +730,6 @@ def _map_template_output(raw: dict, form_hint: str) -> dict:
             'registry_no': g('registry_no'),
             'city_municipality': g('city_municipality'),
             'province': g('province'),
-            'date_submitted': g('registration_date'),
             'husband_first': g('husband_name_first'),
             'husband_middle': g('husband_name_middle'),
             'husband_last': g('husband_name_last'),

         return {
             'registry_no':            p('registry_no'),
             'city_municipality':      p('city_municipality'),
             'child_first':            p('name_first'),
             'child_middle':           p('name_middle'),
             'child_last':             p('name_last'),
     if form_hint == '2A':
         # Keys must match what Form2A Val looks up:
         # registry → registry_no (via confidenceKeyMap)
         # all others are direct display-key lookups
         return {
             'registry_no':    p('registry_no'),
             'deceased_name':  p('deceased_name'),
             'sex':            p('sex'),
             'age':            p('age'),
             'registry_no': g('registry_no'),
             'city_municipality': g('city_municipality'),
             'province': g('province'),
             'child_first': g('name_first'),
             'child_middle': g('name_middle'),
             'child_last': g('name_last'),
             'registry_no': g('registry_no'),
             'city_municipality': g('city_municipality'),
             'province': g('province'),
             'deceased_first': g('deceased_name'),
             'sex': g('sex'),
             'age_years': g('age'),
             'registry_no': g('registry_no'),
             'city_municipality': g('city_municipality'),
             'province': g('province'),
             'husband_first': g('husband_name_first'),
             'husband_middle': g('husband_name_middle'),
             'husband_last': g('husband_name_last'),

template_matcher.py CHANGED Viewed

@@ -187,8 +187,12 @@ def _crnn_read_batch_with_confidence(crops: list) -> list:
                 # Mean confidence over character-bearing frames
                 conf = float(max_probs[:, n][non_blank_mask].mean().item())
             else:
-                # All blanks → field is empty; correctly extracting nothing
-                # is 100% accurate, so return 1.0 instead of a low soft indicator.
                 conf = 1.0
             results.append((text, round(conf, 4)))

                 # Mean confidence over character-bearing frames
                 conf = float(max_probs[:, n][non_blank_mask].mean().item())
             else:
+                conf = 1.0
+            # If the final decoded text is empty (line noise, form borders,
+            # or unrecognised characters all got decoded away), the extraction
+            # is still "correct" — nothing was there — so override to 100%.
+            if not text:
                 conf = 1.0
             results.append((text, round(conf, 4)))