Marthee committed on
Commit
9e1773c
·
verified ·
1 Parent(s): 146d5bc

Update InitialMarkups.py

Browse files
Files changed (1) hide show
  1. InitialMarkups.py +6 -1
InitialMarkups.py CHANGED
@@ -997,7 +997,12 @@ def extract_section_under_header(multiplePDF_Paths):
997
  i += 2
998
  continue
999
  if collecting:
1000
-
 
 
 
 
 
1001
  norm_line = normalize_text(line_text)
1002
 
1003
  # Optimized URL check
 
997
  i += 2
998
  continue
999
  if collecting:
1000
+ try:
1001
+ if dateparse(line_text, fuzzy=True):
1002
+ collecting=False
1003
+ break
1004
+ except (ParserError, ValueError, OverflowError):
1005
+ pass
1006
  norm_line = normalize_text(line_text)
1007
 
1008
  # Optimized URL check