Marthee committed on
Commit
8440059
·
verified ·
1 Parent(s): e4615c4

Update InitialMarkups.py

Browse files
Files changed (1) hide show
  1. InitialMarkups.py +5 -2
InitialMarkups.py CHANGED
@@ -997,8 +997,11 @@ def extract_section_under_header(multiplePDF_Paths):
997
  i += 2
998
  continue
999
  if collecting:
1000
- if dateparse(line_text, fuzzy=True):
1001
- continue
 
 
 
1002
  norm_line = normalize_text(line_text)
1003
 
1004
  # Optimized URL check
 
997
  i += 2
998
  continue
999
  if collecting:
1000
+ try:
1001
+ if dateparse(line_text, fuzzy=True):
1002
+ break
1003
+ except (ParserError, ValueError, OverflowError):
1004
+ pass
1005
  norm_line = normalize_text(line_text)
1006
 
1007
  # Optimized URL check