Update TextProcessor.py
Browse files- TextProcessor.py +2 -2
TextProcessor.py
CHANGED
|
@@ -58,14 +58,14 @@ def paragraphs(folderpath):
|
|
| 58 |
is_start_blockquote = (prior_endswith_period and current_supertabbed and prior_more_left and not is_inblock)
|
| 59 |
is_after_blockquote = (prior_endswith_period and not current_supertabbed and is_inblock)
|
| 60 |
is_after_disposition = (prior_right_margin and current_tabbed)
|
| 61 |
-
is_after_oneline_paragraph = (prior_tabbed and current_tabbed and not prior_supertabbed and not current_supertabbed and not is_inblock)
|
| 62 |
|
| 63 |
if is_start_blockquote and not is_section_header:
|
| 64 |
is_inblock = True
|
| 65 |
if is_after_blockquote or prior_is_date: # This date hack helps ensure that slip opinion headers do not get caught
|
| 66 |
is_inblock = False
|
| 67 |
|
| 68 |
-
if is_section_header or is_the_classic or
|
| 69 |
paras.append(para)
|
| 70 |
types.append(is_inblock)
|
| 71 |
para = []
|
|
|
|
| 58 |
is_start_blockquote = (prior_endswith_period and current_supertabbed and prior_more_left and not is_inblock)
|
| 59 |
is_after_blockquote = (prior_endswith_period and not current_supertabbed and is_inblock)
|
| 60 |
is_after_disposition = (prior_right_margin and current_tabbed)
|
| 61 |
+
# is_after_oneline_paragraph = (prior_tabbed and current_tabbed and not prior_supertabbed and not current_supertabbed and not is_inblock)
|
| 62 |
|
| 63 |
if is_start_blockquote and not is_section_header:
|
| 64 |
is_inblock = True
|
| 65 |
if is_after_blockquote or prior_is_date: # This date hack helps ensure that slip opinion headers do not get caught
|
| 66 |
is_inblock = False
|
| 67 |
|
| 68 |
+
if is_section_header or is_the_classic or is_start_blockquote or is_after_blockquote or is_after_disposition:
|
| 69 |
paras.append(para)
|
| 70 |
types.append(is_inblock)
|
| 71 |
para = []
|