Spaces:
Running
Running
Update parser/table_extractorgo.py
Browse files
parser/table_extractorgo.py
CHANGED
|
@@ -1,7 +1,9 @@
|
|
| 1 |
# parser/table_extractorgo.py
|
| 2 |
from bs4 import BeautifulSoup, Tag
|
| 3 |
from typing import List, Dict, Any
|
| 4 |
-
from helpers.cleaner import clean_text
|
|
|
|
|
|
|
| 5 |
|
| 6 |
def tables_from_soup(soup: BeautifulSoup) -> List[Tag]:
|
| 7 |
"""استخراج جميع عناصر الجدول من صفحة HTML"""
|
|
|
|
| 1 |
# parser/table_extractorgo.py
|
| 2 |
from bs4 import BeautifulSoup, Tag
|
| 3 |
from typing import List, Dict, Any
|
| 4 |
+
from helpers.cleaner import clean_text
|
| 5 |
+
from helpers.utils import is_section, extract_article_number, is_article
|
| 6 |
+
|
| 7 |
|
| 8 |
def tables_from_soup(soup: BeautifulSoup) -> List[Tag]:
|
| 9 |
"""استخراج جميع عناصر الجدول من صفحة HTML"""
|