Spaces:

Mazenbs
/

extract_html_full

Sleeping

Mazenbs committed on Dec 17, 2025

Commit

cd3c116

verified ·

1 Parent(s): fde8374

Update parser/assembler.py

Files changed (1) hide show

parser/assembler.py CHANGED Viewed

@@ -140,44 +140,3 @@ def parse_law_from_texts(text_blocks: List[Dict[str, str]], url: str = None) ->
         }
     }
-def parse_law_from_textsx(text_blocks: List[Dict[str, str]]) -> Dict:
-    title, preamble, remaining_blocks = extract_title_and_preamble(text_blocks)
-    sections_raw = extract_sections(remaining_blocks)
-    # Extract the law number and year from the preamble
-    law_info = extract_law_number_and_year(preamble)  # <-- added here
-    sections = []
-    for sec in sections_raw:
-        raw_blocks = sec["texts"]
-        # Join the section's non-article block texts, then apply merge_colon_lines
-        content = "\n".join([b["text"] for b in raw_blocks if not is_article(b["text"])]).strip()
-        content = merge_colon_lines(content)
-        articles = extract_articles_from_blocks(raw_blocks)
-        sections.append({
-            "title": sec["name"],
-            "content": content,
-            "articles": [
-                {"tag": a["text"]} if a["number"] is None else {"number": a["number"], "text": a["text"]}
-                for a in articles
-            ]
-        })
-    return {
-        "message": "success",
-        "blocks": {
-            "count": len(text_blocks),
-        },
-        "law": {
-            "title": title,
-            "preamble": preamble,
-            "number": law_info.get("law_number"),
-            "year": law_info.get("year"),
-            "sections": sections
-        }
-    }