fix metadata
Browse files
app/law_document_chunker.py
CHANGED
|
@@ -420,6 +420,8 @@ class LawDocumentChunker:
|
|
| 420 |
try:
|
| 421 |
# Tạo embedding
|
| 422 |
embedding = await self.embedding_client.create_embedding(chunk.content, task_type="retrieval_document")
|
|
|
|
|
|
|
| 423 |
|
| 424 |
# Chuẩn bị data cho Supabase
|
| 425 |
chunk_dict = {
|
|
@@ -433,7 +435,7 @@ class LawDocumentChunker:
|
|
| 433 |
'article_title': chunk.article_title,
|
| 434 |
'clause_number': chunk.clause_number,
|
| 435 |
'sub_clause_letter': chunk.sub_clause_letter,
|
| 436 |
-
'context_summary': f"Structure: {chunk.context_summary}|Semantic: {
|
| 437 |
}
|
| 438 |
|
| 439 |
# Lưu ngay lập tức vào Supabase
|
|
|
|
| 420 |
try:
|
| 421 |
# Tạo embedding
|
| 422 |
embedding = await self.embedding_client.create_embedding(chunk.content, task_type="retrieval_document")
|
| 423 |
+
# Sinh semantic summary bằng LLM
|
| 424 |
+
semantic_summary = await self._create_semantic_summary_with_llm(chunk.content)
|
| 425 |
|
| 426 |
# Chuẩn bị data cho Supabase
|
| 427 |
chunk_dict = {
|
|
|
|
| 435 |
'article_title': chunk.article_title,
|
| 436 |
'clause_number': chunk.clause_number,
|
| 437 |
'sub_clause_letter': chunk.sub_clause_letter,
|
| 438 |
+
'context_summary': f"Structure: {chunk.context_summary}|Semantic: {semantic_summary}"
|
| 439 |
}
|
| 440 |
|
| 441 |
# Lưu ngay lập tức vào Supabase
|