Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -483,14 +483,20 @@ class TextToSQLSystem:
|
|
| 483 |
|
| 484 |
# in class TextToSQLSystem:
|
| 485 |
|
| 486 |
-
def _validate_and_fix_sql(self,
|
| 487 |
"""
|
| 488 |
-
(
|
| 489 |
一個全面、多層次的 SQL 驗證與生成引擎。
|
| 490 |
-
|
| 491 |
-
|
| 492 |
-
返回一個元組 (SQL字符串或None, 狀態消息)。
|
| 493 |
"""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 494 |
q_lower = question.lower()
|
| 495 |
|
| 496 |
# ==============================================================================
|
|
@@ -499,56 +505,47 @@ class TextToSQLSystem:
|
|
| 499 |
|
| 500 |
# --- 預先檢測所有可能的意圖和實體 ---
|
| 501 |
job_no_match = re.search(r"(?:工單|jobno)\s*'\"?([A-Z]{2,3}\d+)'\"?", question, re.IGNORECASE)
|
| 502 |
-
|
| 503 |
entity_match_data = None
|
| 504 |
-
ENTITY_TO_COLUMN_MAP = {
|
| 505 |
-
'申請廠商': 'sd.ApplicantName', '申請方': 'sd.ApplicantName', 'applicant': 'sd.ApplicantName',
|
| 506 |
-
'付款廠商': 'sd.InvoiceToName', '付款方': 'sd.InvoiceToName', 'invoiceto': 'sd.InvoiceToName',
|
| 507 |
-
'代理商': 'sd.AgentName', 'agent': 'sd.AgentName',
|
| 508 |
-
'買家': 'sd.BuyerName', 'buyer': 'sd.BuyerName', '客戶': 'sd.BuyerName', '品牌': 'tsr.BuyerName'
|
| 509 |
-
}
|
| 510 |
for keyword, column in ENTITY_TO_COLUMN_MAP.items():
|
| 511 |
if keyword in q_lower:
|
| 512 |
match = re.search(fr"{re.escape(keyword)}[\s:;\'\"-]*([a-zA-Z0-9&.\s-]+?)(?:\s*的|\s+|為|$)", question, re.IGNORECASE)
|
| 513 |
-
if match:
|
| 514 |
-
entity_match_data = {"type": keyword, "name": match.group(1).strip(), "column": column}
|
| 515 |
-
break
|
| 516 |
|
| 517 |
lab_group_match_data = None
|
| 518 |
LAB_GROUP_MAP = {'A':'TA','B':'TB','C':'TC','D':'TD','E':'TE','Y':'TY','TA':'TA','TB':'TB','TC':'TC','TD':'TD','TE':'TE','TY':'TY','WC':'WC','EO':'EO','GCI':'GCI','GCO':'GCO','MI':'MI'}
|
| 519 |
lab_group_match = re.findall(r"([A-Z]+)\s*組", question, re.IGNORECASE)
|
| 520 |
if lab_group_match:
|
| 521 |
codes = [LAB_GROUP_MAP.get(g.upper()) for g in lab_group_match if LAB_GROUP_MAP.get(g.upper())]
|
| 522 |
-
if codes:
|
| 523 |
-
lab_group_match_data = {"codes": codes, "identifiers": lab_group_match}
|
| 524 |
|
| 525 |
is_tat_query = any(k in q_lower for k in ['平均', 'average']) and any(k in q_lower for k in ['時間', '時長', '多久', '天', 'tat', 'turnaround'])
|
| 526 |
-
|
| 527 |
# --- 判斷邏輯: 依優先級進入對應的模板 ---
|
| 528 |
-
|
| 529 |
if job_no_match and any(kw in q_lower for kw in ['工作日', 'workday']):
|
| 530 |
job_no = job_no_match.group(1).upper()
|
| 531 |
self._log(f"🔄 檢測到計算【工單 {job_no}】工作日TAT的意圖,啟用模板。", "INFO")
|
| 532 |
-
|
| 533 |
-
|
| 534 |
|
| 535 |
-
|
| 536 |
job_no = job_no_match.group(1).upper()
|
| 537 |
self._log(f"🔄 檢測到計算【��單 {job_no}】日曆日TAT的意圖,啟用模板。", "INFO")
|
| 538 |
-
|
| 539 |
-
|
| 540 |
|
| 541 |
-
|
| 542 |
job_no = job_no_match.group(1).upper()
|
| 543 |
self._log(f"🔄 檢測到對【單一工作單 '{job_no}'】的【標準金額計算】意圖,啟用模板。", "INFO")
|
| 544 |
-
|
| 545 |
-
|
| 546 |
|
| 547 |
-
|
| 548 |
limit_match = re.search(r'(\d+)', question)
|
| 549 |
limit = limit_match.group(1) if limit_match else '10'
|
| 550 |
self._log(f"🔄 檢測到查詢【Top {limit} 工作單金額】意圖,啟用模板。", "INFO")
|
| 551 |
-
|
| 552 |
WITH JobTotalAmount AS (
|
| 553 |
SELECT JobNo, SUM(LocalAmount) AS TotalAmount
|
| 554 |
FROM (SELECT DISTINCT JobNo, InvoiceCreditNoteNo, LocalAmount FROM TSR53Invoice)
|
|
@@ -559,20 +556,40 @@ FROM JobTotalAmount
|
|
| 559 |
ORDER BY TotalAmount DESC
|
| 560 |
LIMIT {limit};
|
| 561 |
"""
|
| 562 |
-
|
| 563 |
|
| 564 |
-
|
| 565 |
year_match = re.search(r'(\d{4})\s*年?', question)
|
| 566 |
month_match = re.search(r'(\d{1,2})\s*月', question)
|
| 567 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 568 |
if year_match:
|
| 569 |
-
year = year_match.group(1)
|
| 570 |
-
|
| 571 |
-
|
| 572 |
-
|
| 573 |
-
|
| 574 |
-
|
| 575 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 576 |
year_match = re.search(r'(\d{4})\s*年?', question)
|
| 577 |
time_condition, time_log = "", "總"
|
| 578 |
if year_match:
|
|
@@ -582,27 +599,27 @@ LIMIT {limit};
|
|
| 582 |
else:
|
| 583 |
time_condition = "WHERE ReportAuthorization IS NOT NULL"
|
| 584 |
self._log(f"🔄 檢測到查詢【{time_log}全局報告總數】意圖,啟用模板。", "INFO")
|
| 585 |
-
|
| 586 |
-
|
| 587 |
|
| 588 |
-
|
| 589 |
entity_type, entity_name, column_name = entity_match_data["type"], entity_match_data["name"], entity_match_data["column"]
|
| 590 |
year = (re.search(r'(\d{4})\s*年?', question) or ['', datetime.now().strftime('%Y')])[1]
|
| 591 |
self._log(f"🔄 檢測到查詢【{entity_type} '{entity_name}' 在 {year} 年的總業績】意圖,啟用模板。", "INFO")
|
| 592 |
-
|
| 593 |
-
|
| 594 |
|
| 595 |
-
|
| 596 |
year_match, month_match = re.search(r'(\d{4})\s*年?', question), re.search(r'(\d{1,2})\s*月', question)
|
| 597 |
time_condition, time_log = "", "總"
|
| 598 |
if year_match:
|
| 599 |
year = year_match.group(1); time_condition = f"WHERE strftime('%Y', InvoiceCreditNoteDate) = '{year}'"; time_log = f"{year}年"
|
| 600 |
if month_match: month = month_match.group(1).zfill(2); time_condition += f" AND strftime('%m', InvoiceCreditNoteDate) = '{month}'"; time_log += f"{month}月"
|
| 601 |
self._log(f"🔄 檢測到查詢【{time_log}全局總業績】意圖,啟用模板。", "INFO")
|
| 602 |
-
|
| 603 |
-
|
| 604 |
|
| 605 |
-
|
| 606 |
lab_group_code = lab_group_match_data["codes"][0]
|
| 607 |
target_table = f"JobTimeline_{lab_group_code}"
|
| 608 |
year = (re.search(r'(\d{4})\s*年', question) or ['', datetime.now().strftime('%Y')])[1]
|
|
@@ -614,60 +631,61 @@ LIMIT {limit};
|
|
| 614 |
time_condition += f" AND strftime('%m', end_time) = '{month}'"
|
| 615 |
month_str = f"{month}月"
|
| 616 |
self._log(f"🔄 檢測到查詢【{lab_group_code}組】完成的【測試項目數】意圖,啟用專屬模板。", "INFO")
|
| 617 |
-
|
| 618 |
-
|
| 619 |
|
| 620 |
-
|
| 621 |
-
|
| 622 |
-
|
| 623 |
-
|
| 624 |
-
|
| 625 |
-
|
| 626 |
-
|
| 627 |
-
|
| 628 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 629 |
|
| 630 |
-
|
| 631 |
-
|
| 632 |
-
fixed_sql = " " + parsed_sql.strip() + " "
|
| 633 |
-
fixes_applied_fallback = []
|
| 634 |
-
|
| 635 |
-
dialect_corrections = {
|
| 636 |
-
r'YEAR\s*\(([^)]+)\)': r"strftime('%Y', \1)",
|
| 637 |
-
r"(strftime\('%Y',\s*[^)]+\))\s*=\s*(\d{4})": r"\1 = '\2'",
|
| 638 |
-
r"EXTRACT\s*\(\s*YEAR\s+FROM\s+([^)]+)\s*\)": r"strftime('%Y', \1)"
|
| 639 |
-
}
|
| 640 |
-
for pattern, replacement in dialect_corrections.items():
|
| 641 |
-
if re.search(pattern, fixed_sql, re.IGNORECASE):
|
| 642 |
-
fixed_sql = re.sub(pattern, replacement, fixed_sql, flags=re.IGNORECASE)
|
| 643 |
-
fixes_applied_fallback.append(f"修正方言: {pattern}")
|
| 644 |
-
|
| 645 |
-
schema_corrections = {
|
| 646 |
-
'TSR53ReportAuthorization': 'TSR53SampleDescription', 'TSR53TestResult': 'TSR53SampleDescription',
|
| 647 |
-
'JobInvoice': 'TSR53Invoice', 'JobInvoiceAuthorization': 'TSR53Invoice', 'JobInvoiceCreditNote': 'TSR53Invoice',
|
| 648 |
-
'Customer': 'TSR53SampleDescription', 'Customers': 'TSR53SampleDescription',
|
| 649 |
-
'Invoice': 'TSR53Invoice', 'Invoices': 'TSR53Invoice', 'Job': 'JobTimeline', 'Jobs': 'JobsInProgress',
|
| 650 |
-
'Tests': 'TSR53MarsItem', 'TestsLog': 'JobItemsInProgress',
|
| 651 |
-
'AuthorizationDate': 'ReportAuthorization', 'ReportAuthorizationDate': 'ReportAuthorization',
|
| 652 |
-
'LegalAuthorization': 'OverallRating', 'LegalAuthorizationDate': 'ReportAuthorization',
|
| 653 |
-
'TestResult': 'OverallRating', 'Rating': 'OverallRating', 'CustomerName': 'BuyerName', 'InvoiceTo': 'InvoiceToName',
|
| 654 |
-
'Applicant': 'ApplicantName', 'Agent': 'AgentName', 'JobNumber': 'JobNo', 'ReportNo': 'JobNo', 'TestName': 'ItemInvoiceDescriptionJob',
|
| 655 |
-
'CreationDate': 'JobCreation', 'CreateDate': 'JobCreation', 'CompletedDate': 'ReportAuthorization',
|
| 656 |
-
'InvoiceCreditNoteAmount': 'LocalAmount',
|
| 657 |
-
'Amount': 'LocalAmount', 'Price': 'LocalAmount', 'Lab': 'LabGroup'
|
| 658 |
-
}
|
| 659 |
-
for wrong, correct in schema_corrections.items():
|
| 660 |
-
pattern = r'\b' + re.escape(wrong) + r'\b'
|
| 661 |
-
if re.search(pattern, fixed_sql, re.IGNORECASE):
|
| 662 |
-
fixed_sql = re.sub(pattern, correct, fixed_sql, flags=re.IGNORECASE)
|
| 663 |
-
fixes_applied_fallback.append(f"映射 Schema: '{wrong}' -> '{correct}'")
|
| 664 |
-
|
| 665 |
-
if any(kw in q_lower for kw in ['幾份', '多少', 'how many', 'count', '數量']) and 'select ' in fixed_sql.lower() and 'count' not in fixed_sql.lower() and 'group by' not in fixed_sql.lower():
|
| 666 |
-
fixed_sql = re.sub(r'SELECT\s+.*?FROM', 'SELECT COUNT(*) FROM', fixed_sql, count=1, flags=re.IGNORECASE)
|
| 667 |
-
fixes_applied_fallback.append("修正邏輯: 補全 COUNT(*)")
|
| 668 |
-
|
| 669 |
-
log_msg = "AI 生成並成功修正" if fixes_applied_fallback else "AI 生成且無需修正"
|
| 670 |
-
return self._finalize_sql(fixed_sql, log_msg)
|
| 671 |
|
| 672 |
def _finalize_sql(self, sql: str, log_message: str) -> Tuple[str, str]:
|
| 673 |
"""一個輔助函數,用於清理最終的SQL並記錄成功日誌。"""
|
|
|
|
| 483 |
|
| 484 |
# in class TextToSQLSystem:
|
| 485 |
|
| 486 |
+
def _validate_and_fix_sql(self, sql: str, question: str) -> str:
|
| 487 |
"""
|
| 488 |
+
(V20 / 智能列表版)
|
| 489 |
一個全面、多層次的 SQL 驗證與生成引擎。
|
| 490 |
+
強化了“報告列表”意圖模板,使其能夠動態識別並附加額外的篩選條件,
|
| 491 |
+
如報告狀態 (Fail/Pass),從而生成更精準的列表查詢。
|
|
|
|
| 492 |
"""
|
| 493 |
+
if not sql or not self.schema:
|
| 494 |
+
self._log("SQL 修正被跳過,因輸入為空或 schema 未載入。", "WARNING")
|
| 495 |
+
return sql
|
| 496 |
+
|
| 497 |
+
original_sql = sql
|
| 498 |
+
fixed_sql = " " + sql.strip() + " "
|
| 499 |
+
fixes_applied = []
|
| 500 |
q_lower = question.lower()
|
| 501 |
|
| 502 |
# ==============================================================================
|
|
|
|
| 505 |
|
| 506 |
# --- 預先檢測所有可能的意圖和實體 ---
|
| 507 |
job_no_match = re.search(r"(?:工單|jobno)\s*'\"?([A-Z]{2,3}\d+)'\"?", question, re.IGNORECASE)
|
|
|
|
| 508 |
entity_match_data = None
|
| 509 |
+
ENTITY_TO_COLUMN_MAP = {'申請廠商':'sd.ApplicantName','申請方':'sd.ApplicantName','applicant':'sd.ApplicantName','付款廠商':'sd.InvoiceToName','付款方':'sd.InvoiceToName','invoiceto':'sd.InvoiceToName','代理商':'sd.AgentName','agent':'sd.AgentName','買家':'sd.BuyerName','buyer':'sd.BuyerName','客戶':'sd.BuyerName', '品牌': 'tsr.BuyerName'}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 510 |
for keyword, column in ENTITY_TO_COLUMN_MAP.items():
|
| 511 |
if keyword in q_lower:
|
| 512 |
match = re.search(fr"{re.escape(keyword)}[\s:;\'\"-]*([a-zA-Z0-9&.\s-]+?)(?:\s*的|\s+|為|$)", question, re.IGNORECASE)
|
| 513 |
+
if match: entity_match_data = {"type": keyword, "name": match.group(1).strip(), "column": column}; break
|
|
|
|
|
|
|
| 514 |
|
| 515 |
lab_group_match_data = None
|
| 516 |
LAB_GROUP_MAP = {'A':'TA','B':'TB','C':'TC','D':'TD','E':'TE','Y':'TY','TA':'TA','TB':'TB','TC':'TC','TD':'TD','TE':'TE','TY':'TY','WC':'WC','EO':'EO','GCI':'GCI','GCO':'GCO','MI':'MI'}
|
| 517 |
lab_group_match = re.findall(r"([A-Z]+)\s*組", question, re.IGNORECASE)
|
| 518 |
if lab_group_match:
|
| 519 |
codes = [LAB_GROUP_MAP.get(g.upper()) for g in lab_group_match if LAB_GROUP_MAP.get(g.upper())]
|
| 520 |
+
if codes: lab_group_match_data = {"codes": codes, "identifiers": lab_group_match}
|
|
|
|
| 521 |
|
| 522 |
is_tat_query = any(k in q_lower for k in ['平均', 'average']) and any(k in q_lower for k in ['時間', '時長', '多久', '天', 'tat', 'turnaround'])
|
| 523 |
+
|
| 524 |
# --- 判斷邏輯: 依優先級進入對應的模板 ---
|
| 525 |
+
|
| 526 |
if job_no_match and any(kw in q_lower for kw in ['工作日', 'workday']):
|
| 527 |
job_no = job_no_match.group(1).upper()
|
| 528 |
self._log(f"🔄 檢測到計算【工單 {job_no}】工作日TAT的意圖,啟用模板。", "INFO")
|
| 529 |
+
fixed_sql = f"""WITH span AS (SELECT date(jt.JobCreation) AS d1, date(jt.ReportAuthorization) AS d2 FROM JobTimeline jt WHERE jt.JobNo = '{job_no}'), days AS (SELECT 1 FROM calendar_days, span WHERE date BETWEEN d1 AND d2 AND is_workday = 1) SELECT COUNT(*) FROM days;"""
|
| 530 |
+
fixes_applied.append(f"模板覆寫: {job_no} 的工作日天數")
|
| 531 |
|
| 532 |
+
elif job_no_match and any(kw in q_lower for kw in ['總處理時長', '時長', '多少天']):
|
| 533 |
job_no = job_no_match.group(1).upper()
|
| 534 |
self._log(f"🔄 檢測到計算【��單 {job_no}】日曆日TAT的意圖,啟用模板。", "INFO")
|
| 535 |
+
fixed_sql = f"""SELECT ROUND(julianday(ReportAuthorization) - julianday(JobCreation), 2) AS days FROM JobTimeline WHERE JobNo = '{job_no}';"""
|
| 536 |
+
fixes_applied.append(f"模板覆寫: {job_no} 的日曆日總時長")
|
| 537 |
|
| 538 |
+
elif job_no_match and any(kw in q_lower for kw in ['總金額', '金額', '業績', 'total amount']):
|
| 539 |
job_no = job_no_match.group(1).upper()
|
| 540 |
self._log(f"🔄 檢測到對【單一工作單 '{job_no}'】的【標準金額計算】意圖,啟用模板。", "INFO")
|
| 541 |
+
fixed_sql = f"""WITH JobTotalAmount AS (SELECT JobNo, SUM(LocalAmount) AS TotalAmount FROM (SELECT DISTINCT JobNo, InvoiceCreditNoteNo, LocalAmount FROM TSR53Invoice) GROUP BY JobNo) SELECT TotalAmount FROM JobTotalAmount WHERE JobNo = '{job_no}';"""
|
| 542 |
+
fixes_applied.append(f"模板覆寫: 工作單 {job_no} 的標準總金額 (CTE去重)")
|
| 543 |
|
| 544 |
+
elif '總金額最高' in q_lower and '工作單' in q_lower:
|
| 545 |
limit_match = re.search(r'(\d+)', question)
|
| 546 |
limit = limit_match.group(1) if limit_match else '10'
|
| 547 |
self._log(f"🔄 檢測到查詢【Top {limit} 工作單金額】意圖,啟用模板。", "INFO")
|
| 548 |
+
fixed_sql = f"""
|
| 549 |
WITH JobTotalAmount AS (
|
| 550 |
SELECT JobNo, SUM(LocalAmount) AS TotalAmount
|
| 551 |
FROM (SELECT DISTINCT JobNo, InvoiceCreditNoteNo, LocalAmount FROM TSR53Invoice)
|
|
|
|
| 556 |
ORDER BY TotalAmount DESC
|
| 557 |
LIMIT {limit};
|
| 558 |
"""
|
| 559 |
+
fixes_applied.append(f"模板覆寫: Top {limit} 工作單金額")
|
| 560 |
|
| 561 |
+
elif any(kw in q_lower for kw in ['報告號碼', '報告清單', '列出報告', 'report number', 'list of reports']):
|
| 562 |
year_match = re.search(r'(\d{4})\s*年?', question)
|
| 563 |
month_match = re.search(r'(\d{1,2})\s*月', question)
|
| 564 |
+
|
| 565 |
+
from_clause = "FROM JobTimeline AS jt"
|
| 566 |
+
where_conditions = ["jt.ReportAuthorization IS NOT NULL"]
|
| 567 |
+
time_log = ""
|
| 568 |
+
|
| 569 |
if year_match:
|
| 570 |
+
year = year_match.group(1)
|
| 571 |
+
where_conditions.append(f"strftime('%Y', jt.ReportAuthorization) = '{year}'")
|
| 572 |
+
time_log = f"{year}年"
|
| 573 |
+
if month_match:
|
| 574 |
+
month = month_match.group(1).zfill(2)
|
| 575 |
+
where_conditions.append(f"strftime('%m', jt.ReportAuthorization) = '{month}'")
|
| 576 |
+
time_log += f"{month}月"
|
| 577 |
+
|
| 578 |
+
if 'fail' in q_lower or '失敗' in q_lower:
|
| 579 |
+
if "JOIN TSR53SampleDescription" not in from_clause: from_clause = "FROM JobTimeline AS jt JOIN TSR53SampleDescription AS sd ON jt.JobNo = sd.JobNo"
|
| 580 |
+
where_conditions.append("sd.OverallRating = 'Fail'")
|
| 581 |
+
time_log += " Fail"
|
| 582 |
+
elif 'pass' in q_lower or '通過' in q_lower:
|
| 583 |
+
if "JOIN TSR53SampleDescription" not in from_clause: from_clause = "FROM JobTimeline AS jt JOIN TSR53SampleDescription AS sd ON jt.JobNo = sd.JobNo"
|
| 584 |
+
where_conditions.append("sd.OverallRating = 'Pass'")
|
| 585 |
+
time_log += " Pass"
|
| 586 |
+
|
| 587 |
+
final_where_clause = "WHERE " + " AND ".join(where_conditions)
|
| 588 |
+
self._log(f"🔄 檢測到查詢【{time_log} 報告列表】意圖,啟用智能模板。", "INFO")
|
| 589 |
+
fixed_sql = f"SELECT jt.JobNo, jt.ReportAuthorization {from_clause} {final_where_clause} ORDER BY jt.ReportAuthorization DESC;"
|
| 590 |
+
fixes_applied.append(f"模板覆寫: {time_log} 報告列表查詢")
|
| 591 |
+
|
| 592 |
+
elif '報告' in q_lower and any(kw in q_lower for kw in ['幾份', '多少', '數量', '總數']) and not entity_match_data and not lab_group_match_data:
|
| 593 |
year_match = re.search(r'(\d{4})\s*年?', question)
|
| 594 |
time_condition, time_log = "", "總"
|
| 595 |
if year_match:
|
|
|
|
| 599 |
else:
|
| 600 |
time_condition = "WHERE ReportAuthorization IS NOT NULL"
|
| 601 |
self._log(f"🔄 檢測到查詢【{time_log}全局報告總數】意圖,啟用模板。", "INFO")
|
| 602 |
+
fixed_sql = f"SELECT COUNT(DISTINCT JobNo) AS report_count FROM JobTimeline {time_condition};"
|
| 603 |
+
fixes_applied.append(f"模板覆寫: {time_log}全局報告總數查詢")
|
| 604 |
|
| 605 |
+
elif entity_match_data and any(kw in q_lower for kw in ['業績', '營收', '金額', 'sales', 'revenue']):
|
| 606 |
entity_type, entity_name, column_name = entity_match_data["type"], entity_match_data["name"], entity_match_data["column"]
|
| 607 |
year = (re.search(r'(\d{4})\s*年?', question) or ['', datetime.now().strftime('%Y')])[1]
|
| 608 |
self._log(f"🔄 檢測到查詢【{entity_type} '{entity_name}' 在 {year} 年的總業績】意圖,啟用模板。", "INFO")
|
| 609 |
+
fixed_sql = f"""WITH JobTotalAmount AS (SELECT JobNo, SUM(LocalAmount) AS TotalAmount FROM (SELECT DISTINCT JobNo, InvoiceCreditNoteNo, LocalAmount FROM TSR53Invoice) GROUP BY JobNo) SELECT SUM(jta.TotalAmount) AS total_revenue FROM TSR53SampleDescription AS sd JOIN JobTotalAmount AS jta ON sd.JobNo = jta.JobNo WHERE {column_name} LIKE '%{entity_name}%' AND strftime('%Y', sd.FirstReportAuthorizedDate) = '{year}';"""
|
| 610 |
+
fixes_applied.append(f"模板覆寫: 查詢 {entity_type}='{entity_name}' ({year}年) 的總業績")
|
| 611 |
|
| 612 |
+
elif not entity_match_data and any(kw in q_lower for kw in ['業績', '營收', '金額', 'sales', 'revenue']):
|
| 613 |
year_match, month_match = re.search(r'(\d{4})\s*年?', question), re.search(r'(\d{1,2})\s*月', question)
|
| 614 |
time_condition, time_log = "", "總"
|
| 615 |
if year_match:
|
| 616 |
year = year_match.group(1); time_condition = f"WHERE strftime('%Y', InvoiceCreditNoteDate) = '{year}'"; time_log = f"{year}年"
|
| 617 |
if month_match: month = month_match.group(1).zfill(2); time_condition += f" AND strftime('%m', InvoiceCreditNoteDate) = '{month}'"; time_log += f"{month}月"
|
| 618 |
self._log(f"🔄 檢測到查詢【{time_log}全局總業績】意圖,啟用模板。", "INFO")
|
| 619 |
+
fixed_sql = f"""SELECT SUM(LocalAmount) AS total_revenue FROM TSR53Invoice {time_condition};"""
|
| 620 |
+
fixes_applied.append(f"模板覆寫: {time_log}全局總業績查詢")
|
| 621 |
|
| 622 |
+
elif lab_group_match_data and any(kw in q_lower for kw in ['測試項目', 'test item']):
|
| 623 |
lab_group_code = lab_group_match_data["codes"][0]
|
| 624 |
target_table = f"JobTimeline_{lab_group_code}"
|
| 625 |
year = (re.search(r'(\d{4})\s*年', question) or ['', datetime.now().strftime('%Y')])[1]
|
|
|
|
| 631 |
time_condition += f" AND strftime('%m', end_time) = '{month}'"
|
| 632 |
month_str = f"{month}月"
|
| 633 |
self._log(f"🔄 檢測到查詢【{lab_group_code}組】完成的【測試項目數】意圖,啟用專屬模板。", "INFO")
|
| 634 |
+
fixed_sql = f"""SELECT COUNT(JobItemKey) AS test_item_count FROM {target_table} WHERE end_time IS NOT NULL AND {time_condition};"""
|
| 635 |
+
fixes_applied.append(f"模板覆寫: 查詢 {lab_group_code}組 在 {year}年{month_str} 完成的測試項目數")
|
| 636 |
|
| 637 |
+
if not fixes_applied:
|
| 638 |
+
self._log("未觸發任何模板,執行常規修正流程...", "DEBUG")
|
| 639 |
+
|
| 640 |
+
dialect_corrections = {
|
| 641 |
+
r'YEAR\s*\(([^)]+)\)': r"strftime('%Y', \1)",
|
| 642 |
+
r"(strftime\('%Y',\s*[^)]+\))\s*=\s*(\d{4})": r"\1 = '\2'",
|
| 643 |
+
r"EXTRACT\s*\(\s*YEAR\s+FROM\s+([^)]+)\s*\)": r"strftime('%Y', \1)"
|
| 644 |
+
}
|
| 645 |
+
for pattern, replacement in dialect_corrections.items():
|
| 646 |
+
if re.search(pattern, fixed_sql, re.IGNORECASE):
|
| 647 |
+
fixed_sql = re.sub(pattern, replacement, fixed_sql, flags=re.IGNORECASE)
|
| 648 |
+
fixes_applied.append(f"修正方言: {pattern}")
|
| 649 |
+
|
| 650 |
+
schema_corrections = {
|
| 651 |
+
'TSR53ReportAuthorization': 'TSR53SampleDescription', 'TSR53TestResult': 'TSR53SampleDescription',
|
| 652 |
+
'JobInvoice': 'TSR53Invoice', 'JobInvoiceAuthorization': 'TSR53Invoice', 'JobInvoiceCreditNote': 'TSR53Invoice',
|
| 653 |
+
'Customer': 'TSR53SampleDescription', 'Customers': 'TSR53SampleDescription',
|
| 654 |
+
'Invoice': 'TSR53Invoice', 'Invoices': 'TSR53Invoice', 'Job': 'JobTimeline', 'Jobs': 'JobsInProgress',
|
| 655 |
+
'Tests': 'TSR53MarsItem', 'TestsLog': 'JobItemsInProgress',
|
| 656 |
+
'AuthorizationDate': 'ReportAuthorization', 'ReportAuthorizationDate': 'ReportAuthorization',
|
| 657 |
+
'LegalAuthorization': 'OverallRating', 'LegalAuthorizationDate': 'ReportAuthorization',
|
| 658 |
+
'TestResult': 'OverallRating', 'Rating': 'OverallRating', 'CustomerName': 'BuyerName', 'InvoiceTo': 'InvoiceToName',
|
| 659 |
+
'Applicant': 'ApplicantName', 'Agent': 'AgentName', 'JobNumber': 'JobNo', 'ReportNo': 'JobNo', 'TestName': 'ItemInvoiceDescriptionJob',
|
| 660 |
+
'CreationDate': 'JobCreation', 'CreateDate': 'JobCreation', 'CompletedDate': 'ReportAuthorization',
|
| 661 |
+
'InvoiceCreditNoteAmount': 'LocalAmount',
|
| 662 |
+
'Amount': 'LocalAmount', 'Price': 'LocalAmount', 'Lab': 'LabGroup'
|
| 663 |
+
}
|
| 664 |
+
for wrong, correct in schema_corrections.items():
|
| 665 |
+
pattern = r'\b' + re.escape(wrong) + r'\b'
|
| 666 |
+
if re.search(pattern, fixed_sql, re.IGNORECASE):
|
| 667 |
+
fixed_sql = re.sub(pattern, correct, fixed_sql, flags=re.IGNORECASE)
|
| 668 |
+
fixes_applied.append(f"映射 Schema: '{wrong}' -> '{correct}'")
|
| 669 |
+
|
| 670 |
+
if any(kw in q_lower for kw in ['幾份', '多少', 'how many', 'count', '數量']) and 'select ' in fixed_sql.lower() and 'count' not in fixed_sql.lower() and 'group by' not in fixed_sql.lower():
|
| 671 |
+
fixed_sql = re.sub(r'SELECT\s+.*?FROM', 'SELECT COUNT(*) FROM', fixed_sql, count=1, flags=re.IGNORECASE)
|
| 672 |
+
fixes_applied.append("修正邏輯: 補全 COUNT(*)")
|
| 673 |
+
|
| 674 |
+
fixed_sql = fixed_sql.strip()
|
| 675 |
+
if not fixed_sql.endswith(';'):
|
| 676 |
+
fixed_sql += ';'
|
| 677 |
+
fixed_sql = re.sub(r'\s+', ' ', fixed_sql).strip()
|
| 678 |
+
|
| 679 |
+
if fixes_applied:
|
| 680 |
+
self._log("🔄 SQL 已被自動修正:", "INFO")
|
| 681 |
+
self._log(f" - 原始 SQL: {original_sql}", "DEBUG")
|
| 682 |
+
for fix in fixes_applied:
|
| 683 |
+
self._log(f" - 應用規則: {fix}", "DEBUG")
|
| 684 |
+
self._log(f" - 修正後 SQL: {fixed_sql}", "INFO")
|
| 685 |
+
else:
|
| 686 |
+
self._log("✅ SQL 驗證通過,無需常規修正。", "INFO")
|
| 687 |
|
| 688 |
+
return fixed_sql
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 689 |
|
| 690 |
def _finalize_sql(self, sql: str, log_message: str) -> Tuple[str, str]:
|
| 691 |
"""一個輔助函數,用於清理最終的SQL並記錄成功日誌。"""
|