Spaces:
Sleeping
Sleeping
| import gradio as gr | |
| from pathlib import Path | |
| import tempfile, datetime, json, shutil, os | |
| from core import generate_report | |
| from rag import build_or_update_index, answer_with_context | |
# Heading text; used both as the Blocks page title and as the Markdown H1.
TITLE = "IR/ESG Report Generator (HF Space, Pro)"

# Short description rendered directly under the heading.
DESC = "CSV/YAML から IR/ESG レポート(HTML/PDF/DOCX)を生成。LLM要約+翻訳・グラフ・ベンチマーク・RAG・Hub保存に対応。"

# Absolute path of the "templates" directory that sits next to this file.
# resolve() already yields an absolute path, so no further normalisation is needed.
TEMPLATES_DIR = str(Path(__file__).resolve().parent.joinpath("templates"))
| import shutil as _shutil | |
def _to_path(upload_obj, tmpdir: Path, filename: str) -> Path:
    """Materialise an uploaded file as ``tmpdir / filename`` and return that path.

    The upload may arrive in several shapes; they are tried in this order:

    * ``str`` or any ``os.PathLike``: path of an existing file, which is copied.
    * ``bytes`` / ``bytearray`` / ``memoryview``: raw content, written as is.
    * object with a ``name`` attribute: ``name`` is treated as a file path
      and the file is copied.
    * object with a ``read()`` method: the content is read and written.
    * ``dict``: a non-empty ``"name"`` or ``"path"`` entry is treated as a
      file path and copied; otherwise a ``"data"`` entry is written.

    Text content (``str``) is encoded as UTF-8 before being written.

    Args:
        upload_obj: The uploaded value in one of the shapes above.
        tmpdir: Existing directory that receives the file.
        filename: Name of the file to create inside ``tmpdir``.

    Returns:
        ``tmpdir / filename``.

    Raises:
        ValueError: ``upload_obj`` is ``None``.
        TypeError: ``upload_obj`` has none of the supported shapes.
    """
    dst = tmpdir / filename
    if upload_obj is None:
        raise ValueError(f"{filename} が未指定です。")

    def _copy_from(src) -> Path:
        # Path() rejects non-path values (e.g. ints) with a TypeError up front.
        _shutil.copy(Path(src), dst)
        return dst

    def _write(data) -> Path:
        if isinstance(data, str):
            data = data.encode("utf-8")
        dst.write_bytes(data)
        return dst

    if isinstance(upload_obj, (str, os.PathLike)):
        return _copy_from(upload_obj)
    if isinstance(upload_obj, (bytes, bytearray, memoryview)):
        return _write(upload_obj)
    # The attribute checks keep their original priority: a temp-file wrapper
    # exposes both ``name`` and ``read``, and copying by name avoids consuming
    # the stream.
    if hasattr(upload_obj, "name"):
        return _copy_from(upload_obj.name)
    if hasattr(upload_obj, "read"):
        return _write(upload_obj.read())
    if isinstance(upload_obj, dict):
        src = upload_obj.get("name") or upload_obj.get("path")
        if src:
            return _copy_from(src)
        if upload_obj.get("data") is not None:
            return _write(upload_obj["data"])
    raise TypeError(f"Unsupported upload type: {type(upload_obj)}")
def _safe_tenant(tenant) -> str:
    """Reduce a free-text tenant name to a token usable in file names and repo paths."""
    raw = str(tenant or "").strip()
    # Keep letters/digits (any script) plus "-", "_" and "."; everything else,
    # notably path separators, becomes "_".
    cleaned = "".join(ch if ch.isalnum() or ch in "-_." else "_" for ch in raw)
    # Dropping leading/trailing dots rules out "." / ".." and hidden-file names.
    return cleaned.strip(".") or "default"


def run(company_yaml, financials_csv, esg_csv, use_llm, lang, template_key,
        tenant, push_to_hub, glossary_yaml, benchmarks_yaml, past_reports_zip):
    """Gradio click handler: build the report files from the uploaded inputs.

    Args:
        company_yaml, financials_csv, esg_csv: Required uploads, in any shape
            accepted by ``_to_path``.
        use_llm: When truthy, ``llm.OpenAILLM`` is imported and instantiated
            and the instance is passed to ``generate_report``.
        lang: Output language, forwarded to ``generate_report``.
        template_key: One of "base", "tcfd", "sasb" ("sasab" is accepted as an
            alias) or "gri"; any other value falls back to the base template.
        tenant: Free-text tenant identifier. Forwarded unchanged to
            ``generate_report``; a sanitised form is used for output file
            names and the Hub path.
        push_to_hub: When truthy, the outputs are uploaded to the dataset repo
            named by the ``HF_DATASET_REPO`` environment variable.
        glossary_yaml, benchmarks_yaml, past_reports_zip: Optional uploads.
            When a past-reports zip is given, ``build_or_update_index`` is
            called on it before the report is generated.

    Returns:
        A 6-tuple ``(status, html_path, pdf_path, docx_path, meta_path,
        html_text)``. On any failure the four paths are ``None``, the last
        item is ``""`` and ``status`` carries the error message. This function
        never raises.
    """
    try:
        if not company_yaml or not financials_csv or not esg_csv:
            return "全ファイルをアップロードしてください。", None, None, None, None, ""

        with tempfile.TemporaryDirectory() as td:
            tdir = Path(td)
            cpath = _to_path(company_yaml, tdir, "company.yaml")
            fpath = _to_path(financials_csv, tdir, "financials.csv")
            epath = _to_path(esg_csv, tdir, "esg.csv")
            gpath = _to_path(glossary_yaml, tdir, "glossary.yaml") if glossary_yaml else None
            bpath = _to_path(benchmarks_yaml, tdir, "benchmarks.yaml") if benchmarks_yaml else None
            rzip = _to_path(past_reports_zip, tdir, "past_reports.zip") if past_reports_zip else None

            index_dir = tdir / "index"
            if rzip:
                build_or_update_index(rzip, index_dir=index_dir)

            outdir = tdir / "out"
            outdir.mkdir(parents=True, exist_ok=True)

            llm = None
            if use_llm:
                try:
                    # Imported lazily so the app still works without the LLM
                    # backend when the checkbox is off.
                    from llm import OpenAILLM
                    llm = OpenAILLM()
                except Exception as e:
                    return f"LLM初期化エラー: {e}", None, None, None, None, ""

            template_name = {
                "base": "base.html.j2",
                "tcfd": "tcfd.html.j2",
                "sasab": "sasb.html.j2",  # kept: historical misspelling of "sasb"
                "sasb": "sasb.html.j2",
                "gri": "gri.html.j2",
            }.get(template_key, "base.html.j2")

            html, pdf, docx, meta_json, html_text = generate_report(
                company_yaml=str(cpath),
                financials_csv=str(fpath),
                esg_csv=str(epath),
                templates_dir=TEMPLATES_DIR,
                template_name=template_name,
                out_html=str(outdir / "report.html"),
                out_pdf=str(outdir / "report.pdf"),
                out_docx=str(outdir / "report.docx"),
                lang=lang,
                llm=llm,
                glossary_path=str(gpath) if gpath else None,
                benchmarks_path=str(bpath) if bpath else None,
                tenant=tenant,
                rag_index_dir=str(index_dir) if rzip else None,
            )

            # The temporary directory disappears when the ``with`` block ends,
            # so the results are copied to ./tmp before being handed to Gradio.
            repo_tmp = Path("./tmp")
            repo_tmp.mkdir(exist_ok=True)
            ts = datetime.datetime.now().strftime("%Y%m%d-%H%M%S")
            # ``tenant`` is user-typed; never splice it into a path unsanitised.
            tenant_slug = _safe_tenant(tenant)
            prefix = f"{tenant_slug}-{ts}"
            html_out = repo_tmp / f"{prefix}.html"
            pdf_out = repo_tmp / f"{prefix}.pdf"
            docx_out = repo_tmp / f"{prefix}.docx"
            meta_out = repo_tmp / f"{prefix}.json"
            _shutil.copy(html, html_out)
            _shutil.copy(pdf, pdf_out)
            _shutil.copy(docx, docx_out)
            meta_out.write_text(
                json.dumps(meta_json, ensure_ascii=False, indent=2), encoding="utf-8"
            )

            status = "生成が完了しました。"
            if push_to_hub:
                try:
                    from huggingface_hub import HfApi
                    api = HfApi()
                    repo_id = os.environ.get("HF_DATASET_REPO", "your-org/ir-esg-reports")
                    base_path = f"{tenant_slug}/{ts}"
                    uploads = [
                        (html_out, "report.html"),
                        (pdf_out, "report.pdf"),
                        (docx_out, "report.docx"),
                        (meta_out, "report.json"),
                    ]
                    for local_path, name in uploads:
                        api.upload_file(
                            path_or_fileobj=str(local_path),
                            path_in_repo=f"{base_path}/{name}",
                            repo_id=repo_id,
                            repo_type="dataset",
                        )
                except Exception as e:
                    # Upload is best-effort: the local files stay valid. The
                    # failure is recorded in the metadata file and surfaced in
                    # the status so it does not go unnoticed.
                    meta_json["hub_error"] = str(e)
                    meta_out.write_text(
                        json.dumps(meta_json, ensure_ascii=False, indent=2),
                        encoding="utf-8",
                    )
                    status += f"(Hub保存に失敗: {e})"

            return status, str(html_out), str(pdf_out), str(docx_out), str(meta_out), html_text
    except Exception as e:
        # Top-level boundary of the UI callback: report the error in the
        # status box instead of letting the request fail.
        import traceback
        tb = traceback.format_exc(limit=20)
        return f"エラー: {e}\n--- trace ---\n{tb}", None, None, None, None, ""
# Gradio UI definition.
# NOTE(review): the listing this was recovered from had lost its indentation;
# which components sit inside each gr.Row() is reconstructed - confirm against
# the deployed layout.
with gr.Blocks(title=TITLE) as demo:
    gr.Markdown(f"# {TITLE}\n{DESC}")

    # Required inputs.
    # NOTE(review): .xlsx is offered for the two data files, yet run() stores
    # them under fixed *.csv names - confirm generate_report copes with that.
    with gr.Row():
        company_yaml = gr.File(
            label="company.yaml(会社情報・年度等)",
            file_types=[".yaml", ".yml"],
        )
        financials_csv = gr.File(
            label="financials.csv(財務KPI)",
            file_types=[".csv", ".xlsx"],
        )
        esg_csv = gr.File(
            label="esg_metrics.csv(ESG指標)",
            file_types=[".csv", ".xlsx"],
        )

    # Generation options.
    # NOTE(review): the label names OPENAI_API_KEY2 - confirm this is the
    # variable the llm module actually reads.
    with gr.Row():
        use_llm = gr.Checkbox(
            label="LLMで要約/翻訳を行う(OPENAI_API_KEY2 必須)",
            value=True,
        )
        lang = gr.Dropdown(
            choices=["ja", "en", "zh", "ko", "de", "fr"],
            value="ja",
            label="出力言語",
        )
        template_key = gr.Dropdown(
            choices=["base", "tcfd", "sasb", "gri"],
            value="base",
            label="テンプレート",
        )
        tenant = gr.Textbox(label="テナント名(会社識別子)", value="HitC")

    # Optional inputs.
    with gr.Row():
        glossary_yaml = gr.File(
            label="glossary.yaml(用語集・任意)",
            file_types=[".yaml", ".yml"],
        )
        benchmarks_yaml = gr.File(
            label="benchmarks.yaml(業界平均など・任意)",
            file_types=[".yaml", ".yml"],
        )
        past_reports_zip = gr.File(
            label="過去レポートZip(RAG用・任意)",
            file_types=[".zip"],
        )

    push_to_hub = gr.Checkbox(
        label="生成物を Hugging Face Hub(Datasets)へ保存",
        value=False,
    )
    run_btn = gr.Button("レポート生成")

    # Outputs, in the same order as the tuple returned by run().
    status = gr.Textbox(label="ステータス", interactive=False)
    html_file = gr.File(label="HTMLダウンロード")
    pdf_file = gr.File(label="PDFダウンロード")
    docx_file = gr.File(label="DOCXダウンロード")
    meta_file = gr.File(label="メタ情報(JSON)")
    html_preview = gr.HTML(label="HTMLプレビュー(抜粋)")

    # The input order must match run()'s positional parameters.
    run_btn.click(
        fn=run,
        inputs=[
            company_yaml,
            financials_csv,
            esg_csv,
            use_llm,
            lang,
            template_key,
            tenant,
            push_to_hub,
            glossary_yaml,
            benchmarks_yaml,
            past_reports_zip,
        ],
        outputs=[
            status,
            html_file,
            pdf_file,
            docx_file,
            meta_file,
            html_preview,
        ],
    )
# Launch the Gradio app only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    demo.launch()