HTMLviewer2_API

Paused

App Files Files Community

tomo2chin2 committed on Apr 9, 2025

Commit

60bdc52

verified ·

1 Parent(s): af31960

Update app.py

Browse files

Files changed (1) hide show

app.py +120 -55

app.py CHANGED Viewed

@@ -28,15 +28,17 @@ logger = logging.getLogger(__name__)
 class GeminiRequest(BaseModel):
     """Geminiへのリクエストデータモデル"""
     text: str
-    extension_percentage: float = 10.0  # デフォルト値8%
-    temperature: float = 0.5  # デフォルト値を0.3に下げて創造性を抑制
     trim_whitespace: bool = True  # 余白トリミングオプション（デフォルト有効）
 class ScreenshotRequest(BaseModel):
     """スクリーンショットリクエストモデル"""
     html_code: str
-    extension_percentage: float = 10.0  # デフォルト値8%
     trim_whitespace: bool = True  # 余白トリミングオプション（デフォルト有効）
 # HTMLのFont Awesomeレイアウトを改善する関数
 def enhance_font_awesome_layout(html_code):
@@ -108,31 +110,74 @@ def enhance_font_awesome_layout(html_code):
     # どちらもない場合は先頭に追加
     return f'<html><head>{fa_fix_css}</head>' + html_code + '</html>'
-def load_system_instruction():
-    """HuggingFaceリポジトリからprompt.txtを直接ダウンロードして読み込む"""
     try:
-        # ファイルを直接ダウンロード
-        logger.info("HuggingFaceリポジトリからprompt.txtをダウンロード中...")
-        file_path = hf_hub_download(
-            repo_id="tomo2chin2/GURAREKOstlyle",
-            filename="prompt.txt",
-            repo_type="dataset"
-        )
-        # ファイルを読み込む
-        with open(file_path, 'r', encoding='utf-8') as file:
-            instruction = file.read()
-        logger.info(f"システムインストラクションを正常に読み込みました: {len(instruction)}バイト")
-        return instruction
     except Exception as e:
-        # エラーが発生した場合
         error_msg = f"システムインストラクションの読み込みに失敗: {str(e)}"
         logger.error(error_msg)
         raise ValueError(error_msg)
-def generate_html_from_text(text, temperature=0.3):
     """テキストからHTMLを生成する"""
     try:
         # APIキーの取得と設定
@@ -148,11 +193,11 @@ def generate_html_from_text(text, temperature=0.3):
         # Gemini APIの設定
         genai.configure(api_key=api_key)
-        # HuggingFaceデータセットからシステムインストラクションを読み込む
-        system_instruction = load_system_instruction()
         # モデル初期化
-        logger.info(f"Gemini APIにリクエストを送信: テキスト長さ = {len(text)}, 温度 = {temperature}")
         # モデル初期化
         model = genai.GenerativeModel(model_name)
@@ -486,11 +531,12 @@ def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0
                 logger.error(f"Error removing temporary file {tmp_path}: {e}")
 # --- Geminiを使った新しい関数 ---
-def text_to_screenshot(text: str, extension_percentage: float, temperature: float = 0.3, trim_whitespace: bool = True) -> Image.Image:
     """テキストをGemini APIでHTMLに変換し、スクリーンショットを生成する統合関数"""
     try:
-        # 1. テキストからHTMLを生成（温度パラメータも渡す）
-        html_code = generate_html_from_text(text, temperature)
         # 2. HTMLからスクリーンショットを生成
         return render_fullpage_screenshot(html_code, extension_percentage, trim_whitespace)
@@ -587,14 +633,17 @@ async def api_text_to_screenshot(request: GeminiRequest):
     テキストからHTMLインフォグラフィックを生成してスクリーンショットを返すAPIエンドポイント
     """
     try:
-        logger.info(f"テキスト→スクリーンショットAPIリクエスト受信。テキスト長さ: {len(request.text)}, 拡張率: {request.extension_percentage}%, 温度: {request.temperature}")
-        # テキストからHTMLを生成してスクリーンショットを作成（温度パラメータも渡す）
         pil_image = text_to_screenshot(
             request.text,
             request.extension_percentage,
             request.temperature,
-            request.trim_whitespace
         )
         if pil_image.size == (1, 1):
@@ -615,14 +664,14 @@ async def api_text_to_screenshot(request: GeminiRequest):
 # --- Gradio Interface Definition ---
 # 入力モードの選択用Radioコンポーネント
-def process_input(input_mode, input_text, extension_percentage, temperature, trim_whitespace):
     """入力モードに応じて適切な処理を行う"""
     if input_mode == "HTML入力":
-        # HTMLモードの場合は既存の処理
         return render_fullpage_screenshot(input_text, extension_percentage, trim_whitespace)
     else:
         # テキスト入力モードの場合はGemini APIを使用
-        return text_to_screenshot(input_text, extension_percentage, temperature, trim_whitespace)
 # Gradio UIの定義
 with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr.themes.Base()) as iface:
@@ -644,23 +693,34 @@ with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr
     )
     with gr.Row():
-        extension_percentage = gr.Slider(
-            minimum=0,
-            maximum=30,
-            step=1.0,
-            value=10,    # デフォルト値10%
-            label="上下高さ拡張率（%）"
-        )
-        # 温度調整スライダー（テキストモード時のみ表示）
-        temperature = gr.Slider(
-            minimum=0.0,
-            maximum=1.0,
-            step=0.1,
-            value=0.5,    # デフォルト値を0.5に下げて創造性を抑制
-            label="生成時の温度（低い=一貫性高、高い=創造性高）",
-            visible=False  # 最初は非表示
-        )
     # 余白トリミングオプション
     trim_whitespace = gr.Checkbox(
@@ -672,21 +732,25 @@ with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr
     submit_btn = gr.Button("生成")
     output_image = gr.Image(type="pil", label="ページ全体のスクリーンショット")
-    # 入力モード変更時のイベント処理（テキストモード時のみ温度スライダーを表示）
-    def update_temperature_visibility(mode):
         # Gradio 4.x用のアップデート方法
-        return {"visible": mode == "テキスト入力", "__type__": "update"}
     input_mode.change(
-        fn=update_temperature_visibility,
         inputs=input_mode,
-        outputs=temperature
     )
     # 生成ボタンクリック時のイベント処理
     submit_btn.click(
         fn=process_input,
-        inputs=[input_mode, input_text, extension_percentage, temperature, trim_whitespace],
         outputs=output_image
     )
@@ -699,6 +763,7 @@ with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr
     ## 設定情報
     - 使用モデル: {gemini_model} (環境変数 GEMINI_MODEL で変更可能)
     """)
 # --- Mount Gradio App onto FastAPI ---

 class GeminiRequest(BaseModel):
     """Geminiへのリクエストデータモデル"""
     text: str
+    extension_percentage: float = 10.0  # デフォルト値10%
+    temperature: float = 0.5  # デフォルト値を0.5に設定
     trim_whitespace: bool = True  # 余白トリミングオプション（デフォルト有効）
+    style: str = "standard"  # デフォルトはstandard
 class ScreenshotRequest(BaseModel):
     """スクリーンショットリクエストモデル"""
     html_code: str
+    extension_percentage: float = 10.0  # デフォルト値10%
     trim_whitespace: bool = True  # 余白トリミングオプション（デフォルト有効）
+    style: str = "standard"  # デフォルトはstandard
 # HTMLのFont Awesomeレイアウトを改善する関数
 def enhance_font_awesome_layout(html_code):
     # どちらもない場合は先頭に追加
     return f'<html><head>{fa_fix_css}</head>' + html_code + '</html>'
+def load_system_instruction(style="standard"):
+    """
+    指定されたスタイルのシステムインストラクションを読み込む
+    Args:
+        style: 使用するスタイル名 (standard, cute, resort, cool, dental)
+    Returns:
+        読み込まれたシステムインストラクション
+    """
     try:
+        # 有効なスタイル一覧
+        valid_styles = ["standard", "cute", "resort", "cool", "dental"]
+        # スタイルの検証
+        if style not in valid_styles:
+            logger.warning(f"無効なスタイル '{style}' が指定されました。デフォルトの 'standard' を使用します。")
+            style = "standard"
+        logger.info(f"スタイル '{style}' のシステムインストラクションを読み込みます")
+        # まず、ローカルのスタイルディレクトリ内のprompt.txtを確認
+        local_path = os.path.join(os.path.dirname(__file__), style, "prompt.txt")
+        # ローカルファイルが存在する場合はそれを使用
+        if os.path.exists(local_path):
+            logger.info(f"ローカルファイルを使用: {local_path}")
+            with open(local_path, 'r', encoding='utf-8') as file:
+                instruction = file.read()
+            return instruction
+        # HuggingFaceリポジトリからのファイル読み込みを試行
+        try:
+            # スタイル固有のファイルパスを指定
+            file_path = hf_hub_download(
+                repo_id="tomo2chin2/GURAREKOstlyle",
+                filename=f"{style}/prompt.txt",
+                repo_type="dataset"
+            )
+            logger.info(f"スタイル '{style}' のプロンプトをHuggingFaceから読み込みました: {file_path}")
+            with open(file_path, 'r', encoding='utf-8') as file:
+                instruction = file.read()
+            return instruction
+        except Exception as style_error:
+            # スタイル固有ファイルの読み込みに失敗した場合、デフォルトのprompt.txtを使用
+            logger.warning(f"スタイル '{style}' のプロンプト読み込みに失敗: {str(style_error)}")
+            logger.info("デフォルトのprompt.txtを読み込みます")
+            file_path = hf_hub_download(
+                repo_id="tomo2chin2/GURAREKOstlyle",
+                filename="prompt.txt",
+                repo_type="dataset"
+            )
+            with open(file_path, 'r', encoding='utf-8') as file:
+                instruction = file.read()
+            logger.info("デフォルトのシステムインストラクションを読み込みました")
+            return instruction
     except Exception as e:
         error_msg = f"システムインストラクションの読み込みに失敗: {str(e)}"
         logger.error(error_msg)
         raise ValueError(error_msg)
+def generate_html_from_text(text, temperature=0.3, style="standard"):
     """テキストからHTMLを生成する"""
     try:
         # APIキーの取得と設定
         # Gemini APIの設定
         genai.configure(api_key=api_key)
+        # 指定されたスタイルのシステムインストラクションを読み込む
+        system_instruction = load_system_instruction(style)
         # モデル初期化
+        logger.info(f"Gemini APIにリクエストを送信: テキスト長さ = {len(text)}, 温度 = {temperature}, スタイル = {style}")
         # モデル初期化
         model = genai.GenerativeModel(model_name)
                 logger.error(f"Error removing temporary file {tmp_path}: {e}")
 # --- Geminiを使った新しい関数 ---
+def text_to_screenshot(text: str, extension_percentage: float, temperature: float = 0.3,
+                    trim_whitespace: bool = True, style: str = "standard") -> Image.Image:
     """テキストをGemini APIでHTMLに変換し、スクリーンショットを生成する統合関数"""
     try:
+        # 1. テキストからHTMLを生成（温度パラメータとスタイルも渡す）
+        html_code = generate_html_from_text(text, temperature, style)
         # 2. HTMLからスクリーンショットを生成
         return render_fullpage_screenshot(html_code, extension_percentage, trim_whitespace)
     テキストからHTMLインフォグラフィックを生成してスクリーンショットを返すAPIエンドポイント
     """
     try:
+        logger.info(f"テキスト→スクリーンショットAPIリクエスト受信。テキスト長さ: {len(request.text)}, "
+                   f"拡張率: {request.extension_percentage}%, 温度: {request.temperature}, "
+                   f"スタイル: {request.style}")
+        # テキストからHTMLを生成してスクリーンショットを作成（温度パラメータとスタイルも渡す）
         pil_image = text_to_screenshot(
             request.text,
             request.extension_percentage,
             request.temperature,
+            request.trim_whitespace,
+            request.style
         )
         if pil_image.size == (1, 1):
 # --- Gradio Interface Definition ---
 # 入力モードの選択用Radioコンポーネント
+def process_input(input_mode, input_text, extension_percentage, temperature, trim_whitespace, style):
     """入力モードに応じて適切な処理を行う"""
     if input_mode == "HTML入力":
+        # HTMLモードの場合は既存の処理（スタイルは使わない）
         return render_fullpage_screenshot(input_text, extension_percentage, trim_whitespace)
     else:
         # テキスト入力モードの場合はGemini APIを使用
+        return text_to_screenshot(input_text, extension_percentage, temperature, trim_whitespace, style)
 # Gradio UIの定義
 with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr.themes.Base()) as iface:
     )
     with gr.Row():
+        with gr.Column(scale=1):
+            # スタイル選択ドロップダウン
+            style_dropdown = gr.Dropdown(
+                choices=["standard", "cute", "resort", "cool", "dental"],
+                value="standard",
+                label="デザインスタイル",
+                info="テキスト→HTML変換時のデザインテーマを選択します",
+                visible=False  # テキスト入力モードの時だけ表示
+            )
+        with gr.Column(scale=2):
+            extension_percentage = gr.Slider(
+                minimum=0,
+                maximum=30,
+                step=1.0,
+                value=10,    # デフォルト値10%
+                label="上下高さ拡張率（%）"
+            )
+            # 温度調整スライダー（テキストモード時のみ表示）
+            temperature = gr.Slider(
+                minimum=0.0,
+                maximum=1.0,
+                step=0.1,
+                value=0.5,    # デフォルト値を0.5に設定
+                label="生成時の温度（低い=一貫性高、高い=創造性高）",
+                visible=False  # 最初は非表示
+            )
     # 余白トリミングオプション
     trim_whitespace = gr.Checkbox(
     submit_btn = gr.Button("生成")
     output_image = gr.Image(type="pil", label="ページ全体のスクリーンショット")
+    # 入力モード変更時のイベント処理（テキストモード時のみ温度スライダーとスタイルドロップダウンを表示）
+    def update_controls_visibility(mode):
         # Gradio 4.x用のアップデート方法
+        is_text_mode = mode == "テキスト入力"
+        return [
+            {"visible": is_text_mode, "__type__": "update"},  # temperature
+            {"visible": is_text_mode, "__type__": "update"},  # style_dropdown
+        ]
     input_mode.change(
+        fn=update_controls_visibility,
         inputs=input_mode,
+        outputs=[temperature, style_dropdown]
     )
     # 生成ボタンクリック時のイベント処理
     submit_btn.click(
         fn=process_input,
+        inputs=[input_mode, input_text, extension_percentage, temperature, trim_whitespace, style_dropdown],
         outputs=output_image
     )
     ## 設定情報
     - 使用モデル: {gemini_model} (環境変数 GEMINI_MODEL で変更可能)
+    - 対応スタイル: standard, cute, resort, cool, dental
     """)
 # --- Mount Gradio App onto FastAPI ---