HTMLviewer3_API_DATASET_URL

Paused

App Files Files Community

tomo2chin2 committed on Apr 19

Commit

4f99fb7

verified ·

1 Parent(s): e2eb5a0

Update app.py

Browse files

Files changed (1) hide show

app.py +405 -179

app.py CHANGED Viewed

@@ -15,7 +15,11 @@ import tempfile
 import time
 import os
 import logging
-from huggingface_hub import hf_hub_download  # 追加: HuggingFace Hubからファイルを直接ダウンロード
 # 正しいGemini関連のインポート
 import google.generativeai as genai
@@ -24,6 +28,88 @@ import google.generativeai as genai
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 # --- Gemini統合 ---
 class GeminiRequest(BaseModel):
     """Geminiへのリクエストデータモデル"""
@@ -40,9 +126,16 @@ class ScreenshotRequest(BaseModel):
     trim_whitespace: bool = True  # 余白トリミングオプション（デフォルト有効）
     style: str = "standard"  # デフォルトはstandard
-# HTMLのFont Awesomeレイアウトを改善する関数
 def enhance_font_awesome_layout(html_code):
-    """Font Awesomeレイアウトを改善するCSSを追加"""
     # CSSを追加
     fa_fix_css = """
     <style>
@@ -96,19 +189,19 @@ def enhance_font_awesome_layout(html_code):
     # headタグがある場合はその中に追加
     if '<head>' in html_code:
-        return html_code.replace('</head>', f'{fa_fix_css}</head>')
     # HTMLタグがある場合はその後に追加
     elif '<html' in html_code:
         head_end = html_code.find('</head>')
         if head_end > 0:
-            return html_code[:head_end] + fa_fix_css + html_code[head_end:]
         else:
             body_start = html_code.find('<body')
             if body_start > 0:
-                return html_code[:body_start] + f'<head>{fa_fix_css}</head>' + html_code[body_start:]
     # どちらもない場合は先頭に追加
-    return f'<html><head>{fa_fix_css}</head>' + html_code + '</html>'
 def load_system_instruction(style="standard"):
     """
@@ -267,11 +360,11 @@ def generate_html_from_text(text, temperature=0.3, style="standard"):
         logger.error(f"HTML生成中にエラーが発生: {e}", exc_info=True)
         raise Exception(f"Gemini APIでのHTML生成に失敗しました: {e}")
-# 画像から余分な空白領域をトリミングする関数
 def trim_image_whitespace(image, threshold=250, padding=10):
     """
-    画像から余分な白い空白をトリミングする
     Args:
         image: PIL.Image - 入力画像
         threshold: int - どの明るさ以上を空白と判断するか (0-255)
@@ -280,64 +373,72 @@ def trim_image_whitespace(image, threshold=250, padding=10):
     Returns:
         トリミングされたPIL.Image
     """
-    # グレースケールに変換
-    gray = image.convert('L')
-    # ピクセルデータを配列として取得
-    data = gray.getdata()
-    width, height = gray.size
-    # 有効範囲を見つける
-    min_x, min_y = width, height
-    max_x = max_y = 0
-    # ピクセルデータを2次元配列に変換して処理
-    pixels = list(data)
-    pixels = [pixels[i * width:(i + 1) * width] for i in range(height)]
-    # 各行をスキャンして非空白ピクセルを見つける
-    for y in range(height):
-        for x in range(width):
-            if pixels[y][x] < threshold:  # 非空白ピクセル
-                min_x = min(min_x, x)
-                min_y = min(min_y, y)
-                max_x = max(max_x, x)
-                max_y = max(max_y, y)
-    # 境界外のトリミングの場合はエラー
-    if min_x > max_x or min_y > max_y:
         logger.warning("トリミング領域が見つかりません。元の画像を返します。")
         return image
-    # パディングを追加
-    min_x = max(0, min_x - padding)
-    min_y = max(0, min_y - padding)
-    max_x = min(width - 1, max_x + padding)
-    max_y = min(height - 1, max_y + padding)
-    # 画像をトリミング
-    trimmed = image.crop((min_x, min_y, max_x + 1, max_y + 1))
-    logger.info(f"画像をトリミングしました: 元サイズ {width}x{height} → トリミング後 {trimmed.width}x{trimmed.height}")
-    return trimmed
-# 非同期スクリプトを使わず、同期的なスクリプトのみ使用する改善版
 def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0,
-                              trim_whitespace: bool = True) -> Image.Image:
     """
     Renders HTML code to a full-page screenshot using Selenium.
     Args:
         html_code: The HTML source code string.
         extension_percentage: Percentage of extra space to add vertically.
         trim_whitespace: Whether to trim excess whitespace from the image.
     Returns:
         A PIL Image object of the screenshot.
     """
     tmp_path = None
-    driver = None
     # 1) Save HTML code to a temporary file
     try:
@@ -347,34 +448,12 @@ def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0
         logger.info(f"HTML saved to temporary file: {tmp_path}")
     except Exception as e:
         logger.error(f"Error writing temporary HTML file: {e}")
         return Image.new('RGB', (1, 1), color=(0, 0, 0))
-    # 2) Headless Chrome(Chromium) options
-    options = Options()
-    options.add_argument("--headless")
-    options.add_argument("--no-sandbox")
-    options.add_argument("--disable-dev-shm-usage")
-    options.add_argument("--force-device-scale-factor=1")
-    options.add_argument("--disable-features=NetworkService")
-    options.add_argument("--dns-prefetch-disable")
-    # 環境変数からWebDriverパスを取得（任意）
-    webdriver_path = os.environ.get("CHROMEDRIVER_PATH")
-    if webdriver_path and os.path.exists(webdriver_path):
-        logger.info(f"Using CHROMEDRIVER_PATH: {webdriver_path}")
-        service = webdriver.ChromeService(executable_path=webdriver_path)
-    else:
-        logger.info("CHROMEDRIVER_PATH not set or invalid, using default PATH lookup.")
-        service = None # Use default behavior
     try:
-        logger.info("Initializing WebDriver...")
-        if service:
-             driver = webdriver.Chrome(service=service, options=options)
-        else:
-             driver = webdriver.Chrome(options=options)
-        logger.info("WebDriver initialized.")
-        # 3) 初期ウィンドウサイズを設定
         initial_width = 1200
         initial_height = 1000
         driver.set_window_size(initial_width, initial_height)
@@ -382,57 +461,68 @@ def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0
         logger.info(f"Navigating to {file_url}")
         driver.get(file_url)
-        # 4) ページ読み込み待機
         logger.info("Waiting for body element...")
-        WebDriverWait(driver, 15).until(
             EC.presence_of_element_located((By.TAG_NAME, "body"))
         )
         logger.info("Body element found. Waiting for resource loading...")
-        # 5) 基本的なリソース読み込み待機 - タイムアウト回避
-        time.sleep(3)
-        # Font Awesome読み込み確認 - 非同期を使わない
-        logger.info("Checking for Font Awesome resources...")
-        fa_count = driver.execute_script("""
-            var icons = document.querySelectorAll('.fa, .fas, .far, .fab, [class*="fa-"]');
-            return icons.length;
-        """)
-        logger.info(f"Found {fa_count} Font Awesome elements")
-        # リソース読み込み状態を確認
-        doc_ready = driver.execute_script("return document.readyState;")
-        logger.info(f"Document ready state: {doc_ready}")
-        # Font Awesomeが多い場合は追加待機
-        if fa_count > 50:
-            logger.info("Many Font Awesome icons detected, waiting additional time")
-            time.sleep(2)
-        # 6) コンテンツレンダリングのためのスクロール処理 - 同期的に実行
         logger.info("Performing content rendering scroll...")
         total_height = driver.execute_script("return Math.max(document.body.scrollHeight, document.documentElement.scrollHeight);")
         viewport_height = driver.execute_script("return window.innerHeight;")
-        scrolls_needed = max(1, total_height // viewport_height)
-        for i in range(scrolls_needed + 1):
-            scroll_pos = i * (viewport_height - 200)  # オーバーラップさせる
             driver.execute_script(f"window.scrollTo(0, {scroll_pos});")
-            time.sleep(0.2)  # 短い待機
         # トップに戻る
         driver.execute_script("window.scrollTo(0, 0);")
-        time.sleep(0.5)
         logger.info("Scroll rendering completed")
-        # 7) スクロールバーを非表示に
         driver.execute_script("""
             document.documentElement.style.overflow = 'hidden';
             document.body.style.overflow = 'hidden';
         """)
-        logger.info("Scrollbars hidden")
-        # 8) ページの寸法を取得
         dimensions = driver.execute_script("""
             return {
                 width: Math.max(
@@ -457,57 +547,26 @@ def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0
         scroll_height = dimensions['height']
         logger.info(f"Detected dimensions: width={scroll_width}, height={scroll_height}")
-        # 再検証 - 短いスクロールで再確認
-        driver.execute_script("window.scrollTo(0, document.body.scrollHeight);")
-        time.sleep(0.5)
-        driver.execute_script("window.scrollTo(0, 0);")
-        time.sleep(0.5)
-        dimensions_after = driver.execute_script("return {height: Math.max(document.documentElement.scrollHeight, document.body.scrollHeight)};")
-        scroll_height = max(scroll_height, dimensions_after['height'])
-        logger.info(f"After scroll check, height={scroll_height}")
         # 最小/最大値の設定
         scroll_width = max(scroll_width, 100)
         scroll_height = max(scroll_height, 100)
         scroll_width = min(scroll_width, 2000)
         scroll_height = min(scroll_height, 4000)
-        # 9) レイアウト安定化のための単純な待機 - タイムアウト回避
-        logger.info("Waiting for layout stabilization...")
-        time.sleep(2)
-        # 10) 高さに余白を追加
         adjusted_height = int(scroll_height * (1 + extension_percentage / 100.0))
         adjusted_height = max(adjusted_height, scroll_height, 100)
-        logger.info(f"Adjusted height calculated: {adjusted_height} (extension: {extension_percentage}%)")
-        # 11) ウィンドウサイズを調整
         adjusted_width = scroll_width
         logger.info(f"Resizing window to: width={adjusted_width}, height={adjusted_height}")
         driver.set_window_size(adjusted_width, adjusted_height)
-        time.sleep(1)
-        # リソース状態を確認 - 同期的スクリプト
-        resource_state = driver.execute_script("""
-            return {
-                readyState: document.readyState,
-                resourcesComplete: !document.querySelector('img:not([complete])') &&
-                                  !document.querySelector('link[rel="stylesheet"]:not([loaded])')
-            };
-        """)
-        logger.info(f"Resource state: {resource_state}")
-        if resource_state['readyState'] != 'complete':
-            logger.info("Document still loading, waiting additional time...")
-            time.sleep(1)
-        # トップにスクロール
-        driver.execute_script("window.scrollTo(0, 0);")
-        time.sleep(0.5)
-        logger.info("Scrolled to top.")
-        # 12) スクリーンショット取得
         logger.info("Taking screenshot...")
         png = driver.get_screenshot_as_png()
         logger.info("Screenshot taken successfully.")
@@ -516,7 +575,7 @@ def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0
         img = Image.open(BytesIO(png))
         logger.info(f"Screenshot dimensions: {img.width}x{img.height}")
-        # 余白トリミング
         if trim_whitespace:
             img = trim_image_whitespace(img, threshold=248, padding=20)
             logger.info(f"Trimmed dimensions: {img.width}x{img.height}")
@@ -525,37 +584,200 @@ def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0
     except Exception as e:
         logger.error(f"Error during screenshot generation: {e}", exc_info=True)
-        # Return a small black image on error
         return Image.new('RGB', (1, 1), color=(0, 0, 0))
     finally:
         logger.info("Cleaning up...")
-        if driver:
-            try:
-                driver.quit()
-                logger.info("WebDriver quit successfully.")
-            except Exception as e:
-                logger.error(f"Error quitting WebDriver: {e}", exc_info=True)
         if tmp_path and os.path.exists(tmp_path):
             try:
                 os.remove(tmp_path)
                 logger.info(f"Temporary file {tmp_path} removed.")
             except Exception as e:
-                logger.error(f"Error removing temporary file {tmp_path}: {e}", exc_info=True)
-# --- Geminiを使った新しい関数 ---
-def text_to_screenshot(text: str, extension_percentage: float, temperature: float = 0.3,
-                    trim_whitespace: bool = True, style: str = "standard") -> Image.Image:
-    """テキストをGemini APIでHTMLに変換し、スクリーンショットを生成する統合関数"""
     try:
-        # 1. テキストからHTMLを生成（温度パラメータとスタイルも渡す）
-        html_code = generate_html_from_text(text, temperature, style)
-        # 2. HTMLからスクリーンショットを生成
-        return render_fullpage_screenshot(html_code, extension_percentage, trim_whitespace)
     except Exception as e:
-        logger.error(f"テキストからスクリーンショット生成中にエラーが発生: {e}", exc_info=True)
         return Image.new('RGB', (1, 1), color=(0, 0, 0))  # エラー時は黒画像
 # --- FastAPI Setup ---
 app = FastAPI()
@@ -611,7 +833,7 @@ async def api_render_screenshot(request: ScreenshotRequest):
     """
     try:
         logger.info(f"API request received. Extension: {request.extension_percentage}%")
-        # Run the blocking Selenium code in a separate thread (FastAPI handles this)
         pil_image = render_fullpage_screenshot(
             request.html_code,
             request.extension_percentage,
@@ -635,7 +857,7 @@ async def api_render_screenshot(request: ScreenshotRequest):
         logger.error(f"API Error: {e}", exc_info=True)
         raise HTTPException(status_code=500, detail=f"Internal Server Error: {e}")
-# --- 新しいGemini API連携エンドポイント ---
 @app.post("/api/text-to-screenshot",
           response_class=StreamingResponse,
           tags=["Screenshot", "Gemini"],
@@ -650,8 +872,8 @@ async def api_text_to_screenshot(request: GeminiRequest):
                    f"拡張率: {request.extension_percentage}%, 温度: {request.temperature}, "
                    f"スタイル: {request.style}")
-        # テキストからHTMLを生成してスクリーンショットを作成（温度パラメータとスタイルも渡す）
-        pil_image = text_to_screenshot(
             request.text,
             request.extension_percentage,
             request.temperature,
@@ -661,8 +883,6 @@ async def api_text_to_screenshot(request: GeminiRequest):
         if pil_image.size == (1, 1):
             logger.error("スクリーンショット生成に失敗しました。1x1エラー画像を返します。")
-            # raise HTTPException(status_code=500, detail="スクリーンショット生成に失敗しました")
         # PIL画像をPNGバイトに変換
         img_byte_arr = BytesIO()
@@ -684,13 +904,14 @@ def process_input(input_mode, input_text, extension_percentage, temperature, tri
         # HTMLモードの場合は既存の処理（スタイルは使わない）
         return render_fullpage_screenshot(input_text, extension_percentage, trim_whitespace)
     else:
-        # テキスト入力モードの場合はGemini APIを使用
-        return text_to_screenshot(input_text, extension_percentage, temperature, trim_whitespace, style)
 # Gradio UIの定義
 with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr.themes.Base()) as iface:
     gr.Markdown("# HTMLビューア & テキスト→インフォグラフィック変換")
     gr.Markdown("HTMLコードをレンダリングするか、テキストをGemini APIでインフォグラフィックに変換して画像として取得します。")
     with gr.Row():
         input_mode = gr.Radio(
@@ -778,6 +999,7 @@ with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr
     ## 設定情報
     - 使用モデル: {gemini_model} (環境変数 GEMINI_MODEL で変更可能)
     - 対応スタイル: standard, cute, resort, cool, dental
     """)
 # --- Mount Gradio App onto FastAPI ---
@@ -787,4 +1009,8 @@ app = gr.mount_gradio_app(app, iface, path="/")
 if __name__ == "__main__":
     import uvicorn
     logger.info("Starting Uvicorn server for local development...")
-    uvicorn.run(app, host="0.0.0.0", port=7860)

 import time
 import os
 import logging
+import numpy as np  # 追加: 画像処理の最適化用
+import threading  # 追加: 並列処理のため
+import queue  # 追加: WebDriverプール用
+from concurrent.futures import ThreadPoolExecutor  # 追加: 並列処理用
+from huggingface_hub import hf_hub_download
 # 正しいGemini関連のインポート
 import google.generativeai as genai
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
+# --- WebDriverプールの実装 ---
class WebDriverPool:
    """Bounded pool of reusable headless Chrome WebDriver instances.

    Idle drivers wait in ``driver_queue``. ``count`` is the number of drivers
    the pool has created and not yet discarded; it is only modified while
    holding ``lock``.
    """

    def __init__(self, max_drivers=3):
        """Create an empty pool.

        Args:
            max_drivers: Upper bound on the number of drivers the pool creates.
        """
        self.driver_queue = queue.Queue()
        self.max_drivers = max_drivers
        self.lock = threading.Lock()
        self.count = 0
        logger.info(f"WebDriverプールを初期化: 最大 {max_drivers} ドライバー")

    def _create_driver(self):
        """Launch a new headless Chrome driver with the pool's standard options."""
        options = Options()
        for flag in (
            "--headless",
            "--no-sandbox",
            "--disable-dev-shm-usage",
            "--force-device-scale-factor=1",
            "--disable-features=NetworkService",
            "--dns-prefetch-disable",
        ):
            options.add_argument(flag)

        # Optional explicit chromedriver location taken from the environment.
        webdriver_path = os.environ.get("CHROMEDRIVER_PATH")
        if webdriver_path and os.path.exists(webdriver_path):
            logger.info(f"CHROMEDRIVER_PATH使用: {webdriver_path}")
            service = webdriver.ChromeService(executable_path=webdriver_path)
            return webdriver.Chrome(service=service, options=options)

        logger.info("デフォルトのChromeDriverを使用")
        return webdriver.Chrome(options=options)

    def _discard_slot(self):
        """Give back one creation slot, never letting ``count`` go negative."""
        with self.lock:
            self.count = max(0, self.count - 1)

    def get_driver(self):
        """Return an idle driver, create one if allowed, or wait for a release.

        Returns:
            A WebDriver instance that the caller must hand back through
            ``release_driver``.

        Raises:
            Exception: Whatever driver creation raised. The reserved slot is
                released first, so a failed launch does not shrink the pool.
        """
        # Non-blocking take: avoids the race between empty() and a blocking
        # get() when another thread grabs the last idle driver in between.
        try:
            driver = self.driver_queue.get_nowait()
        except queue.Empty:
            pass
        else:
            logger.info("既存のWebDriverをプールから取得")
            return driver

        # Reserve a slot under the lock, but launch Chrome outside of it so a
        # slow start-up does not stall every other pool operation.
        with self.lock:
            slot_reserved = self.count < self.max_drivers
            if slot_reserved:
                self.count += 1
                logger.info(f"新しいWebDriverを作成 (合計: {self.count}/{self.max_drivers})")

        if slot_reserved:
            try:
                return self._create_driver()
            except Exception:
                self._discard_slot()
                raise

        # Pool is at capacity: block until some driver is released.
        logger.info("WebDriverプールがいっぱいです。利用可能なドライバーを待機中...")
        return self.driver_queue.get()

    def release_driver(self, driver):
        """Reset a driver and put it back in the pool.

        A driver that cannot be reset is quit and its slot is released. A
        failure while quitting is logged instead of raised, because this
        method is called from the ``finally`` clause of the renderer.

        Args:
            driver: The WebDriver to return; falsy values are ignored.
        """
        if not driver:
            return

        try:
            # Reset the browser so the next user starts from a blank page.
            driver.get("about:blank")
            driver.execute_script("""
                    document.documentElement.style.overflow = '';
                    document.body.style.overflow = '';
                """)
            self.driver_queue.put(driver)
            logger.info("WebDriverをプールに戻しました")
        except Exception as e:
            logger.error(f"ドライバーをプールに戻す際にエラー: {e}")
            try:
                driver.quit()
            except Exception as quit_error:
                logger.error(f"ドライバー終了中にエラー: {quit_error}")
            finally:
                self._discard_slot()

    def close_all(self):
        """Quit every idle driver in the queue and reset ``count`` to zero."""
        logger.info("WebDriverプールを終了します")
        closed = 0
        while True:
            try:
                driver = self.driver_queue.get_nowait()
            except queue.Empty:
                break
            try:
                driver.quit()
                closed += 1
            except Exception as e:
                logger.error(f"ドライバー終了中にエラー: {e}")

        logger.info(f"{closed}個のWebDriverを終了しました")
        with self.lock:
            self.count = 0
+# グローバルなWebDriverプールを作成
+# サーバー環境のリソースに合わせて調整
+driver_pool = WebDriverPool(max_drivers=int(os.environ.get("MAX_WEBDRIVERS", "3")))
 # --- Gemini統合 ---
 class GeminiRequest(BaseModel):
     """Geminiへのリクエストデータモデル"""
     trim_whitespace: bool = True  # 余白トリミングオプション（デフォルト有効）
     style: str = "standard"  # デフォルトはstandard
+# HTMLのFont Awesomeレイアウトを改善する関数 - プリロード機能を追加
 def enhance_font_awesome_layout(html_code):
+    """Font Awesomeレイアウトを改善し、プリロードタグを追加"""
+    # Font Awesomeリソースのプリロード - パフォーマンス向上
+    fa_preload = """
+    <link rel="preload" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/5.15.4/webfonts/fa-solid-900.woff2" as="font" type="font/woff2" crossorigin>
+    <link rel="preload" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/5.15.4/webfonts/fa-regular-400.woff2" as="font" type="font/woff2" crossorigin>
+    <link rel="preload" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/5.15.4/webfonts/fa-brands-400.woff2" as="font" type="font/woff2" crossorigin>
+    """
     # CSSを追加
     fa_fix_css = """
     <style>
     # headタグがある場合はその中に追加
     if '<head>' in html_code:
+        return html_code.replace('</head>', f'{fa_preload}{fa_fix_css}</head>')
     # HTMLタグがある場合はその後に追加
     elif '<html' in html_code:
         head_end = html_code.find('</head>')
         if head_end > 0:
+            return html_code[:head_end] + fa_preload + fa_fix_css + html_code[head_end:]
         else:
             body_start = html_code.find('<body')
             if body_start > 0:
+                return html_code[:body_start] + f'<head>{fa_preload}{fa_fix_css}</head>' + html_code[body_start:]
     # どちらもない場合は先頭に追加
+    return f'<html><head>{fa_preload}{fa_fix_css}</head>' + html_code + '</html>'
 def load_system_instruction(style="standard"):
     """
         logger.error(f"HTML生成中にエラーが発生: {e}", exc_info=True)
         raise Exception(f"Gemini APIでのHTML生成に失敗しました: {e}")
+# 画像から余分な空白領域をトリミングする関数 - NumPyを使って最適化
 def trim_image_whitespace(image, threshold=250, padding=10):
     """
+    NumPyを使用して最適化された画像トリミング関数
     Args:
         image: PIL.Image - 入力画像
         threshold: int - どの明るさ以上を空白と判断するか (0-255)
     Returns:
         トリミングされたPIL.Image
     """
+    try:
+        # グレースケールに変換
+        gray = image.convert('L')
+        # NumPy配列として取得（高速処理のため）
+        np_image = np.array(gray)
+        # マスク作成（非白ピクセル）
+        mask = np_image < threshold
+        # マスクから行と列のインデックスを取得
+        rows = np.any(mask, axis=1)
+        cols = np.any(mask, axis=0)
+        # 非空のインデックス範囲を取得
+        if np.any(rows) and np.any(cols):
+            row_indices = np.where(rows)[0]
+            col_indices = np.where(cols)[0]
+            # 範囲取得
+            min_y, max_y = row_indices[0], row_indices[-1]
+            min_x, max_x = col_indices[0], col_indices[-1]
+            # パディング追加
+            min_x = max(0, min_x - padding)
+            min_y = max(0, min_y - padding)
+            max_x = min(image.width - 1, max_x + padding)
+            max_y = min(image.height - 1, max_y + padding)
+            # 画像をトリミング
+            trimmed = image.crop((min_x, min_y, max_x + 1, max_y + 1))
+            logger.info(f"画像をトリミングしました: 元サイズ {image.width}x{image.height} → トリミング後 {trimmed.width}x{trimmed.height}")
+            return trimmed
         logger.warning("トリミング領域が見つかりません。元の画像を返します。")
         return image
+    except Exception as e:
+        logger.error(f"画像トリミング中にエラー: {e}", exc_info=True)
+        return image  # エラー時は元の画像を返す
+# 最適化されたスクリーンショット生成関数 - 外部から初期化済みドライバーを受け取れるように
 def render_fullpage_screenshot(html_code: str, extension_percentage: float = 6.0,
+                              trim_whitespace: bool = True, driver=None) -> Image.Image:
     """
     Renders HTML code to a full-page screenshot using Selenium.
+    Optimized to accept an external driver or get one from the pool.
     Args:
         html_code: The HTML source code string.
         extension_percentage: Percentage of extra space to add vertically.
         trim_whitespace: Whether to trim excess whitespace from the image.
+        driver: An optional pre-initialized WebDriver instance.
     Returns:
         A PIL Image object of the screenshot.
     """
     tmp_path = None
+    driver_from_pool = False
+    # ドライバーがない場合はプールから取得
+    if driver is None:
+        driver = driver_pool.get_driver()
+        driver_from_pool = True
+        logger.info("WebDriverプールからドライバーを取得しました")
     # 1) Save HTML code to a temporary file
     try:
         logger.info(f"HTML saved to temporary file: {tmp_path}")
     except Exception as e:
         logger.error(f"Error writing temporary HTML file: {e}")
+        if driver_from_pool:
+            driver_pool.release_driver(driver)
         return Image.new('RGB', (1, 1), color=(0, 0, 0))
     try:
+        # ウィンドウサイズ初期設定
         initial_width = 1200
         initial_height = 1000
         driver.set_window_size(initial_width, initial_height)
         logger.info(f"Navigating to {file_url}")
         driver.get(file_url)
+        # ページ読み込み待機 - 動的な待機時間を実装
         logger.info("Waiting for body element...")
+        WebDriverWait(driver, 10).until(
             EC.presence_of_element_located((By.TAG_NAME, "body"))
         )
         logger.info("Body element found. Waiting for resource loading...")
+        # リソース読み込みの動的待機 - 最適化
+        max_wait = 3  # 最大待機時間（秒）
+        wait_increment = 0.2  # 確認間隔
+        wait_time = 0
+        while wait_time < max_wait:
+            resource_state = driver.execute_script("""
+                return {
+                    complete: document.readyState === 'complete',
+                    imgCount: document.images.length,
+                    imgLoaded: Array.from(document.images).filter(img => img.complete).length,
+                    faElements: document.querySelectorAll('.fa, .fas, .far, .fab, [class*="fa-"]').length
+                };
+            """)
+            # ドキュメント完了かつ画像が読み込まれている場合、待機終了
+            if resource_state['complete'] and (resource_state['imgCount'] == 0 or
+                                             resource_state['imgLoaded'] == resource_state['imgCount']):
+                logger.info(f"リソース読み込み完了: {resource_state}")
+                break
+            time.sleep(wait_increment)
+            wait_time += wait_increment
+            logger.info(f"リソース待機中... {wait_time:.1f}秒経過, 状態: {resource_state}")
+        # Font Awesome要素が多い場合は追加待機
+        fa_count = resource_state.get('faElements', 0)
+        if fa_count > 30:
+            logger.info(f"{fa_count}個のFont Awesome要素があるため、追加待機...")
+            time.sleep(min(1.0, fa_count / 100))  # 要素数に応じて待機（最大1秒）
+        # コンテンツレンダリングのためのスクロール処理 - パフォーマンス改善
         logger.info("Performing content rendering scroll...")
         total_height = driver.execute_script("return Math.max(document.body.scrollHeight, document.documentElement.scrollHeight);")
         viewport_height = driver.execute_script("return window.innerHeight;")
+        scrolls_needed = max(1, min(5, total_height // viewport_height))  # 最大5回までに制限
+        # スクロール処理の高速化
+        for i in range(scrolls_needed):
+            scroll_pos = i * (viewport_height - 100)  # 少しだけオーバーラップ
             driver.execute_script(f"window.scrollTo(0, {scroll_pos});")
+            time.sleep(0.1)  # 高速化のため待機時間短縮
         # トップに戻る
         driver.execute_script("window.scrollTo(0, 0);")
+        time.sleep(0.2)  # 短い待機に変更
         logger.info("Scroll rendering completed")
+        # スクロールバーを非表示に
         driver.execute_script("""
             document.documentElement.style.overflow = 'hidden';
             document.body.style.overflow = 'hidden';
         """)
+        # ページの寸法を取得
         dimensions = driver.execute_script("""
             return {
                 width: Math.max(
         scroll_height = dimensions['height']
         logger.info(f"Detected dimensions: width={scroll_width}, height={scroll_height}")
         # 最小/最大値の設定
         scroll_width = max(scroll_width, 100)
         scroll_height = max(scroll_height, 100)
         scroll_width = min(scroll_width, 2000)
         scroll_height = min(scroll_height, 4000)
+        # レイアウト安定化のための待機 - 短縮
+        time.sleep(0.5)  # 2秒から0.5秒に短縮
+        # 高さに余白を追加
         adjusted_height = int(scroll_height * (1 + extension_percentage / 100.0))
         adjusted_height = max(adjusted_height, scroll_height, 100)
+        # ウィンドウサイズを調整
         adjusted_width = scroll_width
         logger.info(f"Resizing window to: width={adjusted_width}, height={adjusted_height}")
         driver.set_window_size(adjusted_width, adjusted_height)
+        time.sleep(0.5)  # 短縮した待機時間
+        # スクリーンショット取得
         logger.info("Taking screenshot...")
         png = driver.get_screenshot_as_png()
         logger.info("Screenshot taken successfully.")
         img = Image.open(BytesIO(png))
         logger.info(f"Screenshot dimensions: {img.width}x{img.height}")
+        # 余白トリミング - 最適化版を使用
         if trim_whitespace:
             img = trim_image_whitespace(img, threshold=248, padding=20)
             logger.info(f"Trimmed dimensions: {img.width}x{img.height}")
     except Exception as e:
         logger.error(f"Error during screenshot generation: {e}", exc_info=True)
+        # エラー時は小さい黒画像を返す
         return Image.new('RGB', (1, 1), color=(0, 0, 0))
     finally:
         logger.info("Cleaning up...")
+        # WebDriverプールに戻す
+        if driver_from_pool:
+            driver_pool.release_driver(driver)
+            logger.info("Returned driver to pool")
+        # 一時ファイル削除
         if tmp_path and os.path.exists(tmp_path):
             try:
                 os.remove(tmp_path)
                 logger.info(f"Temporary file {tmp_path} removed.")
             except Exception as e:
+                logger.error(f"Error removing temporary file {tmp_path}: {e}")
+# --- 並列処理を活用した新しい関数 ---
+def text_to_screenshot_parallel(text: str, extension_percentage: float, temperature: float = 0.3,
+                             trim_whitespace: bool = True, style: str = "standard") -> Image.Image:
+    """テキストをGemini APIでHTMLに変換し、並列処理でスクリーンショットを生成する関数"""
+    start_time = time.time()
+    logger.info("並列処理によるテキスト→スクリーンショット生成を開始")
     try:
+        # WebDriverと HTML生成を並列で実行
+        with ThreadPoolExecutor(max_workers=2) as executor:
+            # Gemini APIリクエストタスク
+            html_future = executor.submit(
+                generate_html_from_text,
+                text=text,
+                temperature=temperature,
+                style=style
+            )
+            # WebDriver初期化タスク - プール使用
+            driver_future = executor.submit(driver_pool.get_driver)
+            # 結果を取得
+            html_code = html_future.result()
+            driver = driver_future.result()
+        # ドライバーはプールから取得しているためフラグ設定
+        driver_from_pool = True
+        # HTMLコードとドライバーが準備できたらスクリーンショット生成
+        logger.info(f"HTML生成完了：{len(html_code)}文字。スクリーンショット生成開始。")
+        # レンダリング前にドライバーの初期設定
+        tmp_path = None
+        try:
+            # 一時ファイルにHTMLを保存
+            with tempfile.NamedTemporaryFile(suffix=".html", delete=False, mode='w', encoding='utf-8') as tmp_file:
+                tmp_path = tmp_file.name
+                tmp_file.write(html_code)
+            logger.info(f"HTMLを一時ファイルに保存: {tmp_path}")
+            # ウィンドウサイズ初期設定
+            initial_width = 1200
+            initial_height = 1000
+            driver.set_window_size(initial_width, initial_height)
+            file_url = "file://" + tmp_path
+            logger.info(f"ページに移動: {file_url}")
+            driver.get(file_url)
+            # ここからスクリーンショット生成ロジック（前の実装と同様）
+            # ページ読み込み待機 - 動的な待機時間を実装
+            logger.info("body要素を待機...")
+            WebDriverWait(driver, 10).until(
+                EC.presence_of_element_located((By.TAG_NAME, "body"))
+            )
+            logger.info("body要素を検出。リソース読み込みを待機...")
+            # リソース読み込みの動的待機 - 最適化
+            max_wait = 3  # 最大待機時間（秒）
+            wait_increment = 0.2  # 確認間隔
+            wait_time = 0
+            while wait_time < max_wait:
+                resource_state = driver.execute_script("""
+                    return {
+                        complete: document.readyState === 'complete',
+                        imgCount: document.images.length,
+                        imgLoaded: Array.from(document.images).filter(img => img.complete).length,
+                        faElements: document.querySelectorAll('.fa, .fas, .far, .fab, [class*="fa-"]').length
+                    };
+                """)
+                # ドキュメント完了かつ画像が読み込まれている場合、待機終了
+                if resource_state['complete'] and (resource_state['imgCount'] == 0 or
+                                                 resource_state['imgLoaded'] == resource_state['imgCount']):
+                    logger.info(f"リソース読み込み完了: {resource_state}")
+                    break
+                time.sleep(wait_increment)
+                wait_time += wait_increment
+            # Font Awesome要素が多い場合は追加待機
+            fa_count = resource_state.get('faElements', 0)
+            if fa_count > 30:
+                logger.info(f"{fa_count}個のFont Awesome要素があるため、追加待機...")
+                time.sleep(min(0.5, fa_count / 200))  # 要素数に応じて待機（最大0.5秒）
+            # コンテンツレンダリングのための簡易スクロール
+            driver.execute_script("window.scrollTo(0, document.body.scrollHeight);")
+            time.sleep(0.2)
+            driver.execute_script("window.scrollTo(0, 0);")
+            time.sleep(0.2)
+            # スクロールバーを非表示に
+            driver.execute_script("""
+                document.documentElement.style.overflow = 'hidden';
+                document.body.style.overflow = 'hidden';
+            """)
+            # ページの寸法を取得
+            dimensions = driver.execute_script("""
+                return {
+                    width: Math.max(
+                        document.documentElement.scrollWidth,
+                        document.documentElement.offsetWidth,
+                        document.documentElement.clientWidth,
+                        document.body ? document.body.scrollWidth : 0,
+                        document.body ? document.body.offsetWidth : 0,
+                        document.body ? document.body.clientWidth : 0
+                    ),
+                    height: Math.max(
+                        document.documentElement.scrollHeight,
+                        document.documentElement.offsetHeight,
+                        document.documentElement.clientHeight,
+                        document.body ? document.body.scrollHeight : 0,
+                        document.body ? document.body.offsetHeight : 0,
+                        document.body ? document.body.clientHeight : 0
+                    )
+                };
+            """)
+            scroll_width = dimensions['width']
+            scroll_height = dimensions['height']
+            # 最小/最大値の設定
+            scroll_width = max(scroll_width, 100)
+            scroll_height = max(scroll_height, 100)
+            scroll_width = min(scroll_width, 2000)
+            scroll_height = min(scroll_height, 4000)
+            # 高さに余白を追加
+            adjusted_height = int(scroll_height * (1 + extension_percentage / 100.0))
+            adjusted_height = max(adjusted_height, scroll_height, 100)
+            # ウィンドウサイズを調整
+            driver.set_window_size(scroll_width, adjusted_height)
+            time.sleep(0.2)
+            # スクリーンショット取得
+            logger.info("スクリーンショットを撮影...")
+            png = driver.get_screenshot_as_png()
+            # PIL画像に変換
+            img = Image.open(BytesIO(png))
+            logger.info(f"スクリーンショットサイズ: {img.width}x{img.height}")
+            # 余白トリミング
+            if trim_whitespace:
+                img = trim_image_whitespace(img, threshold=248, padding=20)
+                logger.info(f"トリミング後のサイズ: {img.width}x{img.height}")
+            elapsed = time.time() - start_time
+            logger.info(f"並列処理による生成完了。所要時間: {elapsed:.2f}秒")
+            return img
+        except Exception as e:
+            logger.error(f"スクリーンショット生成中にエラー: {e}", exc_info=True)
+            return Image.new('RGB', (1, 1), color=(0, 0, 0))
+        finally:
+            # WebDriverプールに戻す
+            if driver_from_pool:
+                driver_pool.release_driver(driver)
+            # 一時ファイル削除
+            if tmp_path and os.path.exists(tmp_path):
+                try:
+                    os.remove(tmp_path)
+                except Exception as e:
+                    logger.error(f"一時ファイル削除エラー: {e}")
     except Exception as e:
+        logger.error(f"並列処理中のエラー: {e}", exc_info=True)
         return Image.new('RGB', (1, 1), color=(0, 0, 0))  # エラー時は黒画像
+# Keep the legacy (non-parallel) entry point as well, for compatibility.
+def text_to_screenshot(text: str, extension_percentage: float, temperature: float = 0.3,
+                    trim_whitespace: bool = True, style: str = "standard") -> Image.Image:
+    """Legacy entry point: convert text to HTML via the Gemini API and screenshot it.
+
+    This function does no work of its own. It forwards all five arguments,
+    positionally and unchanged, to ``text_to_screenshot_parallel`` and
+    returns that call's result.
+
+    Args:
+        text: Input text to be converted; forwarded as-is.
+        extension_percentage: Forwarded as-is.
+        temperature: Forwarded as-is (defaults to 0.3).
+        trim_whitespace: Forwarded as-is (defaults to True).
+        style: Forwarded as-is (defaults to "standard").
+
+    Returns:
+        Whatever ``text_to_screenshot_parallel`` returns (annotated here as
+        a PIL image).
+        NOTE(review): callers elsewhere in this file treat a 1x1 image as a
+        failure marker - confirm against ``text_to_screenshot_parallel``.
+    """
+    # Delegate to the parallel implementation.
+    return text_to_screenshot_parallel(text, extension_percentage, temperature, trim_whitespace, style)
 # --- FastAPI Setup ---
 app = FastAPI()
     """
     try:
         logger.info(f"API request received. Extension: {request.extension_percentage}%")
+        # Run the blocking Selenium code (now using the pooled version)
         pil_image = render_fullpage_screenshot(
             request.html_code,
             request.extension_percentage,
         logger.error(f"API Error: {e}", exc_info=True)
         raise HTTPException(status_code=500, detail=f"Internal Server Error: {e}")
+# --- 新しいGemini API連携エンドポイント（並列処理版） ---
 @app.post("/api/text-to-screenshot",
           response_class=StreamingResponse,
           tags=["Screenshot", "Gemini"],
                    f"拡張率: {request.extension_percentage}%, 温度: {request.temperature}, "
                    f"スタイル: {request.style}")
+        # 並列処理版を使用
+        pil_image = text_to_screenshot_parallel(
             request.text,
             request.extension_percentage,
             request.temperature,
         if pil_image.size == (1, 1):
             logger.error("スクリーンショット生成に失敗しました。1x1エラー画像を返します。")
         # PIL画像をPNGバイトに変換
         img_byte_arr = BytesIO()
         # HTMLモードの場合は既存の処理（スタイルは使わない）
         return render_fullpage_screenshot(input_text, extension_percentage, trim_whitespace)
     else:
+        # テキスト入力モードの場合はGemini APIを使用（並列処理版）
+        return text_to_screenshot_parallel(input_text, extension_percentage, temperature, trim_whitespace, style)
 # Gradio UIの定義
 with gr.Blocks(title="Full Page Screenshot (テキスト変換対応)", theme=gr.themes.Base()) as iface:
     gr.Markdown("# HTMLビューア & テキスト→インフォグラフィック変換")
     gr.Markdown("HTMLコードをレンダリングするか、テキストをGemini APIでインフォグラフィックに変換して画像として取得します。")
+    gr.Markdown("**パフォーマンス向上版**: 並列処理と最適化により処理時間を短縮しています")
     with gr.Row():
         input_mode = gr.Radio(
     ## 設定情報
     - 使用モデル: {gemini_model} (環境変数 GEMINI_MODEL で変更可能)
     - 対応スタイル: standard, cute, resort, cool, dental
+    - WebDriverプール最大数: {driver_pool.max_drivers} (環境変数 MAX_WEBDRIVERS で変更可能)
     """)
 # --- Mount Gradio App onto FastAPI ---
 if __name__ == "__main__":
+    # Direct-execution path: start a Uvicorn server for `app`, bound to
+    # all interfaces (0.0.0.0) on port 7860.
     import uvicorn
     logger.info("Starting Uvicorn server for local development...")
+    uvicorn.run(app, host="0.0.0.0", port=7860)
+# Clean up the WebDriver pool when the application exits.
+# NOTE(review): this registration sits after the __main__ guard, so when the
+# file is run as a script it executes only after uvicorn.run() has returned -
+# confirm that this ordering is intended.
+import atexit
+atexit.register(driver_pool.close_all)