import asyncio import codecs import io import random import re import time from asyncio import Task from pathlib import Path from typing import Any, AsyncGenerator, Optional import orjson as json from curl_cffi.requests import AsyncSession, Cookies, Response from curl_cffi.requests.exceptions import ReadTimeout from .components import GemMixin from .constants import ( Endpoint, ErrorCode, GRPC, Model, TEMPORARY_CHAT_FLAG_INDEX, STREAMING_FLAG_INDEX, GEM_FLAG_INDEX, ) from .exceptions import ( APIError, AuthError, GeminiError, ModelInvalid, TemporarilyBlocked, TimeoutError, UsageLimitExceeded, ) from .types import ( Candidate, Gem, GeneratedImage, ModelOutput, RPCData, WebImage, AvailableModel, ChatInfo, ChatTurn, ChatHistory, GeneratedVideo, ) from .utils import ( extract_json_from_response, get_access_token, get_delta_by_fp_len, get_nested_value, logger, parse_file_name, parse_response_by_frame, rotate_1psidts, running, upload_file, ) _CARD_CONTENT_RE = re.compile(r"^http://googleusercontent\.com/card_content/\d+") _ARTIFACTS_RE = re.compile(r"http://googleusercontent\.com/\w+/\d+\n*") _DEFAULT_METADATA: list[Any] = ["", "", "", None, None, None, None, None, None, ""] class GeminiClient(GemMixin): """ Async requests client interface for gemini.google.com. `secure_1psid` must be provided unless the optional dependency `browser-cookie3` is installed, and you have logged in to google.com in your local browser. Parameters ---------- secure_1psid: `str`, optional __Secure-1PSID cookie value. secure_1psidts: `str`, optional __Secure-1PSIDTS cookie value, some Google accounts don't require this value, provide only if it's in the cookie list. proxy: `str`, optional Proxy URL. kwargs: `dict`, optional Additional arguments which will be passed to the http client. Refer to `curl_cffi.requests.AsyncSession` for more information. Raises ------ `ValueError` If `browser-cookie3` is installed but cookies for google.com are not found in your local browser storage. """ __slots__ = [ "_cookies", "proxy", "_running", "client", "access_token", "build_label", "session_id", "timeout", "auto_close", "close_delay", "close_task", "auto_refresh", "refresh_interval", "refresh_task", "verbose", "watchdog_timeout", "_lock", "_reqid", "_gems", # From GemMixin "_available_models", "_recent_chats", "kwargs", ] def __init__( self, secure_1psid: str | None = None, secure_1psidts: str | None = None, proxy: str | None = None, **kwargs, ): super().__init__() self._cookies = Cookies() self.proxy = proxy self._running: bool = False self.client: AsyncSession | None = None self.access_token: str | None = None self.build_label: str | None = None self.session_id: str | None = None self.timeout: float = 600 self.auto_close: bool = False self.close_delay: float = 600 self.close_task: Task | None = None self.auto_refresh: bool = True self.refresh_interval: float = 600 self.refresh_task: Task | None = None self.verbose: bool = True self.watchdog_timeout: float = 90 self._lock = asyncio.Lock() self._reqid: int = random.randint(10000, 99999) self._available_models: list[AvailableModel] | None = None self._recent_chats: list[ChatInfo] | None = None self.kwargs = kwargs if secure_1psid: self._cookies.set("__Secure-1PSID", secure_1psid, domain=".google.com") if secure_1psidts: self._cookies.set( "__Secure-1PSIDTS", secure_1psidts, domain=".google.com" ) @property def cookies(self) -> Cookies: """ Returns the cookies used for the current session. 
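
        A minimal sketch of seeding cookies through this property (the values
        below are placeholders, not real credentials)::

            client = GeminiClient()
            client.cookies = {
                "__Secure-1PSID": "<your __Secure-1PSID value>",
                "__Secure-1PSIDTS": "<your __Secure-1PSIDTS value>",
            }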
""" return self.client.cookies if self.client else self._cookies @cookies.setter def cookies(self, value: Cookies | dict): if isinstance(value, Cookies): self._cookies.update(value) elif isinstance(value, dict): for k, v in value.items(): self._cookies.set(k, v, domain=".google.com") if self.client: self.client.cookies.update(self._cookies) async def init( self, timeout: float = 600, auto_close: bool = False, close_delay: float = 600, auto_refresh: bool = True, refresh_interval: float = 600, verbose: bool = True, watchdog_timeout: float = 90, ) -> None: """ Get SNlM0e value as access token. Without this token posting will fail with 400 bad request. Parameters ---------- timeout: `float`, optional Request timeout of the client in seconds. Used to limit the max waiting time when sending a request. auto_close: `bool`, optional If `True`, the client will close connections and clear resource usage after a certain period of inactivity. Useful for always-on services. close_delay: `float`, optional Time to wait before auto-closing the client in seconds. Effective only if `auto_close` is `True`. auto_refresh: `bool`, optional If `True`, will schedule a task to automatically refresh cookies and access token in the background. refresh_interval: `float`, optional Time interval for background cookie and access token refresh in seconds. Effective only if `auto_refresh` is `True`. verbose: `bool`, optional If `True`, will print more infomation in logs. watchdog_timeout: `float`, optional Timeout in seconds for shadow retry watchdog. If no data receives from stream but connection is active, client will retry automatically after this duration. """ async with self._lock: if self._running: return try: self.verbose = verbose self.watchdog_timeout = watchdog_timeout access_token, build_label, session_id, session = await get_access_token( base_cookies=self.cookies, proxy=self.proxy, verbose=self.verbose, verify=self.kwargs.get("verify", True), ) session.timeout = timeout self.client = session self._cookies.update(self.client.cookies) self.access_token = access_token self.build_label = build_label self.session_id = session_id self._running = True self._reqid = random.randint(10000, 99999) self.timeout = timeout self.auto_close = auto_close self.close_delay = close_delay if self.auto_close: await self.reset_close_task() self.auto_refresh = auto_refresh self.refresh_interval = refresh_interval if self.refresh_task: self.refresh_task.cancel() self.refresh_task = None if self.auto_refresh: self.refresh_task = asyncio.create_task(self.start_auto_refresh()) await self._init_rpc() if self.verbose: logger.success("Gemini client initialized successfully.") except Exception: await self.close() raise async def close(self, delay: float = 0) -> None: """ Close the client after a certain period of inactivity, or call manually to close immediately. Parameters ---------- delay: `float`, optional Time to wait before closing the client in seconds. """ if delay: await asyncio.sleep(delay) self._running = False if self.close_task: self.close_task.cancel() self.close_task = None if self.refresh_task: self.refresh_task.cancel() self.refresh_task = None if self.client: self._cookies.update(self.client.cookies) await self.client.close() self.client = None async def reset_close_task(self) -> None: """ Reset the timer for closing the client when a new request is made. 
""" if self.close_task: self.close_task.cancel() self.close_task = None self.close_task = asyncio.create_task(self.close(self.close_delay)) async def start_auto_refresh(self) -> None: """ Start the background task to automatically refresh cookies. """ if self.refresh_interval < 60: self.refresh_interval = 60 while self._running: await asyncio.sleep(self.refresh_interval) if not self._running: break try: async with self._lock: # Refresh all cookies in the background to keep the session alive. new_1psidts = await rotate_1psidts(self.client, self.verbose) if new_1psidts: logger.debug("Cookies refreshed (network update).") else: logger.warning( "Rotation response did not contain a new __Secure-1PSIDTS. " "Session might expire soon if this persists." ) except asyncio.CancelledError: raise except AuthError: logger.warning( "AuthError: Failed to refresh cookies. Retrying in next interval." ) except Exception: logger.warning( "Unexpected error while refreshing cookies. Retrying in next interval." ) async def _init_rpc(self) -> None: """ Send initial RPC calls to set up the session. """ await self._fetch_models() await self._send_bard_settings() await self._send_bard_activity() await self._fetch_recent_chats() async def _fetch_models(self) -> None: """ Fetch and parse available models. """ response = await self._batch_execute( [ RPCData( rpcid=GRPC.LIST_MODELS, payload="[]", ) ] ) response_json = extract_json_from_response(response.text) available_models = [] for part in response_json: part_body_str = get_nested_value(part, [2]) if not part_body_str: continue part_body = json.loads(part_body_str) models_list = get_nested_value(part_body, [15]) if isinstance(models_list, list): for model_data in models_list: if isinstance(model_data, list) and len(model_data) > 2: model_id = get_nested_value(model_data, [0], "") name = get_nested_value(model_data, [10]) or get_nested_value( model_data, [1], "" ) description = get_nested_value( model_data, [12] ) or get_nested_value(model_data, [2], "") core_model = Model.UNSPECIFIED code_name = "unspecified" for enum_model in Model: val = enum_model.model_header.get( "x-goog-ext-525001261-jspb", "" ) if val and (model_id in val): core_model = enum_model code_name = enum_model.model_name break if model_id and name: available_models.append( AvailableModel( id=code_name, name=name, model=core_model, description=description, ) ) break self._available_models = available_models async def _fetch_recent_chats(self, recent: int = 13) -> None: """ Fetch and parse recent chats. 
""" response_chats1 = await self._batch_execute( [ RPCData( rpcid=GRPC.LIST_CHATS, payload=json.dumps([recent, None, [1, None, 1]]).decode("utf-8"), ), ] ) response_chats2 = await self._batch_execute( [ RPCData( rpcid=GRPC.LIST_CHATS, payload=json.dumps([recent, None, [0, None, 1]]).decode("utf-8"), ), ] ) recent_chats: list[ChatInfo] = [] for response_chats in (response_chats1, response_chats2): chats_json = extract_json_from_response(response_chats.text) for part in chats_json: part_body_str = get_nested_value(part, [2]) if not part_body_str: continue try: part_body = json.loads(part_body_str) except json.JSONDecodeError: continue chat_list = get_nested_value(part_body, [2]) if isinstance(chat_list, list): for chat_data in chat_list: if isinstance(chat_data, list) and len(chat_data) > 1: cid = get_nested_value(chat_data, [0], "") title = get_nested_value(chat_data, [1], "") is_pinned = bool(get_nested_value(chat_data, [2])) if cid and title: if not any(c.cid == cid for c in recent_chats): recent_chats.append( ChatInfo( cid=cid, title=title, is_pinned=is_pinned ) ) break self._recent_chats = recent_chats async def _send_bard_settings(self) -> None: """ Send required setup activity to Gemini. """ await self._batch_execute( [ RPCData( rpcid=GRPC.BARD_SETTINGS, payload='[[["adaptive_device_responses_enabled","advanced_mode_theme_override_triggered","advanced_zs_upsell_dismissal_count","advanced_zs_upsell_last_dismissed","ai_transparency_notice_dismissed","audio_overview_discovery_dismissal_count","audio_overview_discovery_last_dismissed","bard_in_chrome_link_sharing_enabled","bard_sticky_mode_disabled_count","canvas_create_discovery_tooltip_seen_count","combined_files_button_tag_seen_count","indigo_banner_explicit_dismissal_count","indigo_banner_impression_count","indigo_banner_last_seen_sec","current_popup_id","deep_research_has_seen_file_upload_tooltip","deep_research_model_update_disclaimer_display_count","default_bot_id","disabled_discovery_card_feature_ids","disabled_model_discovery_tooltip_feature_ids","disabled_mode_disclaimers","disabled_new_model_badge_mode_ids","disabled_settings_discovery_tooltip_feature_ids","disablement_disclaimer_last_dismissed_sec","disable_advanced_beta_dialog","disable_advanced_beta_non_en_banner","disable_advanced_resubscribe_ui","disable_at_mentions_discovery_tooltip","disable_autorun_fact_check_u18","disable_bot_create_tips_card","disable_bot_docs_in_gems_disclaimer","disable_bot_onboarding_dialog","disable_bot_save_reminder_tips_card","disable_bot_send_prompt_tips_card","disable_bot_shared_in_drive_disclaimer","disable_bot_try_create_tips_card","disable_colab_tooltip","disable_collapsed_tool_menu_tooltip","disable_continue_discovery_tooltip","disable_debug_info_moved_tooltip_v2","disable_enterprise_mode_dialog","disable_export_python_tooltip","disable_extensions_discovery_dialog","disable_extension_one_time_badge","disable_fact_check_tooltip_v2","disable_free_file_upload_tips_card","disable_generated_image_download_dialog","disable_get_app_banner","disable_get_app_desktop_dialog","disable_googler_in_enterprise_mode","disable_human_review_disclosure","disable_ice_open_vega_editor_tooltip","disable_image_upload_tooltip","disable_legal_concern_tooltip","disable_llm_history_import_disclaimer","disable_location_popup","disable_memory_discovery","disable_memory_extraction_discovery","disable_new_conversation_dialog","disable_onboarding_experience","disable_personal_context_tooltip","disable_photos_upload_disclaimer","disable_power_up_intro_tooltip","disable_sch
eduled_actions_mobile_notification_snackbar","disable_storybook_listen_button_tooltip","disable_streaming_settings_tooltip","disable_take_control_disclaimer","disable_teens_only_english_language_dialog","disable_tier1_rebranding_tooltip","disable_try_advanced_mode_dialog","enable_advanced_beta_mode","enable_advanced_mode","enable_googler_in_enterprise_mode","enable_memory","enable_memory_extraction","enable_personal_context","enable_personal_context_gemini","enable_personal_context_gemini_using_photos","enable_personal_context_gemini_using_workspace","enable_personal_context_search","enable_personal_context_youtube","enable_token_streaming","enforce_default_to_fast_version","mayo_discovery_banner_dismissal_count","mayo_discovery_banner_last_dismissed_sec","gempix_discovery_banner_dismissal_count","gempix_discovery_banner_last_dismissed","get_app_banner_ack_count","get_app_banner_seen_count","get_app_mobile_dialog_ack_count","guided_learning_banner_dismissal_count","guided_learning_banner_last_dismissed","has_accepted_agent_mode_fre_disclaimer","has_received_streaming_response","has_seen_agent_mode_tooltip","has_seen_bespoke_tooltip","has_seen_deepthink_mustard_tooltip","has_seen_deepthink_v2_tooltip","has_seen_deep_think_tooltip","has_seen_first_youtube_video_disclaimer","has_seen_ggo_tooltip","has_seen_image_grams_discovery_banner","has_seen_image_preview_in_input_area_tooltip","has_seen_kallo_discovery_banner","has_seen_kallo_tooltip","has_seen_model_picker_in_input_area_tooltip","has_seen_model_tooltip_in_input_area_for_gempix","has_seen_redo_with_gempix2_tooltip","has_seen_veograms_discovery_banner","has_seen_video_generation_discovery_banner","is_imported_chats_panel_open_by_default","jumpstart_onboarding_dismissal_count","last_dismissed_deep_research_implicit_invite","last_dismissed_discovery_feature_implicit_invites","last_dismissed_immersives_canvas_implicit_invite","last_dismissed_immersive_share_disclaimer_sec","last_dismissed_strike_timestamp_sec","last_dismissed_zs_student_aip_banner_sec","last_get_app_banner_ack_timestamp_sec","last_get_app_mobile_dialog_ack_timestamp_sec","last_human_review_disclosure_ack","last_selected_mode_id_in_embedded","last_selected_mode_id_on_web","last_two_up_activation_timestamp_sec","last_winter_olympics_interaction_timestamp_sec","memory_extracted_greeting_name","mini_gemini_tos_closed","mode_switcher_soft_badge_disabled_ids","mode_switcher_soft_badge_seen_count","personalization_first_party_onboarding_cross_surface_clicked","personalization_first_party_onboarding_cross_surface_seen_count","personalization_one_p_discovery_card_seen_count","personalization_one_p_discovery_last_consented","personalization_zero_state_card_last_interacted","personalization_zero_state_card_seen_count","popup_zs_visits_cooldown","require_reconsent_setting_for_personalization_banner_seen_count","show_debug_info","side_nav_open_by_default","student_verification_dismissal_count","student_verification_last_dismissed","task_viewer_cc_banner_dismissed_count","task_viewer_cc_banner_dismissed_time_sec","tool_menu_new_badge_disabled_ids","tool_menu_new_badge_impression_counts","tool_menu_soft_badge_disabled_ids","tool_menu_soft_badge_impression_counts","upload_disclaimer_last_consent_time_sec","viewed_student_aip_upsell_campaign_ids","voice_language","voice_name","web_and_app_activity_enabled","wellbeing_nudge_notice_last_dismissed_sec","zs_student_aip_banner_dismissal_count"]]]', ) ] ) async def _send_bard_activity(self) -> None: """ Send warmup RPC calls before querying. 
""" await self._batch_execute( [ RPCData( rpcid=GRPC.BARD_SETTINGS, payload='[[["bard_activity_enabled"]]]', ) ] ) def list_models(self) -> list[AvailableModel] | None: """ List all available models for the current account. Returns ------- `list[gemini_webapi.types.AvailableModel]` List of models with their name and description. Returns `None` if the client holds no session cache. """ return self._available_models async def generate_content( self, prompt: str, files: list[str | Path | bytes | io.BytesIO] | None = None, model: Model | str | dict = Model.UNSPECIFIED, gem: Gem | str | None = None, chat: Optional["ChatSession"] = None, temporary: bool = False, **kwargs, ) -> ModelOutput: """ Generates contents with prompt. Parameters ---------- prompt: `str` Text prompt provided by user. files: `list[str | Path | bytes | io.BytesIO]`, optional List of file paths or byte streams to be attached. model: `Model | str | dict`, optional Specify the model to use for generation. Pass either a `gemini_webapi.constants.Model` enum or a model name string to use predefined models. Pass a dictionary to use custom model header strings ("model_name" and "model_header" keys must be provided). gem: `Gem | str`, optional Specify a gem to use as system prompt for the chat session. Pass either a `gemini_webapi.types.Gem` object or a gem id string. chat: `ChatSession`, optional Chat data to retrieve conversation history. If None, will automatically generate a new chat id when sending post request. temporary: `bool`, optional If set to `True`, the ongoing conversation will not show up in Gemini history. kwargs: `dict`, optional Additional arguments which will be passed to the post request. Refer to `curl_cffi.requests.AsyncSession.request` for more information. Returns ------- :class:`ModelOutput` Output data from gemini.google.com. Raises ------ `AssertionError` If prompt is empty. `gemini_webapi.TimeoutError` If request timed out. `gemini_webapi.GeminiError` If no reply candidate found in response. `gemini_webapi.APIError` - If request failed with status code other than 200. - If response structure is invalid and failed to parse. """ if self.auto_close: await self.reset_close_task() file_data = None if files: await self._send_bard_activity() uploaded_urls = await asyncio.gather( *( upload_file(file, client=self.client, verbose=self.verbose) for file in files ) ) file_data = [ [[url], parse_file_name(file)] for url, file in zip(uploaded_urls, files) ] try: await self._send_bard_activity() session_state = { "last_texts": {}, "last_thoughts": {}, "last_progress_time": time.time(), "is_thinking": False, "is_queueing": False, "title": None, } output = None async for output in self._generate( prompt=prompt, req_file_data=file_data, model=model, gem=gem, chat=chat, temporary=temporary, session_state=session_state, **kwargs, ): pass if output is None: raise GeminiError( "Failed to generate contents. No output data found in response." ) if isinstance(chat, ChatSession): output.metadata = chat.metadata chat.last_output = output return output finally: if files: for file in files: if isinstance(file, io.BytesIO): file.close() async def generate_content_stream( self, prompt: str, files: list[str | Path | bytes | io.BytesIO] | None = None, model: Model | str | dict = Model.UNSPECIFIED, gem: Gem | str | None = None, chat: Optional["ChatSession"] = None, temporary: bool = False, **kwargs, ) -> AsyncGenerator[ModelOutput, None]: """ Generates contents with prompt in streaming mode. 
This method sends a request to Gemini and yields partial responses as they arrive. It automatically calculates the text delta (new characters) to provide a smooth streaming experience. It also continuously updates chat metadata and candidate IDs. Parameters ---------- prompt: `str` Text prompt provided by user. files: `list[str | Path | bytes | io.BytesIO]`, optional List of file paths or byte streams to be attached. model: `Model | str | dict`, optional Specify the model to use for generation. gem: `Gem | str`, optional Specify a gem to use as system prompt for the chat session. chat: `ChatSession`, optional Chat data to retrieve conversation history. temporary: `bool`, optional If set to `True`, the ongoing conversation will not show up in Gemini history. kwargs: `dict`, optional Additional arguments passed to `curl_cffi.requests.AsyncSession.stream`. Yields ------ :class:`ModelOutput` Partial output data. The `text_delta` attribute contains only the NEW characters received since the last yield. Raises ------ `gemini_webapi.APIError` If the request fails or response structure is invalid. `gemini_webapi.TimeoutError` If the stream request times out. """ if self.auto_close: await self.reset_close_task() file_data = None if files: await self._send_bard_activity() uploaded_urls = await asyncio.gather( *( upload_file(file, client=self.client, verbose=self.verbose) for file in files ) ) file_data = [ [[url], parse_file_name(file)] for url, file in zip(uploaded_urls, files) ] try: await self._send_bard_activity() session_state = { "last_texts": {}, "last_thoughts": {}, "last_progress_time": time.time(), "is_thinking": False, "is_queueing": False, "title": None, } output = None async for output in self._generate( prompt=prompt, req_file_data=file_data, model=model, gem=gem, chat=chat, temporary=temporary, session_state=session_state, **kwargs, ): yield output if output and isinstance(chat, ChatSession): output.metadata = chat.metadata chat.last_output = output finally: if files: for file in files: if isinstance(file, io.BytesIO): file.close() @running(retry=5) async def _generate( self, prompt: str, req_file_data: list[Any] | None = None, model: Model | str | dict = Model.UNSPECIFIED, gem: Gem | str | None = None, chat: Optional["ChatSession"] = None, temporary: bool = False, session_state: dict[str, Any] | None = None, **kwargs, ) -> AsyncGenerator[ModelOutput, None]: """ Internal method which actually sends content generation requests. """ assert prompt, "Prompt cannot be empty." 
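        # `model` may be passed as a Model enum member, a model name string, or a
        # dict with "model_name"/"model_header" keys; all three forms are
        # normalized to a `Model` instance below. Illustrative call sites (the
        # name string is a placeholder, not a guaranteed model id):
        #   await client.generate_content("Hi", model=Model.UNSPECIFIED)
        #   await client.generate_content("Hi", model="<model-name>")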
if isinstance(model, str): model = Model.from_name(model) elif isinstance(model, dict): model = Model.from_dict(model) elif not isinstance(model, Model): raise TypeError( f"'model' must be a `gemini_webapi.constants.Model` instance, " f"string, or dictionary; got `{type(model).__name__}`" ) _reqid = self._reqid self._reqid += 100000 gem_id = gem.id if isinstance(gem, Gem) else gem chat_backup: dict[str, Any] | None = None if chat: chat_backup = { "metadata": ( list(chat.metadata) if getattr(chat, "metadata", None) else list(_DEFAULT_METADATA) ), "cid": getattr(chat, "cid", ""), "rid": getattr(chat, "rid", ""), "rcid": getattr(chat, "rcid", ""), } if session_state is None: session_state = { "last_texts": {}, "last_thoughts": {}, "last_progress_time": time.time(), "is_thinking": False, "is_queueing": False, "title": None, } else: # Reset connection-specific states during a retry attempt session_state["last_progress_time"] = time.time() session_state["is_thinking"] = False session_state["is_queueing"] = False has_generated_text = False sleep_time = 10 message_content = [ prompt, 0, None, req_file_data, None, None, 0, ] params: dict[str, Any] = {"_reqid": _reqid, "rt": "c"} if self.build_label: params["bl"] = self.build_label if self.session_id: params["f.sid"] = self.session_id while True: try: inner_req_list: list[Any] = [None] * 69 inner_req_list[0] = message_content inner_req_list[2] = chat.metadata if chat else list(_DEFAULT_METADATA) inner_req_list[STREAMING_FLAG_INDEX] = 1 if gem_id: inner_req_list[GEM_FLAG_INDEX] = gem_id if temporary: inner_req_list[TEMPORARY_CHAT_FLAG_INDEX] = 1 request_data = { "at": self.access_token, "f.req": json.dumps( [ None, json.dumps(inner_req_list).decode("utf-8"), ] ).decode("utf-8"), } async with self.client.stream( "POST", Endpoint.GENERATE, params=params, headers=model.model_header, data=request_data, **kwargs, ) as response: if self.verbose: logger.debug( f"HTTP Request: POST {Endpoint.GENERATE} [{response.status_code}]" ) if response.status_code != 200: await self.close() raise APIError( f"Failed to generate contents. Status: {response.status_code}" ) buffer = "" decoder = codecs.getincrementaldecoder("utf-8")(errors="replace") last_texts: dict[str, str] = session_state["last_texts"] last_thoughts: dict[str, str] = session_state["last_thoughts"] last_progress_time = session_state["last_progress_time"] is_thinking = session_state["is_thinking"] is_queueing = session_state["is_queueing"] has_candidates = False is_completed = False # Check if this conversation turn has been fully answered. is_final_chunk = False # Check if this turn is saved to history and marked complete or still pending (e.g., video generation). cid = chat.cid if chat else "" rid = chat.rid if chat else "" async def _process_parts( parts: list[Any], ) -> AsyncGenerator[ModelOutput, None]: nonlocal is_thinking, is_queueing, has_candidates, is_completed, is_final_chunk, cid, rid for part in parts: # Check for fatal error codes error_code = get_nested_value(part, [5, 2, 0, 1, 0]) if error_code: await self.close() match error_code: case ErrorCode.USAGE_LIMIT_EXCEEDED: raise UsageLimitExceeded( f"Usage limit exceeded for model '{model.model_name}'. Please wait a few minutes, " "switch to a different model (e.g., Gemini Flash), or check your account limits on gemini.google.com." ) case ErrorCode.MODEL_INCONSISTENT: raise ModelInvalid( "The specified model is inconsistent with the conversation history. 
" "Please ensure you are using the same 'model' parameter throughout the entire ChatSession." ) case ErrorCode.MODEL_HEADER_INVALID: raise ModelInvalid( f"The model '{model.model_name}' is currently unavailable or the request structure is outdated. " "Please update 'gemini_webapi' to the latest version or report this on GitHub if the problem persists." ) case ErrorCode.IP_TEMPORARILY_BLOCKED: raise TemporarilyBlocked( "Your IP address has been temporarily flagged or blocked by Google. " "Please try using a proxy, a different network, or wait for a while before retrying." ) case ErrorCode.TEMPORARY_ERROR_1013: raise APIError( "Gemini encountered a temporary error (1013). Retrying..." ) case _: raise APIError( f"Failed to generate contents (stream). Unknown API error code: {error_code}. " "This might be a temporary Google service issue." ) # Check for queueing status status = get_nested_value(part, [5]) if isinstance(status, list) and status: if not is_thinking: is_queueing = True session_state["is_queueing"] = True if not has_candidates: logger.debug( "Model is in a waiting state (queueing)..." ) inner_json_str = get_nested_value(part, [2]) if inner_json_str: try: part_json = json.loads(inner_json_str) m_data = get_nested_value(part_json, [1]) cid = get_nested_value(m_data, [0], "") rid = get_nested_value(m_data, [1], "") if m_data and isinstance(chat, ChatSession): chat.metadata = m_data # Check for busy analyzing data tool_name = get_nested_value(part_json, [6, 1, 0]) if tool_name == "data_analysis_tool": is_thinking = True session_state["is_thinking"] = True is_queueing = False session_state["is_queueing"] = False if not has_candidates: logger.debug( f"Model is active (thinking/analyzing)... Raw: {str(part_json)[:500]}" ) context_str = get_nested_value(part_json, [25]) if isinstance(context_str, str): is_final_chunk = True is_thinking = False session_state["is_thinking"] = False is_queueing = False session_state["is_queueing"] = False if isinstance(chat, ChatSession): chat.metadata = [None] * 9 + [context_str] title = get_nested_value(part_json, [10, 0]) if title: session_state["title"] = title candidates_list = get_nested_value( part_json, [4], [] ) if candidates_list: output_candidates = [] for i, candidate_data in enumerate( candidates_list ): rcid = get_nested_value(candidate_data, [0]) if not rcid: continue if isinstance(chat, ChatSession): chat.rcid = rcid ( text, thoughts, web_images, generated_images, generated_videos, ) = self._parse_candidate( candidate_data, cid, rid, rcid ) # Check if this frame represents the complete state of the message is_completed = ( get_nested_value( candidate_data, [8, 0], 1 ) == 2 ) # Save this conversation turn to list_chats whenever it is stored in history. 
if is_final_chunk: cid = get_nested_value( part_json, [1, 0] ) if cid and isinstance( self._recent_chats, list ): chat_title = session_state.get( "title" ) if not chat_title: for c in self._recent_chats: if c.cid == cid: chat_title = c.title break if chat_title: is_pinned = False for c in self._recent_chats: if c.cid == cid: is_pinned = c.is_pinned break expected_idx = ( 0 if is_pinned else sum( 1 for c in self._recent_chats if c.cid != cid and c.is_pinned ) ) if not ( len(self._recent_chats) > expected_idx and self._recent_chats[ expected_idx ].cid == cid and self._recent_chats[ expected_idx ].title == chat_title ): self._recent_chats = [ c for c in self._recent_chats if c.cid != cid ] self._recent_chats.insert( expected_idx, ChatInfo( cid=cid, title=chat_title, is_pinned=is_pinned, ), ) last_sent_text = last_texts.get( rcid ) or last_texts.get(f"idx_{i}", "") text_delta, new_full_text = ( get_delta_by_fp_len( text, last_sent_text, is_final=is_completed, ) ) last_sent_thought = last_thoughts.get( rcid ) or last_thoughts.get(f"idx_{i}", "") if thoughts: thoughts_delta, new_full_thought = ( get_delta_by_fp_len( thoughts, last_sent_thought, is_final=is_completed, ) ) else: thoughts_delta = "" new_full_thought = "" if ( text_delta or thoughts_delta or web_images or generated_images ): has_candidates = True if thoughts_delta: logger.debug(f"[Thinking]: {thoughts_delta.strip()}") if text_delta: logger.debug(f"[Generating]: {text_delta.strip()}") # Update state with the provider's cleaned state to handle drift last_texts[rcid] = last_texts[ f"idx_{i}" ] = new_full_text last_thoughts[rcid] = last_thoughts[ f"idx_{i}" ] = new_full_thought output_candidates.append( Candidate( rcid=rcid, text=text, text_delta=text_delta, thoughts=thoughts or None, thoughts_delta=thoughts_delta, web_images=web_images, generated_images=generated_images, generated_videos=generated_videos, ) ) if output_candidates: is_thinking = False session_state["is_thinking"] = False is_queueing = False session_state["is_queueing"] = False yield ModelOutput( metadata=get_nested_value( part_json, [1], [] ), candidates=output_candidates, ) except json.JSONDecodeError: continue chunk_iterator = response.aiter_content().__aiter__() while True: try: stall_threshold = ( self.timeout if (is_thinking or is_queueing) else min(self.timeout, self.watchdog_timeout) ) chunk = await asyncio.wait_for( chunk_iterator.__anext__(), timeout=stall_threshold + 5 ) except StopAsyncIteration: break except asyncio.TimeoutError: logger.debug( f"[Watchdog] Socket idle for {stall_threshold + 5}s. Refreshing connection..." ) break buffer += decoder.decode(chunk, final=False) if buffer.startswith(")]}'"): buffer = buffer[4:].lstrip() parsed_parts, buffer = parse_response_by_frame(buffer) got_update = False async for out in _process_parts(parsed_parts): has_generated_text = True yield out got_update = True if got_update: last_progress_time = time.time() session_state["last_progress_time"] = last_progress_time else: stall_threshold = ( self.timeout if (is_thinking or is_queueing) else min(self.timeout, self.watchdog_timeout) ) if (time.time() - last_progress_time) > stall_threshold: if is_thinking: logger.debug( f"[Watchdog] Model is taking its time thinking ({int(time.time() - last_progress_time)}s). Reconnecting to poll..." ) break else: logger.debug( f"[Watchdog] Connection idle for {stall_threshold}s (queueing={is_queueing}). " "Attempting recovery..." 
) await self.close() break # Final flush buffer += decoder.decode(b"", final=True) if buffer: parsed_parts, _ = parse_response_by_frame(buffer) async for out in _process_parts(parsed_parts): has_generated_text = True yield out if not is_completed or is_thinking or is_queueing: stall_threshold = ( self.timeout if (is_thinking or is_queueing) else min(self.timeout, self.watchdog_timeout) ) if (time.time() - last_progress_time) > stall_threshold: if not is_thinking: logger.debug( f"[Watchdog] Stream ended after {stall_threshold}s without completing. Triggering recovery..." ) else: logger.debug( "[Watchdog] Stream finished but model is still thinking. Polling again..." ) if cid: logger.debug( f"Stream incomplete. Checking conversation history for {cid}..." ) poll_start_time = time.time() while True: if (time.time() - poll_start_time) > self.timeout: logger.warning( f"[Recovery] Polling for {cid} timed out after {self.timeout}s." ) if has_generated_text: raise GeminiError( "The connection to Gemini was lost while generating the response, and recovery timed out. " "Please try sending your prompt again." ) else: raise APIError( "read_chat polling timed out waiting for the model to finish. " "The original request may have been silently aborted by Google." ) await self._send_bard_activity() recovered_history = await self.read_chat(cid) if ( recovered_history and recovered_history.turns and recovered_history.turns[-1].role == "model" ): recovered = recovered_history.turns[-1].info if ( recovered and recovered.candidates and ( recovered.candidates[0].text.strip() or recovered.candidates[0].generated_images or recovered.candidates[0].web_images ) ): rec_rcid = recovered.candidates[0].rcid prev_rcid = ( chat_backup["rcid"] if chat_backup else "" ) current_expected_rcid = ( getattr(chat, "rcid", "") if chat else "" ) is_new_turn = ( rec_rcid == current_expected_rcid if current_expected_rcid else rec_rcid != prev_rcid ) if is_new_turn: logger.debug( f"[Recovery] Successfully recovered response for CID: {cid} (RCID: {rec_rcid})" ) if chat: recovered.metadata = chat.metadata chat.rcid = rec_rcid yield recovered break else: logger.debug( f"[Recovery] Recovered turn is not the target turn (target: {current_expected_rcid or 'NEW'}, got {rec_rcid}). Waiting..." ) logger.debug( f"[Recovery] Response not ready, waiting {sleep_time}s..." ) await asyncio.sleep(sleep_time) break else: logger.debug( f"Stream suspended (completed={is_completed}, final_chunk={is_final_chunk}, thinking={is_thinking}, queueing={is_queueing}). " f"No CID found to recover. (Request ID: {_reqid})" ) raise APIError( "The original request may have been silently aborted by Google." ) break except ReadTimeout: raise TimeoutError( "The request timed out while waiting for Gemini to respond. This often happens with very long prompts " "or complex file analysis. Try increasing the 'timeout' value when initializing GeminiClient." ) except (GeminiError, APIError): if not has_generated_text and chat and chat_backup: chat.metadata = list(chat_backup["metadata"]) # type: ignore chat.cid = chat_backup["cid"] chat.rid = chat_backup["rid"] chat.rcid = chat_backup["rcid"] raise except Exception: if not has_generated_text and chat and chat_backup: chat.metadata = list(chat_backup["metadata"]) # type: ignore chat.cid = chat_backup["cid"] chat.rid = chat_backup["rid"] chat.rcid = chat_backup["rcid"] logger.debug( "Stream parsing interrupted. Attempting to recover conversation context..." ) raise APIError( "Failed to parse response body from Google. 
This might be a temporary API change or invalid data." ) def start_chat(self, **kwargs) -> "ChatSession": """ Returns a `ChatSession` object attached to this client. Parameters ---------- kwargs: `dict`, optional Additional arguments which will be passed to the chat session. Refer to `gemini_webapi.ChatSession` for more information. Returns ------- :class:`ChatSession` Empty chat session object for retrieving conversation history. """ return ChatSession(geminiclient=self, **kwargs) async def delete_chat(self, cid: str) -> None: """ Delete a specific conversation by chat id. Parameters ---------- cid: `str` The ID of the chat requiring deletion (e.g. "c_..."). """ await self._batch_execute( [ RPCData( rpcid=GRPC.DELETE_CHAT, payload=json.dumps([cid]).decode("utf-8"), ), ] ) await self._batch_execute( [ RPCData( rpcid=GRPC.DELETE_CHAT_SECOND, payload=json.dumps([cid, [1, None, 0, 1]]).decode("utf-8"), ), ] ) def list_chats(self) -> list[ChatInfo] | None: """ List all conversations. Returns ------- `list[gemini_webapi.types.ChatInfo] | None` The list of conversations. Returns `None` if the client holds no session cache. """ return self._recent_chats async def read_chat(self, cid: str, limit: int = 10) -> ChatHistory | None: """ Fetch the full conversation history by chat id. Parameters ---------- cid: `str` The ID of the conversation to read (e.g. "c_..."). limit: `int`, optional The maximum number of turns to fetch, by default 10. Returns ------- :class:`ChatHistory` | None The conversation history, or None if reading failed. """ try: response = await self._batch_execute( [ RPCData( rpcid=GRPC.READ_CHAT, payload=json.dumps( [cid, limit, None, 1, [1], [4], None, 1] ).decode("utf-8"), ), ] ) response_json = extract_json_from_response(response.text) for part in response_json: part_body_str = get_nested_value(part, [2]) if not part_body_str: continue part_body = json.loads(part_body_str) turns_data = get_nested_value(part_body, [0]) if not turns_data: continue chat_turns = [] for conv_turn in turns_data: # User turn user_text = get_nested_value(conv_turn, [2, 0, 0], "") if user_text: chat_turns.append(ChatTurn(role="user", text=user_text)) # Model turn candidates_list = get_nested_value(conv_turn, [3, 0]) if candidates_list: output_candidates = [] rid = get_nested_value(conv_turn, [1], "") for candidate_data in candidates_list: rcid = get_nested_value(candidate_data, [0], "") ( text, thoughts, web_images, generated_images, generated_videos, ) = self._parse_candidate(candidate_data, cid, rid, rcid) output_candidates.append( Candidate( rcid=rcid, text=text, thoughts=thoughts, web_images=web_images, generated_images=generated_images, generated_videos=generated_videos, ) ) if output_candidates: model_output = ModelOutput( metadata=[cid, rid, output_candidates[0].rcid], candidates=output_candidates, ) chat_turns.append( ChatTurn( role="model", text=output_candidates[0].text, info=model_output, ) ) return ChatHistory(cid=cid, metadata=[cid], turns=chat_turns) return None except Exception: logger.debug( f"[read_chat] Response data for {cid!r} is still incomplete (model is still processing)..." ) return None def _parse_candidate( self, candidate_data: list[Any], cid: str, rid: str, rcid: str ) -> tuple[str, str, list[WebImage], list[GeneratedImage], list[GeneratedVideo]]: """ Parses individual candidate data from the Gemini response. Args: candidate_data (list[Any]): The raw candidate list from the API response. cid (str): Conversation ID. rid (str): Response ID. rcid (str): Response Candidate ID. 
Returns: tuple: A tuple containing: - text (str): The main response text. - thoughts (str): The model's reasoning or internal thoughts. - web_images (list[WebImage]): List of images found on the web. - generated_images (list[GeneratedImage]): List of images generated by the model. - generated_videos (list[GeneratedVideo]): List of videos generated by the model. """ text = get_nested_value(candidate_data, [1, 0], "") if _CARD_CONTENT_RE.match(text): text = get_nested_value(candidate_data, [22, 0]) or text # Cleanup googleusercontent artifacts text = _ARTIFACTS_RE.sub("", text) thoughts = get_nested_value(candidate_data, [37, 0, 0]) or "" # Image handling web_images = [] for img_idx, web_img_data in enumerate( get_nested_value(candidate_data, [12, 1], []) ): url = get_nested_value(web_img_data, [0, 0, 0]) if url: web_images.append( WebImage( url=url, title=f"[Image {img_idx + 1}]", alt=get_nested_value(web_img_data, [0, 4], ""), proxy=self.proxy, client=self.client, ) ) generated_images = [] for img_idx, gen_img_data in enumerate( get_nested_value(candidate_data, [12, 7, 0], []) ): url = get_nested_value(gen_img_data, [0, 3, 3]) if url: image_id = get_nested_value(gen_img_data, [1, 0]) if not image_id: image_id = f"http://googleusercontent.com/image_generation_content/{img_idx}" generated_images.append( GeneratedImage( url=url, title=f"[Generated Image {img_idx}]", alt=get_nested_value(gen_img_data, [0, 3, 2], ""), proxy=self.proxy, client=self.client, client_ref=self, cid=cid, rid=rid, rcid=rcid, image_id=image_id, ) ) # Video handling generated_videos = [] for video_root in get_nested_value(candidate_data, [12, 59, 0], []): video_info = get_nested_value(video_root, [0]) if video_info: urls = get_nested_value(video_info, [0, 7], []) if len(urls) >= 2: generated_videos.append( GeneratedVideo( url=urls[1], thumbnail=urls[0], cid=cid, rid=rid, rcid=rcid, client_ref=self, proxy=self.proxy, ) ) return text, thoughts, web_images, generated_images, generated_videos async def _get_image_full_size( self, cid: str, rid: str, rcid: str, image_id: str ) -> str | None: """ Get the full size URL of an image. """ try: payload = [ [ [None, None, None, [None, None, None, None, None, ""]], [image_id, 0], None, [19, ""], None, None, None, None, None, "", ], [rid, rcid, cid, None, ""], 1, 0, 1, ] response = await self._batch_execute( [ RPCData( rpcid=GRPC.IMAGE_FULL_SIZE, payload=json.dumps(payload).decode("utf-8"), ), ] ) response_data = extract_json_from_response(response.text) return get_nested_value( json.loads(get_nested_value(response_data, [0, 2], "[]")), [0] ) except Exception: logger.debug( "[_get_image_full_size] Could not retrieve full size URL via RPC." ) return None @running(retry=2) async def _batch_execute(self, payloads: list[RPCData], **kwargs) -> Response: """ Execute a batch of requests to Gemini API. Parameters ---------- payloads: `list[RPCData]` List of `gemini_webapi.types.RPCData` objects to be executed. kwargs: `dict`, optional Additional arguments which will be passed to the post request. Refer to `curl_cffi.requests.AsyncSession.request` for more information. Returns ------- :class:`curl_cffi.requests.Response` Response object containing the result of the batch execution. 
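
        A hedged sketch of internal usage (the payload shape mirrors
        ``_fetch_models`` above)::

            response = await self._batch_execute(
                [RPCData(rpcid=GRPC.LIST_MODELS, payload="[]")]
            )
            parts = extract_json_from_response(response.text)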
""" _reqid = self._reqid self._reqid += 100000 try: params: dict[str, Any] = { "rpcids": ",".join([p.rpcid for p in payloads]), "_reqid": _reqid, "rt": "c", "source-path": "/app", } if self.build_label: params["bl"] = self.build_label if self.session_id: params["f.sid"] = self.session_id response = await self.client.post( Endpoint.BATCH_EXEC, params=params, data={ "at": self.access_token, "f.req": json.dumps( [[payload.serialize() for payload in payloads]] ).decode("utf-8"), }, **kwargs, ) if self.verbose: logger.debug( f"HTTP Request: POST {Endpoint.BATCH_EXEC} [{response.status_code}]" ) except ReadTimeout: raise TimeoutError( "The request timed out while waiting for Gemini to respond. This often happens with very long prompts " "or complex file analysis. Try increasing the 'timeout' value when initializing GeminiClient." ) if response.status_code != 200: await self.close() raise APIError( f"Batch execution failed with status code {response.status_code}" ) return response class ChatSession: """ Chat data to retrieve conversation history. Only if all 3 ids are provided will the conversation history be retrieved. Parameters ---------- geminiclient: `GeminiClient` Async requests client interface for gemini.google.com. metadata: `list[str]`, optional List of chat metadata `[cid, rid, rcid]`, can be shorter than 3 elements, like `[cid, rid]` or `[cid]` only. cid: `str`, optional Chat id, if provided together with metadata, will override the first value in it. rid: `str`, optional Reply id, if provided together with metadata, will override the second value in it. rcid: `str`, optional Reply candidate id, if provided together with metadata, will override the third value in it. model: `Model | str | dict`, optional Specify the model to use for generation. Pass either a `gemini_webapi.constants.Model` enum or a model name string to use predefined models. Pass a dictionary to use custom model header strings ("model_name" and "model_header" keys must be provided). gem: `Gem | str`, optional Specify a gem to use as system prompt for the chat session. Pass either a `gemini_webapi.types.Gem` object or a gem id string. """ __slots__ = [ "__metadata", "geminiclient", "last_output", "model", "gem", ] def __init__( self, geminiclient: GeminiClient, metadata: list[str | None] | None = None, cid: str = "", # chat id rid: str = "", # reply id rcid: str = "", # reply candidate id model: Model | str | dict = Model.UNSPECIFIED, gem: Gem | str | None = None, ): self.__metadata: list[Any] = list(_DEFAULT_METADATA) self.geminiclient: GeminiClient = geminiclient self.last_output: ModelOutput | None = None self.model: Model | str | dict = model self.gem: Gem | str | None = gem if metadata: self.metadata = metadata if cid: self.cid = cid if rid: self.rid = rid if rcid: self.rcid = rcid def __str__(self): return f"ChatSession(cid='{self.cid}', rid='{self.rid}', rcid='{self.rcid}')" __repr__ = __str__ def __setattr__(self, name: str, value: Any) -> None: super().__setattr__(name, value) # update conversation history when last output is updated if name == "last_output" and isinstance(value, ModelOutput): self.metadata = value.metadata self.rcid = value.rcid async def send_message( self, prompt: str, files: list[str | Path | bytes | io.BytesIO] | None = None, temporary: bool = False, **kwargs, ) -> ModelOutput: """ Generates contents with prompt. Use as a shortcut for `GeminiClient.generate_content(prompt, files, self)`. Parameters ---------- prompt: `str` Text prompt provided by user. 
files: `list[str | Path | bytes | io.BytesIO]`, optional List of file paths or byte streams to be attached. temporary: `bool`, optional If set to `True`, the ongoing conversation will not show up in Gemini history. Switching temporary mode within a chat session will clear the previous context and create a new chat session under the hood. kwargs: `dict`, optional Additional arguments which will be passed to the post request. Refer to `curl_cffi.requests.AsyncSession.request` for more information. Returns ------- :class:`ModelOutput` Output data from gemini.google.com. Raises ------ `AssertionError` If prompt is empty. `gemini_webapi.TimeoutError` If request timed out. `gemini_webapi.GeminiError` If no reply candidate found in response. `gemini_webapi.APIError` - If request failed with status code other than 200. - If response structure is invalid and failed to parse. """ return await self.geminiclient.generate_content( prompt=prompt, files=files, model=self.model, gem=self.gem, chat=self, temporary=temporary, **kwargs, ) async def send_message_stream( self, prompt: str, files: list[str | Path | bytes | io.BytesIO] | None = None, temporary: bool = False, **kwargs, ) -> AsyncGenerator[ModelOutput, None]: """ Generates contents with prompt in streaming mode within this chat session. This is a shortcut for `GeminiClient.generate_content_stream(prompt, files, self)`. The session's metadata and conversation history are automatically managed. Parameters ---------- prompt: `str` Text prompt provided by user. files: `list[str | Path | bytes | io.BytesIO]`, optional List of file paths or byte streams to be attached. temporary: `bool`, optional If set to `True`, the ongoing conversation will not show up in Gemini history. Switching temporary mode within a chat session will clear the previous context and create a new chat session under the hood. kwargs: `dict`, optional Additional arguments passed to the streaming request. Yields ------ :class:`ModelOutput` Partial output data containing text deltas. """ async for output in self.geminiclient.generate_content_stream( prompt=prompt, files=files, model=self.model, gem=self.gem, chat=self, temporary=temporary, **kwargs, ): yield output def choose_candidate(self, index: int) -> ModelOutput: """ Choose a candidate from the last `ModelOutput` to control the ongoing conversation flow. Parameters ---------- index: `int` Index of the candidate to choose, starting from 0. Returns ------- :class:`ModelOutput` Output data of the chosen candidate. Raises ------ `ValueError` If no previous output data found in this chat session, or if index exceeds the number of candidates in last model output. """ if not self.last_output: raise ValueError("No previous output data found in this chat session.") if index >= len(self.last_output.candidates): raise ValueError( f"Index {index} exceeds the number of candidates in last model output." ) self.last_output.chosen = index self.rcid = self.last_output.rcid return self.last_output async def read_history(self, limit: int = 10) -> ChatHistory | None: """ Fetch the conversation history for this session. Parameters ---------- limit: `int`, optional The maximum number of turns to fetch, by default 10. Returns ------- :class:`ChatHistory` | None The conversation history, or None if reading failed or cid is missing. 
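
        Illustrative usage from an existing ``ChatSession`` (here ``chat``) that
        already carries a valid ``cid``::

            history = await chat.read_history(limit=5)
            if history:
                for turn in history.turns:
                    print(turn.role, turn.text)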
""" if not self.cid: return None return await self.geminiclient.read_chat(self.cid, limit=limit) @property def metadata(self): return self.__metadata @metadata.setter def metadata(self, value: list[str]): if not isinstance(value, list): return # Update only non-None elements to preserve existing CID/RID/RCID/Context for i, val in enumerate(value): if i < 10 and val is not None: self.__metadata[i] = val @property def cid(self): return self.__metadata[0] @cid.setter def cid(self, value: str): self.__metadata[0] = value @property def rcid(self): return self.__metadata[2] @rcid.setter def rcid(self, value: str): self.__metadata[2] = value @property def rid(self): return self.__metadata[1] @rid.setter def rid(self, value: str): self.__metadata[1] = value