Spaces:

habulaj
/

subapi

Running

App Files Files Community

subapi / gemini_webapi /client.py

habulaj

Upload 49 files

e816bb2 verified 13 days ago

raw

history blame contribute delete

83.7 kB

	import asyncio
	import codecs
	import io
	import random
	import re
	import time
	from asyncio import Task
	from pathlib import Path
	from typing import Any, AsyncGenerator, Optional

	import orjson as json
	from curl_cffi.requests import AsyncSession, Cookies, Response
	from curl_cffi.requests.exceptions import ReadTimeout

	from .components import GemMixin
	from .constants import (
	Endpoint,
	ErrorCode,
	GRPC,
	Model,
	TEMPORARY_CHAT_FLAG_INDEX,
	STREAMING_FLAG_INDEX,
	GEM_FLAG_INDEX,
	)
	from .exceptions import (
	APIError,
	AuthError,
	GeminiError,
	ModelInvalid,
	TemporarilyBlocked,
	TimeoutError,
	UsageLimitExceeded,
	)
	from .types import (
	Candidate,
	Gem,
	GeneratedImage,
	ModelOutput,
	RPCData,
	WebImage,
	AvailableModel,
	ChatInfo,
	ChatTurn,
	ChatHistory,
	GeneratedVideo,
	)
	from .utils import (
	extract_json_from_response,
	get_access_token,
	get_delta_by_fp_len,
	get_nested_value,
	logger,
	parse_file_name,
	parse_response_by_frame,
	rotate_1psidts,
	running,
	upload_file,
	)

	# Pattern for a googleusercontent "card_content" placeholder URL anchored at the start of a string.
	_CARD_CONTENT_RE = re.compile(
	    r"^http://googleusercontent\.com/card_content/\d+"
	)
	# Pattern for any googleusercontent placeholder URL plus the newlines that directly follow it.
	_ARTIFACTS_RE = re.compile(
	    r"http://googleusercontent\.com/\w+/\d+\n*"
	)
	# Ten-slot fallback used as chat metadata when a chat has none of its own:
	# empty strings at indices 0-2 and 9, `None` in between.
	_DEFAULT_METADATA: list[Any] = ["", "", ""] + [None] * 6 + [""]


	class GeminiClient(GemMixin):
	"""
	Async requests client interface for gemini.google.com.

	`secure_1psid` must be provided unless the optional dependency `browser-cookie3` is installed, and
	you have logged in to google.com in your local browser.

	Parameters
	----------
	secure_1psid: `str`, optional
	__Secure-1PSID cookie value.
	secure_1psidts: `str`, optional
	__Secure-1PSIDTS cookie value, some Google accounts don't require this value, provide only if it's in the cookie list.
	proxy: `str`, optional
	Proxy URL.
	kwargs: `dict`, optional
	Additional arguments which will be passed to the http client.
	Refer to `curl_cffi.requests.AsyncSession` for more information.

	Raises
	------
	`ValueError`
	If `browser-cookie3` is installed but cookies for google.com are not found in your local browser storage.
	"""

	# Instance attribute names declared for the client. Every entry except
	# `_gems` is assigned in `__init__`; `_gems` is expected to come from the
	# GemMixin base class.
	__slots__ = [
	"_cookies",
	"proxy",
	"_running",
	"client",
	"access_token",
	"build_label",
	"session_id",
	"timeout",
	"auto_close",
	"close_delay",
	"close_task",
	"auto_refresh",
	"refresh_interval",
	"refresh_task",
	"verbose",
	"watchdog_timeout",
	"_lock",
	"_reqid",
	"_gems", # From GemMixin
	"_available_models",
	"_recent_chats",
	"kwargs",
	]

	def __init__(
	    self,
	    secure_1psid: str | None = None,
	    secure_1psidts: str | None = None,
	    proxy: str | None = None,
	    **kwargs,
	):
	    """
	    Set up an unconnected client with default settings.

	    No network traffic happens here; `init` must be awaited before requests are sent.
	    The cookie values, when given, are stored on the `.google.com` domain.
	    """
	    super().__init__()

	    # Connection settings and the (not yet created) HTTP session.
	    self.proxy = proxy
	    self.kwargs = kwargs
	    self.client: AsyncSession | None = None
	    self._running: bool = False
	    self._lock = asyncio.Lock()

	    # Session identifiers, filled in by `init`.
	    self.access_token: str | None = None
	    self.build_label: str | None = None
	    self.session_id: str | None = None
	    self._reqid: int = random.randint(10000, 99999)

	    # Tunables; `init` overwrites these with its arguments.
	    self.timeout: float = 600
	    self.watchdog_timeout: float = 90
	    self.verbose: bool = True
	    self.auto_close: bool = False
	    self.close_delay: float = 600
	    self.auto_refresh: bool = True
	    self.refresh_interval: float = 600

	    # Background tasks and cached listings.
	    self.close_task: Task | None = None
	    self.refresh_task: Task | None = None
	    self._available_models: list[AvailableModel] | None = None
	    self._recent_chats: list[ChatInfo] | None = None

	    # Seed the cookie jar; the PSIDTS cookie is only stored alongside a PSID cookie.
	    self._cookies = Cookies()
	    if secure_1psid:
	        seed_cookies = [("__Secure-1PSID", secure_1psid)]
	        if secure_1psidts:
	            seed_cookies.append(("__Secure-1PSIDTS", secure_1psidts))
	        for cookie_name, cookie_value in seed_cookies:
	            self._cookies.set(cookie_name, cookie_value, domain=".google.com")

	@property
	def cookies(self) -> Cookies:
	    """
	    Cookies of the live session when one exists, otherwise the locally stored jar.
	    """
	    if self.client:
	        return self.client.cookies
	    return self._cookies

	@cookies.setter
	def cookies(self, value: Cookies | dict):
	    """
	    Merge `value` into the stored jar and push the result to the live session, if any.

	    A `Cookies` object is merged as-is; a `dict` is stored entry by entry on the
	    `.google.com` domain. Any other type leaves the stored jar untouched.
	    """
	    if isinstance(value, Cookies):
	        self._cookies.update(value)
	    elif isinstance(value, dict):
	        for cookie_name, cookie_value in value.items():
	            self._cookies.set(cookie_name, cookie_value, domain=".google.com")

	    session = self.client
	    if session:
	        session.cookies.update(self._cookies)

	async def init(
	self,
	timeout: float = 600,
	auto_close: bool = False,
	close_delay: float = 600,
	auto_refresh: bool = True,
	refresh_interval: float = 600,
	verbose: bool = True,
	watchdog_timeout: float = 90,
	) -> None:
	"""
	Get SNlM0e value as access token. Without this token posting will fail with 400 bad request.

	The access token, build label, session id and HTTP session are obtained from
	`get_access_token`, stored on the client, and the initial RPC calls are sent.
	Does nothing if the client is already running.

	Parameters
	----------
	timeout: `float`, optional
	Request timeout of the client in seconds. Used to limit the max waiting time when sending a request.
	auto_close: `bool`, optional
	If `True`, the client will close connections and clear resource usage after a certain period
	of inactivity. Useful for always-on services.
	close_delay: `float`, optional
	Time to wait before auto-closing the client in seconds. Effective only if `auto_close` is `True`.
	auto_refresh: `bool`, optional
	If `True`, will schedule a task to automatically refresh cookies and access token in the background.
	refresh_interval: `float`, optional
	Time interval for background cookie and access token refresh in seconds.
	Effective only if `auto_refresh` is `True`.
	verbose: `bool`, optional
	If `True`, will print more information in logs.
	watchdog_timeout: `float`, optional
	Timeout in seconds for shadow retry watchdog. If no data receives from stream but connection is active,
	client will retry automatically after this duration.

	Raises
	------
	`Exception`
	Any exception raised during initialization is re-raised after `close()` has been awaited.
	"""

	# The lock is held for the whole initialization.
	async with self._lock:
	if self._running:
	return

	try:
	self.verbose = verbose
	self.watchdog_timeout = watchdog_timeout
	# Returns the token, build label, session id and the HTTP session to reuse.
	access_token, build_label, session_id, session = await get_access_token(
	base_cookies=self.cookies,
	proxy=self.proxy,
	verbose=self.verbose,
	verify=self.kwargs.get("verify", True),
	)

	session.timeout = timeout
	self.client = session
	# Keep the local jar in sync with whatever the new session holds.
	self._cookies.update(self.client.cookies)
	self.access_token = access_token
	self.build_label = build_label
	self.session_id = session_id
	self._running = True
	self._reqid = random.randint(10000, 99999)

	self.timeout = timeout
	self.auto_close = auto_close
	self.close_delay = close_delay
	if self.auto_close:
	await self.reset_close_task()

	self.auto_refresh = auto_refresh
	self.refresh_interval = refresh_interval

	# Drop any previous refresh task before optionally starting a new one.
	if self.refresh_task:
	self.refresh_task.cancel()
	self.refresh_task = None

	if self.auto_refresh:
	self.refresh_task = asyncio.create_task(self.start_auto_refresh())

	await self._init_rpc()

	if self.verbose:
	logger.success("Gemini client initialized successfully.")
	except Exception:
	# Tear the client down on any failure, then propagate the error.
	await self.close()
	raise

	async def close(self, delay: float = 0) -> None:
	    """
	    Close the client after a certain period of inactivity, or call manually to close immediately.

	    Marks the client as not running, cancels the pending auto-close and
	    auto-refresh tasks, copies the session cookies back into the local jar
	    and closes the HTTP session.

	    Parameters
	    ----------
	    delay: `float`, optional
	        Time to wait before closing the client in seconds.
	    """

	    if delay:
	        await asyncio.sleep(delay)

	    self._running = False

	    # When the auto-close timer fires, this coroutine is itself running inside
	    # `close_task`. Cancelling the current task would raise CancelledError at the
	    # next suspension point (inside `self.client.close()`), leaving the session
	    # half-closed and `self.client` still set. Only cancel *other* tasks.
	    current = asyncio.current_task()

	    for slot in ("close_task", "refresh_task"):
	        task = getattr(self, slot)
	        if task:
	            if task is not current:
	                task.cancel()
	            setattr(self, slot, None)

	    if self.client:
	        # Preserve the latest cookies so a later `init` can reuse them.
	        self._cookies.update(self.client.cookies)
	        await self.client.close()
	        self.client = None

	async def reset_close_task(self) -> None:
	    """
	    Restart the auto-close countdown.

	    Any previously scheduled close task is cancelled and a new one is scheduled
	    that calls `close` after `close_delay` seconds.
	    """

	    stale_task = self.close_task
	    if stale_task:
	        self.close_task = None
	        stale_task.cancel()

	    delayed_close = self.close(self.close_delay)
	    self.close_task = asyncio.create_task(delayed_close)

	async def start_auto_refresh(self) -> None:
	    """
	    Background loop that periodically rotates the session cookies.

	    Runs while the client is marked as running. The refresh interval is
	    raised to at least 60 seconds. Failures are logged and retried on the
	    next interval; cancellation is propagated.
	    """
	    self.refresh_interval = max(self.refresh_interval, 60)

	    while self._running:
	        await asyncio.sleep(self.refresh_interval)

	        # The client may have been closed while this task was sleeping.
	        if not self._running:
	            return

	        try:
	            async with self._lock:
	                # Refresh all cookies in the background to keep the session alive.
	                rotated = await rotate_1psidts(self.client, self.verbose)

	                if not rotated:
	                    logger.warning(
	                        "Rotation response did not contain a new __Secure-1PSIDTS. "
	                        "Session might expire soon if this persists."
	                    )
	                else:
	                    logger.debug("Cookies refreshed (network update).")
	        except asyncio.CancelledError:
	            # Let task cancellation through untouched.
	            raise
	        except AuthError:
	            logger.warning(
	                "AuthError: Failed to refresh cookies. Retrying in next interval."
	            )
	        except Exception:
	            logger.warning(
	                "Unexpected error while refreshing cookies. Retrying in next interval."
	            )

	async def _init_rpc(self) -> None:
	    """
	    Run the session set-up RPC calls one after another.

	    Order: fetch models, send settings, send activity, fetch recent chats.
	    """
	    setup_steps = (
	        self._fetch_models,
	        self._send_bard_settings,
	        self._send_bard_activity,
	        self._fetch_recent_chats,
	    )
	    for step in setup_steps:
	        await step()

	async def _fetch_models(self) -> None:
	    """
	    Fetch and parse available models.

	    Sends a `GRPC.LIST_MODELS` batch request and stores the parsed entries in
	    `self._available_models`. Only the first response frame that carries a
	    model list (index 15 of the frame body) is used. Frames whose body is
	    empty or not valid JSON are skipped, mirroring `_fetch_recent_chats`.
	    """
	    response = await self._batch_execute(
	        [
	            RPCData(
	                rpcid=GRPC.LIST_MODELS,
	                payload="[]",
	            )
	        ]
	    )

	    response_json = extract_json_from_response(response.text)

	    available_models: list[AvailableModel] = []
	    for part in response_json:
	        part_body_str = get_nested_value(part, [2])
	        if not part_body_str:
	            continue

	        # A malformed frame must not abort client initialization.
	        try:
	            part_body = json.loads(part_body_str)
	        except json.JSONDecodeError:
	            continue

	        models_list = get_nested_value(part_body, [15])
	        if not isinstance(models_list, list):
	            continue

	        for model_data in models_list:
	            if not (isinstance(model_data, list) and len(model_data) > 2):
	                continue

	            model_id = get_nested_value(model_data, [0], "")
	            name = get_nested_value(model_data, [10]) or get_nested_value(
	                model_data, [1], ""
	            )
	            # Entries without an id or a display name are never listed, so
	            # skip them before doing the enum lookup.
	            if not (model_id and name):
	                continue

	            description = get_nested_value(
	                model_data, [12]
	            ) or get_nested_value(model_data, [2], "")

	            # Map the server-side id onto a known `Model` by looking for it
	            # inside that model's request header value.
	            core_model = Model.UNSPECIFIED
	            code_name = "unspecified"
	            for enum_model in Model:
	                val = enum_model.model_header.get(
	                    "x-goog-ext-525001261-jspb", ""
	                )
	                if val and (model_id in val):
	                    core_model = enum_model
	                    code_name = enum_model.model_name
	                    break

	            available_models.append(
	                AvailableModel(
	                    id=code_name,
	                    name=name,
	                    model=core_model,
	                    description=description,
	                )
	            )

	        # The model list has been found; later frames are ignored.
	        break

	    self._available_models = available_models

	async def _fetch_recent_chats(self, recent: int = 13) -> None:
	    """
	    Fetch recent chats and cache them in `self._recent_chats`.

	    Two `GRPC.LIST_CHATS` requests are sent in sequence (leading flag 1, then 0).
	    Their results are merged in that order, keeping the first occurrence of each
	    chat id. For each response, only the first frame that carries a chat list is used.
	    """

	    def _list_chats_rpc(flag: int) -> RPCData:
	        # NOTE(review): the meaning of the leading flag is not visible here —
	        # presumably it selects pinned vs. unpinned chats; confirm.
	        return RPCData(
	            rpcid=GRPC.LIST_CHATS,
	            payload=json.dumps([recent, None, [flag, None, 1]]).decode("utf-8"),
	        )

	    first_response = await self._batch_execute([_list_chats_rpc(1)])
	    second_response = await self._batch_execute([_list_chats_rpc(0)])

	    collected: list[ChatInfo] = []
	    for chats_response in (first_response, second_response):
	        for part in extract_json_from_response(chats_response.text):
	            body_str = get_nested_value(part, [2])
	            if not body_str:
	                continue

	            try:
	                body = json.loads(body_str)
	            except json.JSONDecodeError:
	                continue

	            chat_list = get_nested_value(body, [2])
	            if not isinstance(chat_list, list):
	                continue

	            for chat_data in chat_list:
	                if not (isinstance(chat_data, list) and len(chat_data) > 1):
	                    continue

	                cid = get_nested_value(chat_data, [0], "")
	                title = get_nested_value(chat_data, [1], "")
	                is_pinned = bool(get_nested_value(chat_data, [2]))

	                if not (cid and title):
	                    continue
	                if any(known.cid == cid for known in collected):
	                    continue
	                collected.append(
	                    ChatInfo(cid=cid, title=title, is_pinned=is_pinned)
	                )

	            # Stop at the first frame that actually contained a chat list.
	            break

	    self._recent_chats = collected

	async def _send_bard_settings(self) -> None:
	"""
	Send required setup activity to Gemini.

	Issues a single `GRPC.BARD_SETTINGS` batch call whose payload is a fixed,
	JSON-encoded list of setting key names. The response is not inspected.
	"""
	# NOTE(review): presumably this asks the server for the listed preference
	# keys, as the web app would on load — confirm against the web client.
	await self._batch_execute(
	[
	RPCData(
	rpcid=GRPC.BARD_SETTINGS,
	payload='[[["adaptive_device_responses_enabled","advanced_mode_theme_override_triggered","advanced_zs_upsell_dismissal_count","advanced_zs_upsell_last_dismissed","ai_transparency_notice_dismissed","audio_overview_discovery_dismissal_count","audio_overview_discovery_last_dismissed","bard_in_chrome_link_sharing_enabled","bard_sticky_mode_disabled_count","canvas_create_discovery_tooltip_seen_count","combined_files_button_tag_seen_count","indigo_banner_explicit_dismissal_count","indigo_banner_impression_count","indigo_banner_last_seen_sec","current_popup_id","deep_research_has_seen_file_upload_tooltip","deep_research_model_update_disclaimer_display_count","default_bot_id","disabled_discovery_card_feature_ids","disabled_model_discovery_tooltip_feature_ids","disabled_mode_disclaimers","disabled_new_model_badge_mode_ids","disabled_settings_discovery_tooltip_feature_ids","disablement_disclaimer_last_dismissed_sec","disable_advanced_beta_dialog","disable_advanced_beta_non_en_banner","disable_advanced_resubscribe_ui","disable_at_mentions_discovery_tooltip","disable_autorun_fact_check_u18","disable_bot_create_tips_card","disable_bot_docs_in_gems_disclaimer","disable_bot_onboarding_dialog","disable_bot_save_reminder_tips_card","disable_bot_send_prompt_tips_card","disable_bot_shared_in_drive_disclaimer","disable_bot_try_create_tips_card","disable_colab_tooltip","disable_collapsed_tool_menu_tooltip","disable_continue_discovery_tooltip","disable_debug_info_moved_tooltip_v2","disable_enterprise_mode_dialog","disable_export_python_tooltip","disable_extensions_discovery_dialog","disable_extension_one_time_badge","disable_fact_check_tooltip_v2","disable_free_file_upload_tips_card","disable_generated_image_download_dialog","disable_get_app_banner","disable_get_app_desktop_dialog","disable_googler_in_enterprise_mode","disable_human_review_disclosure","disable_ice_open_vega_editor_tooltip","disable_image_upload_tooltip","disable_legal_concern_tooltip","disable_llm_history_import_disclai
mer","disable_location_popup","disable_memory_discovery","disable_memory_extraction_discovery","disable_new_conversation_dialog","disable_onboarding_experience","disable_personal_context_tooltip","disable_photos_upload_disclaimer","disable_power_up_intro_tooltip","disable_scheduled_actions_mobile_notification_snackbar","disable_storybook_listen_button_tooltip","disable_streaming_settings_tooltip","disable_take_control_disclaimer","disable_teens_only_english_language_dialog","disable_tier1_rebranding_tooltip","disable_try_advanced_mode_dialog","enable_advanced_beta_mode","enable_advanced_mode","enable_googler_in_enterprise_mode","enable_memory","enable_memory_extraction","enable_personal_context","enable_personal_context_gemini","enable_personal_context_gemini_using_photos","enable_personal_context_gemini_using_workspace","enable_personal_context_search","enable_personal_context_youtube","enable_token_streaming","enforce_default_to_fast_version","mayo_discovery_banner_dismissal_count","mayo_discovery_banner_last_dismissed_sec","gempix_discovery_banner_dismissal_count","gempix_discovery_banner_last_dismissed","get_app_banner_ack_count","get_app_banner_seen_count","get_app_mobile_dialog_ack_count","guided_learning_banner_dismissal_count","guided_learning_banner_last_dismissed","has_accepted_agent_mode_fre_disclaimer","has_received_streaming_response","has_seen_agent_mode_tooltip","has_seen_bespoke_tooltip","has_seen_deepthink_mustard_tooltip","has_seen_deepthink_v2_tooltip","has_seen_deep_think_tooltip","has_seen_first_youtube_video_disclaimer","has_seen_ggo_tooltip","has_seen_image_grams_discovery_banner","has_seen_image_preview_in_input_area_tooltip","has_seen_kallo_discovery_banner","has_seen_kallo_tooltip","has_seen_model_picker_in_input_area_tooltip","has_seen_model_tooltip_in_input_area_for_gempix","has_seen_redo_with_gempix2_tooltip","has_seen_veograms_discovery_banner","has_seen_video_generation_discovery_banner","is_imported_chats_panel_open_by_default","jumps
tart_onboarding_dismissal_count","last_dismissed_deep_research_implicit_invite","last_dismissed_discovery_feature_implicit_invites","last_dismissed_immersives_canvas_implicit_invite","last_dismissed_immersive_share_disclaimer_sec","last_dismissed_strike_timestamp_sec","last_dismissed_zs_student_aip_banner_sec","last_get_app_banner_ack_timestamp_sec","last_get_app_mobile_dialog_ack_timestamp_sec","last_human_review_disclosure_ack","last_selected_mode_id_in_embedded","last_selected_mode_id_on_web","last_two_up_activation_timestamp_sec","last_winter_olympics_interaction_timestamp_sec","memory_extracted_greeting_name","mini_gemini_tos_closed","mode_switcher_soft_badge_disabled_ids","mode_switcher_soft_badge_seen_count","personalization_first_party_onboarding_cross_surface_clicked","personalization_first_party_onboarding_cross_surface_seen_count","personalization_one_p_discovery_card_seen_count","personalization_one_p_discovery_last_consented","personalization_zero_state_card_last_interacted","personalization_zero_state_card_seen_count","popup_zs_visits_cooldown","require_reconsent_setting_for_personalization_banner_seen_count","show_debug_info","side_nav_open_by_default","student_verification_dismissal_count","student_verification_last_dismissed","task_viewer_cc_banner_dismissed_count","task_viewer_cc_banner_dismissed_time_sec","tool_menu_new_badge_disabled_ids","tool_menu_new_badge_impression_counts","tool_menu_soft_badge_disabled_ids","tool_menu_soft_badge_impression_counts","upload_disclaimer_last_consent_time_sec","viewed_student_aip_upsell_campaign_ids","voice_language","voice_name","web_and_app_activity_enabled","wellbeing_nudge_notice_last_dismissed_sec","zs_student_aip_banner_dismissal_count"]]]',
	)
	]
	)

	async def _send_bard_activity(self) -> None:
	    """
	    Send the warm-up RPC that precedes a query.

	    Issues one `GRPC.BARD_SETTINGS` batch call for the `bard_activity_enabled`
	    key; the response is discarded.
	    """
	    warmup_rpc = RPCData(
	        rpcid=GRPC.BARD_SETTINGS,
	        payload='[[["bard_activity_enabled"]]]',
	    )
	    await self._batch_execute([warmup_rpc])

	def list_models(self) -> list[AvailableModel] | None:
	    """
	    Return the cached list of models available to the current account.

	    Returns
	    -------
	    `list[gemini_webapi.types.AvailableModel]`
	        The models cached by the last model fetch, or `None` if nothing has
	        been cached yet.
	    """
	    cached_models = self._available_models
	    return cached_models

	async def generate_content(
	    self,
	    prompt: str,
	    files: list[str | Path | bytes | io.BytesIO] | None = None,
	    model: Model | str | dict = Model.UNSPECIFIED,
	    gem: Gem | str | None = None,
	    chat: Optional["ChatSession"] = None,
	    temporary: bool = False,
	    **kwargs,
	) -> ModelOutput:
	    """
	    Generate a complete reply for `prompt` and return the final output.

	    The streaming generator is consumed to the end and only its last item is
	    returned. Any `io.BytesIO` objects in `files` are closed once the request
	    phase finishes, whether it succeeded or not.

	    Parameters
	    ----------
	    prompt: `str`
	        Text prompt provided by user.
	    files: `list[str | Path | bytes | io.BytesIO]`, optional
	        List of file paths or byte streams to be attached.
	    model: `Model | str | dict`, optional
	        Specify the model to use for generation.
	        Pass either a `gemini_webapi.constants.Model` enum or a model name string to use predefined models.
	        Pass a dictionary to use custom model header strings ("model_name" and "model_header" keys must be provided).
	    gem: `Gem | str`, optional
	        Specify a gem to use as system prompt for the chat session.
	        Pass either a `gemini_webapi.types.Gem` object or a gem id string.
	    chat: `ChatSession`, optional
	        Chat data to retrieve conversation history.
	        If None, will automatically generate a new chat id when sending post request.
	    temporary: `bool`, optional
	        If set to `True`, the ongoing conversation will not show up in Gemini history.
	    kwargs: `dict`, optional
	        Additional arguments which will be passed to the post request.
	        Refer to `curl_cffi.requests.AsyncSession.request` for more information.

	    Returns
	    -------
	    :class:`ModelOutput`
	        Output data from gemini.google.com.

	    Raises
	    ------
	    `AssertionError`
	        If prompt is empty.
	    `gemini_webapi.TimeoutError`
	        If request timed out.
	    `gemini_webapi.GeminiError`
	        If no reply candidate found in response.
	    `gemini_webapi.APIError`
	        - If request failed with status code other than 200.
	        - If response structure is invalid and failed to parse.
	    """

	    if self.auto_close:
	        await self.reset_close_task()

	    attachments = None
	    if files:
	        await self._send_bard_activity()

	        # Upload every attachment concurrently; results keep the order of `files`.
	        upload_jobs = [
	            upload_file(item, client=self.client, verbose=self.verbose)
	            for item in files
	        ]
	        uploaded_urls = await asyncio.gather(*upload_jobs)
	        attachments = [
	            [[url], parse_file_name(item)]
	            for url, item in zip(uploaded_urls, files)
	        ]

	    try:
	        await self._send_bard_activity()

	        # State dict handed to the internal generator for this request.
	        stream_state = dict(
	            last_texts={},
	            last_thoughts={},
	            last_progress_time=time.time(),
	            is_thinking=False,
	            is_queueing=False,
	            title=None,
	        )

	        # Drain the stream; only the last chunk is of interest here.
	        final_output = None
	        async for chunk in self._generate(
	            prompt=prompt,
	            req_file_data=attachments,
	            model=model,
	            gem=gem,
	            chat=chat,
	            temporary=temporary,
	            session_state=stream_state,
	            **kwargs,
	        ):
	            final_output = chunk

	        if final_output is None:
	            raise GeminiError(
	                "Failed to generate contents. No output data found in response."
	            )

	        if isinstance(chat, ChatSession):
	            final_output.metadata = chat.metadata
	            chat.last_output = final_output

	        return final_output

	    finally:
	        # Release in-memory streams supplied by the caller.
	        for item in files or ():
	            if isinstance(item, io.BytesIO):
	                item.close()

	async def generate_content_stream(
	    self,
	    prompt: str,
	    files: list[str | Path | bytes | io.BytesIO] | None = None,
	    model: Model | str | dict = Model.UNSPECIFIED,
	    gem: Gem | str | None = None,
	    chat: Optional["ChatSession"] = None,
	    temporary: bool = False,
	    **kwargs,
	) -> AsyncGenerator[ModelOutput, None]:
	    """
	    Generate a reply for `prompt`, yielding partial outputs as they arrive.

	    Every item produced by the internal generator is yielded unchanged. After
	    the stream ends, the last output is attached to `chat` when `chat` is a
	    `ChatSession`. Any `io.BytesIO` objects in `files` are closed when the
	    generator finishes or is closed.

	    Parameters
	    ----------
	    prompt: `str`
	        Text prompt provided by user.
	    files: `list[str | Path | bytes | io.BytesIO]`, optional
	        List of file paths or byte streams to be attached.
	    model: `Model | str | dict`, optional
	        Specify the model to use for generation.
	    gem: `Gem | str`, optional
	        Specify a gem to use as system prompt for the chat session.
	    chat: `ChatSession`, optional
	        Chat data to retrieve conversation history.
	    temporary: `bool`, optional
	        If set to `True`, the ongoing conversation will not show up in Gemini history.
	    kwargs: `dict`, optional
	        Additional arguments passed to `curl_cffi.requests.AsyncSession.stream`.

	    Yields
	    ------
	    :class:`ModelOutput`
	        Partial output data. The `text_delta` attribute contains only the NEW characters
	        received since the last yield.

	    Raises
	    ------
	    `gemini_webapi.APIError`
	        If the request fails or response structure is invalid.
	    `gemini_webapi.TimeoutError`
	        If the stream request times out.
	    """

	    if self.auto_close:
	        await self.reset_close_task()

	    attachments = None
	    if files:
	        await self._send_bard_activity()

	        # Upload every attachment concurrently; results keep the order of `files`.
	        upload_jobs = [
	            upload_file(item, client=self.client, verbose=self.verbose)
	            for item in files
	        ]
	        uploaded_urls = await asyncio.gather(*upload_jobs)
	        attachments = [
	            [[url], parse_file_name(item)]
	            for url, item in zip(uploaded_urls, files)
	        ]

	    try:
	        await self._send_bard_activity()

	        # State dict handed to the internal generator for this request.
	        stream_state = dict(
	            last_texts={},
	            last_thoughts={},
	            last_progress_time=time.time(),
	            is_thinking=False,
	            is_queueing=False,
	            title=None,
	        )

	        last_output = None
	        async for chunk in self._generate(
	            prompt=prompt,
	            req_file_data=attachments,
	            model=model,
	            gem=gem,
	            chat=chat,
	            temporary=temporary,
	            session_state=stream_state,
	            **kwargs,
	        ):
	            last_output = chunk
	            yield chunk

	        # Record the final chunk on the chat session once streaming is done.
	        if last_output and isinstance(chat, ChatSession):
	            last_output.metadata = chat.metadata
	            chat.last_output = last_output

	    finally:
	        # Release in-memory streams supplied by the caller.
	        for item in files or ():
	            if isinstance(item, io.BytesIO):
	                item.close()

	@running(retry=5)
	async def _generate(
	self,
	prompt: str,
	req_file_data: list[Any] \| None = None,
	model: Model \| str \| dict = Model.UNSPECIFIED,
	gem: Gem \| str \| None = None,
	chat: Optional["ChatSession"] = None,
	temporary: bool = False,
	session_state: dict[str, Any] \| None = None,
	**kwargs,
	) -> AsyncGenerator[ModelOutput, None]:
	"""
	Internal method which actually sends content generation requests.
	"""

	assert prompt, "Prompt cannot be empty."

	if isinstance(model, str):
	model = Model.from_name(model)
	elif isinstance(model, dict):
	model = Model.from_dict(model)
	elif not isinstance(model, Model):
	raise TypeError(
	f"'model' must be a `gemini_webapi.constants.Model` instance, "
	f"string, or dictionary; got `{type(model).__name__}`"
	)

	_reqid = self._reqid
	self._reqid += 100000

	gem_id = gem.id if isinstance(gem, Gem) else gem

	chat_backup: dict[str, Any] \| None = None
	if chat:
	chat_backup = {
	"metadata": (
	list(chat.metadata)
	if getattr(chat, "metadata", None)
	else list(_DEFAULT_METADATA)
	),
	"cid": getattr(chat, "cid", ""),
	"rid": getattr(chat, "rid", ""),
	"rcid": getattr(chat, "rcid", ""),
	}

	if session_state is None:
	session_state = {
	"last_texts": {},
	"last_thoughts": {},
	"last_progress_time": time.time(),
	"is_thinking": False,
	"is_queueing": False,
	"title": None,
	}
	else:
	# Reset connection-specific states during a retry attempt
	session_state["last_progress_time"] = time.time()
	session_state["is_thinking"] = False
	session_state["is_queueing"] = False

	has_generated_text = False
	sleep_time = 10

	message_content = [
	prompt,
	0,
	None,
	req_file_data,
	None,
	None,
	0,
	]

	params: dict[str, Any] = {"_reqid": _reqid, "rt": "c"}
	if self.build_label:
	params["bl"] = self.build_label
	if self.session_id:
	params["f.sid"] = self.session_id

	while True:
	try:
	inner_req_list: list[Any] = [None] * 69
	inner_req_list[0] = message_content
	inner_req_list[2] = chat.metadata if chat else list(_DEFAULT_METADATA)
	inner_req_list[STREAMING_FLAG_INDEX] = 1
	if gem_id:
	inner_req_list[GEM_FLAG_INDEX] = gem_id
	if temporary:
	inner_req_list[TEMPORARY_CHAT_FLAG_INDEX] = 1

	request_data = {
	"at": self.access_token,
	"f.req": json.dumps(
	[
	None,
	json.dumps(inner_req_list).decode("utf-8"),
	]
	).decode("utf-8"),
	}

	async with self.client.stream(
	"POST",
	Endpoint.GENERATE,
	params=params,
	headers=model.model_header,
	data=request_data,
	**kwargs,
	) as response:
	if self.verbose:
	logger.debug(
	f"HTTP Request: POST {Endpoint.GENERATE} [{response.status_code}]"
	)
	if response.status_code != 200:
	await self.close()
	raise APIError(
	f"Failed to generate contents. Status: {response.status_code}"
	)

	buffer = ""
	decoder = codecs.getincrementaldecoder("utf-8")(errors="replace")

	last_texts: dict[str, str] = session_state["last_texts"]
	last_thoughts: dict[str, str] = session_state["last_thoughts"]
	last_progress_time = session_state["last_progress_time"]

	is_thinking = session_state["is_thinking"]
	is_queueing = session_state["is_queueing"]
	has_candidates = False
	is_completed = False # Check if this conversation turn has been fully answered.
	is_final_chunk = False # Check if this turn is saved to history and marked complete or still pending (e.g., video generation).
	cid = chat.cid if chat else ""
	rid = chat.rid if chat else ""

	async def _process_parts(
	parts: list[Any],
	) -> AsyncGenerator[ModelOutput, None]:
	nonlocal is_thinking, is_queueing, has_candidates, is_completed, is_final_chunk, cid, rid
	for part in parts:
	# Check for fatal error codes
	error_code = get_nested_value(part, [5, 2, 0, 1, 0])
	if error_code:
	await self.close()
	match error_code:
	case ErrorCode.USAGE_LIMIT_EXCEEDED:
	raise UsageLimitExceeded(
	f"Usage limit exceeded for model '{model.model_name}'. Please wait a few minutes, "
	"switch to a different model (e.g., Gemini Flash), or check your account limits on gemini.google.com."
	)
	case ErrorCode.MODEL_INCONSISTENT:
	raise ModelInvalid(
	"The specified model is inconsistent with the conversation history. "
	"Please ensure you are using the same 'model' parameter throughout the entire ChatSession."
	)
	case ErrorCode.MODEL_HEADER_INVALID:
	raise ModelInvalid(
	f"The model '{model.model_name}' is currently unavailable or the request structure is outdated. "
	"Please update 'gemini_webapi' to the latest version or report this on GitHub if the problem persists."
	)
	case ErrorCode.IP_TEMPORARILY_BLOCKED:
	raise TemporarilyBlocked(
	"Your IP address has been temporarily flagged or blocked by Google. "
	"Please try using a proxy, a different network, or wait for a while before retrying."
	)
	case ErrorCode.TEMPORARY_ERROR_1013:
	raise APIError(
	"Gemini encountered a temporary error (1013). Retrying..."
	)
	case _:
	raise APIError(
	f"Failed to generate contents (stream). Unknown API error code: {error_code}. "
	"This might be a temporary Google service issue."
	)

	# Check for queueing status
	status = get_nested_value(part, [5])
	if isinstance(status, list) and status:
	if not is_thinking:
	is_queueing = True
	session_state["is_queueing"] = True
	if not has_candidates:
	logger.debug(
	"Model is in a waiting state (queueing)..."
	)

	inner_json_str = get_nested_value(part, [2])
	if inner_json_str:
	try:
	part_json = json.loads(inner_json_str)
	m_data = get_nested_value(part_json, [1])
	cid = get_nested_value(m_data, [0], "")
	rid = get_nested_value(m_data, [1], "")
	if m_data and isinstance(chat, ChatSession):
	chat.metadata = m_data

	# Check for busy analyzing data
	tool_name = get_nested_value(part_json, [6, 1, 0])
	if tool_name == "data_analysis_tool":
	is_thinking = True
	session_state["is_thinking"] = True
	is_queueing = False
	session_state["is_queueing"] = False
	if not has_candidates:
	logger.debug(
	f"Model is active (thinking/analyzing)... Raw: {str(part_json)[:500]}"
	)

	context_str = get_nested_value(part_json, [25])
	if isinstance(context_str, str):
	is_final_chunk = True
	is_thinking = False
	session_state["is_thinking"] = False
	is_queueing = False
	session_state["is_queueing"] = False
	if isinstance(chat, ChatSession):
	chat.metadata = [None] * 9 + [context_str]

	title = get_nested_value(part_json, [10, 0])
	if title:
	session_state["title"] = title

	candidates_list = get_nested_value(
	part_json, [4], []
	)
	if candidates_list:
	output_candidates = []
	for i, candidate_data in enumerate(
	candidates_list
	):
	rcid = get_nested_value(candidate_data, [0])
	if not rcid:
	continue
	if isinstance(chat, ChatSession):
	chat.rcid = rcid

	(
	text,
	thoughts,
	web_images,
	generated_images,
	generated_videos,
	) = self._parse_candidate(
	candidate_data, cid, rid, rcid
	)

	# Check if this frame represents the complete state of the message
	is_completed = (
	get_nested_value(
	candidate_data, [8, 0], 1
	)
	== 2
	)

	# Save this conversation turn to list_chats whenever it is stored in history.
	if is_final_chunk:
	cid = get_nested_value(
	part_json, [1, 0]
	)
	if cid and isinstance(
	self._recent_chats, list
	):
	chat_title = session_state.get(
	"title"
	)
	if not chat_title:
	for c in self._recent_chats:
	if c.cid == cid:
	chat_title = c.title
	break

	if chat_title:
	is_pinned = False
	for c in self._recent_chats:
	if c.cid == cid:
	is_pinned = c.is_pinned
	break

	expected_idx = (
	0
	if is_pinned
	else sum(
	1
	for c in self._recent_chats
	if c.cid != cid
	and c.is_pinned
	)
	)

	if not (
	len(self._recent_chats)
	> expected_idx
	and self._recent_chats[
	expected_idx
	].cid
	== cid
	and self._recent_chats[
	expected_idx
	].title
	== chat_title
	):
	self._recent_chats = [
	c
	for c in self._recent_chats
	if c.cid != cid
	]
	self._recent_chats.insert(
	expected_idx,
	ChatInfo(
	cid=cid,
	title=chat_title,
	is_pinned=is_pinned,
	),
	)

	last_sent_text = last_texts.get(
	rcid
	) or last_texts.get(f"idx_{i}", "")
	text_delta, new_full_text = (
	get_delta_by_fp_len(
	text,
	last_sent_text,
	is_final=is_completed,
	)
	)
	last_sent_thought = last_thoughts.get(
	rcid
	) or last_thoughts.get(f"idx_{i}", "")
	if thoughts:
	thoughts_delta, new_full_thought = (
	get_delta_by_fp_len(
	thoughts,
	last_sent_thought,
	is_final=is_completed,
	)
	)
	else:
	thoughts_delta = ""
	new_full_thought = ""

	if (
	text_delta
	or thoughts_delta
	or web_images
	or generated_images
	):
	has_candidates = True
	if thoughts_delta:
	logger.debug(f"[Thinking]: {thoughts_delta.strip()}")
	if text_delta:
	logger.debug(f"[Generating]: {text_delta.strip()}")

	# Update state with the provider's cleaned state to handle drift
	last_texts[rcid] = last_texts[
	f"idx_{i}"
	] = new_full_text

	last_thoughts[rcid] = last_thoughts[
	f"idx_{i}"
	] = new_full_thought

	output_candidates.append(
	Candidate(
	rcid=rcid,
	text=text,
	text_delta=text_delta,
	thoughts=thoughts or None,
	thoughts_delta=thoughts_delta,
	web_images=web_images,
	generated_images=generated_images,
	generated_videos=generated_videos,
	)
	)

	if output_candidates:
	is_thinking = False
	session_state["is_thinking"] = False
	is_queueing = False
	session_state["is_queueing"] = False
	yield ModelOutput(
	metadata=get_nested_value(
	part_json, [1], []
	),
	candidates=output_candidates,
	)
	except json.JSONDecodeError:
	continue

	chunk_iterator = response.aiter_content().__aiter__()
	while True:
	try:
	stall_threshold = (
	self.timeout
	if (is_thinking or is_queueing)
	else min(self.timeout, self.watchdog_timeout)
	)
	chunk = await asyncio.wait_for(
	chunk_iterator.__anext__(), timeout=stall_threshold + 5
	)
	except StopAsyncIteration:
	break
	except asyncio.TimeoutError:
	logger.debug(
	f"[Watchdog] Socket idle for {stall_threshold + 5}s. Refreshing connection..."
	)
	break

	buffer += decoder.decode(chunk, final=False)
	if buffer.startswith(")]}'"):
	buffer = buffer[4:].lstrip()
	parsed_parts, buffer = parse_response_by_frame(buffer)

	got_update = False
	async for out in _process_parts(parsed_parts):
	has_generated_text = True
	yield out
	got_update = True

	if got_update:
	last_progress_time = time.time()
	session_state["last_progress_time"] = last_progress_time
	else:
	stall_threshold = (
	self.timeout
	if (is_thinking or is_queueing)
	else min(self.timeout, self.watchdog_timeout)
	)
	if (time.time() - last_progress_time) > stall_threshold:
	if is_thinking:
	logger.debug(
	f"[Watchdog] Model is taking its time thinking ({int(time.time() - last_progress_time)}s). Reconnecting to poll..."
	)
	break
	else:
	logger.debug(
	f"[Watchdog] Connection idle for {stall_threshold}s (queueing={is_queueing}). "
	"Attempting recovery..."
	)
	await self.close()
	break

	# Final flush
	buffer += decoder.decode(b"", final=True)
	if buffer:
	parsed_parts, _ = parse_response_by_frame(buffer)
	async for out in _process_parts(parsed_parts):
	has_generated_text = True
	yield out

	if not is_completed or is_thinking or is_queueing:
	stall_threshold = (
	self.timeout
	if (is_thinking or is_queueing)
	else min(self.timeout, self.watchdog_timeout)
	)
	if (time.time() - last_progress_time) > stall_threshold:
	if not is_thinking:
	logger.debug(
	f"[Watchdog] Stream ended after {stall_threshold}s without completing. Triggering recovery..."
	)
	else:
	logger.debug(
	"[Watchdog] Stream finished but model is still thinking. Polling again..."
	)

	if cid:
	logger.debug(
	f"Stream incomplete. Checking conversation history for {cid}..."
	)

	poll_start_time = time.time()

	while True:
	if (time.time() - poll_start_time) > self.timeout:
	logger.warning(
	f"[Recovery] Polling for {cid} timed out after {self.timeout}s."
	)
	if has_generated_text:
	raise GeminiError(
	"The connection to Gemini was lost while generating the response, and recovery timed out. "
	"Please try sending your prompt again."
	)
	else:
	raise APIError(
	"read_chat polling timed out waiting for the model to finish. "
	"The original request may have been silently aborted by Google."
	)
	await self._send_bard_activity()
	recovered_history = await self.read_chat(cid)
	if (
	recovered_history
	and recovered_history.turns
	and recovered_history.turns[-1].role == "model"
	):
	recovered = recovered_history.turns[-1].info
	if (
	recovered
	and recovered.candidates
	and (
	recovered.candidates[0].text.strip()
	or recovered.candidates[0].generated_images
	or recovered.candidates[0].web_images
	)
	):
	rec_rcid = recovered.candidates[0].rcid
	prev_rcid = (
	chat_backup["rcid"] if chat_backup else ""
	)
	current_expected_rcid = (
	getattr(chat, "rcid", "") if chat else ""
	)

	is_new_turn = (
	rec_rcid == current_expected_rcid
	if current_expected_rcid
	else rec_rcid != prev_rcid
	)

	if is_new_turn:
	logger.debug(
	f"[Recovery] Successfully recovered response for CID: {cid} (RCID: {rec_rcid})"
	)
	if chat:
	recovered.metadata = chat.metadata
	chat.rcid = rec_rcid
	yield recovered
	break
	else:
	logger.debug(
	f"[Recovery] Recovered turn is not the target turn (target: {current_expected_rcid or 'NEW'}, got {rec_rcid}). Waiting..."
	)

	logger.debug(
	f"[Recovery] Response not ready, waiting {sleep_time}s..."
	)
	await asyncio.sleep(sleep_time)
	break
	else:
	logger.debug(
	f"Stream suspended (completed={is_completed}, final_chunk={is_final_chunk}, thinking={is_thinking}, queueing={is_queueing}). "
	f"No CID found to recover. (Request ID: {_reqid})"
	)
	raise APIError(
	"The original request may have been silently aborted by Google."
	)

	break

	except ReadTimeout:
	raise TimeoutError(
	"The request timed out while waiting for Gemini to respond. This often happens with very long prompts "
	"or complex file analysis. Try increasing the 'timeout' value when initializing GeminiClient."
	)
	except (GeminiError, APIError):
	if not has_generated_text and chat and chat_backup:
	chat.metadata = list(chat_backup["metadata"]) # type: ignore
	chat.cid = chat_backup["cid"]
	chat.rid = chat_backup["rid"]
	chat.rcid = chat_backup["rcid"]
	raise
	except Exception:
	if not has_generated_text and chat and chat_backup:
	chat.metadata = list(chat_backup["metadata"]) # type: ignore
	chat.cid = chat_backup["cid"]
	chat.rid = chat_backup["rid"]
	chat.rcid = chat_backup["rcid"]
	logger.debug(
	"Stream parsing interrupted. Attempting to recover conversation context..."
	)
	raise APIError(
	"Failed to parse response body from Google. This might be a temporary API change or invalid data."
	)

	def start_chat(self, **kwargs) -> "ChatSession":
	    """
	    Create a `ChatSession` bound to this client.

	    Parameters
	    ----------
	    kwargs: `dict`, optional
	        Extra keyword arguments forwarded unchanged to the `ChatSession` constructor.
	        Refer to `gemini_webapi.ChatSession` for more information.

	    Returns
	    -------
	    :class:`ChatSession`
	        A chat session object whose `geminiclient` is this client.
	    """

	    session = ChatSession(geminiclient=self, **kwargs)
	    return session

	async def delete_chat(self, cid: str) -> None:
	    """
	    Delete a specific conversation by chat id.

	    Two batch-execute requests are sent one after the other: `GRPC.DELETE_CHAT`
	    first, then `GRPC.DELETE_CHAT_SECOND`. The second request is only built and
	    sent once the first one has returned.

	    Parameters
	    ----------
	    cid: `str`
	        The ID of the chat requiring deletion (e.g. "c_...").
	    """

	    first_step = RPCData(
	        rpcid=GRPC.DELETE_CHAT,
	        payload=json.dumps([cid]).decode("utf-8"),
	    )
	    await self._batch_execute([first_step])

	    second_payload = json.dumps([cid, [1, None, 0, 1]]).decode("utf-8")
	    second_step = RPCData(rpcid=GRPC.DELETE_CHAT_SECOND, payload=second_payload)
	    await self._batch_execute([second_step])

	def list_chats(self) -> list[ChatInfo] | None:
	    """
	    Return the conversations currently cached on this client.

	    No request is made; the value of `self._recent_chats` is handed back as-is
	    (the same object, not a copy).

	    Returns
	    -------
	    `list[gemini_webapi.types.ChatInfo] | None`
	        The list of conversations. Returns `None` if the client holds no session cache.
	    """
	    cached_chats = self._recent_chats
	    return cached_chats

	async def read_chat(self, cid: str, limit: int = 10) -> ChatHistory | None:
	    """
	    Fetch the conversation history by chat id.

	    Sends a single `GRPC.READ_CHAT` request and builds the history from the first
	    response part that carries turn data. The call is deliberately best-effort:
	    any exception raised while requesting or parsing is logged at debug level
	    (including the exception itself) and turned into `None`.

	    Parameters
	    ----------
	    cid: `str`
	        The ID of the conversation to read (e.g. "c_...").
	    limit: `int`, optional
	        The maximum number of turns to fetch, by default 10.

	    Returns
	    -------
	    :class:`ChatHistory` | None
	        The conversation history, or None if reading failed or no turn data was found.
	    """
	    try:
	        response = await self._batch_execute(
	            [
	                RPCData(
	                    rpcid=GRPC.READ_CHAT,
	                    payload=json.dumps(
	                        [cid, limit, None, 1, [1], [4], None, 1]
	                    ).decode("utf-8"),
	                ),
	            ]
	        )

	        response_json = extract_json_from_response(response.text)

	        for part in response_json:
	            # Parts without a body string at index 2 carry nothing to parse.
	            part_body_str = get_nested_value(part, [2])
	            if not part_body_str:
	                continue

	            part_body = json.loads(part_body_str)
	            turns_data = get_nested_value(part_body, [0])
	            if not turns_data:
	                continue

	            chat_turns = []
	            for conv_turn in turns_data:
	                # User turn
	                user_text = get_nested_value(conv_turn, [2, 0, 0], "")
	                if user_text:
	                    chat_turns.append(ChatTurn(role="user", text=user_text))

	                # Model turn
	                candidates_list = get_nested_value(conv_turn, [3, 0])
	                if not candidates_list:
	                    continue

	                rid = get_nested_value(conv_turn, [1], "")
	                output_candidates = []
	                for candidate_data in candidates_list:
	                    rcid = get_nested_value(candidate_data, [0], "")
	                    (
	                        text,
	                        thoughts,
	                        web_images,
	                        generated_images,
	                        generated_videos,
	                    ) = self._parse_candidate(candidate_data, cid, rid, rcid)
	                    output_candidates.append(
	                        Candidate(
	                            rcid=rcid,
	                            text=text,
	                            # Empty thoughts become None, matching how the
	                            # streaming path builds its candidates.
	                            thoughts=thoughts or None,
	                            web_images=web_images,
	                            generated_images=generated_images,
	                            generated_videos=generated_videos,
	                        )
	                    )

	                model_output = ModelOutput(
	                    metadata=[cid, rid, output_candidates[0].rcid],
	                    candidates=output_candidates,
	                )
	                chat_turns.append(
	                    ChatTurn(
	                        role="model",
	                        text=output_candidates[0].text,
	                        info=model_output,
	                    )
	                )

	            # Only the first part that carries turn data is used.
	            return ChatHistory(cid=cid, metadata=[cid], turns=chat_turns)

	        return None
	    except Exception as exc:
	        # Best-effort by design (callers poll this method), but keep the real
	        # cause visible so request/parsing failures can be told apart from a
	        # response that is simply not ready yet.
	        logger.debug(
	            f"[read_chat] Response data for {cid!r} is still incomplete (model is still processing)... "
	            f"({type(exc).__name__}: {exc})"
	        )
	        return None

	def _parse_candidate(
	    self, candidate_data: list[Any], cid: str, rid: str, rcid: str
	) -> tuple[str, str, list[WebImage], list[GeneratedImage], list[GeneratedVideo]]:
	    """
	    Extract text, thoughts and media from one raw candidate entry.

	    Args:
	        candidate_data (list[Any]): The raw candidate list from the API response.
	        cid (str): Conversation ID, attached to generated images and videos.
	        rid (str): Response ID, attached to generated images and videos.
	        rcid (str): Response Candidate ID, attached to generated images and videos.

	    Returns:
	        tuple: A tuple containing:
	            - text (str): The main response text with googleusercontent artifacts removed.
	            - thoughts (str): The model's reasoning text, or "" when absent.
	            - web_images (list[WebImage]): Images found on the web.
	            - generated_images (list[GeneratedImage]): Images generated by the model.
	            - generated_videos (list[GeneratedVideo]): Videos generated by the model.
	    """
	    # The main text sits at [1, 0]; when it starts with a card_content
	    # placeholder URL, prefer the value at [22, 0] if one is present.
	    body_text = get_nested_value(candidate_data, [1, 0], "")
	    if _CARD_CONTENT_RE.match(body_text):
	        card_text = get_nested_value(candidate_data, [22, 0])
	        if card_text:
	            body_text = card_text

	    # Strip googleusercontent placeholder URLs left in the text.
	    body_text = _ARTIFACTS_RE.sub("", body_text)

	    reasoning = get_nested_value(candidate_data, [37, 0, 0]) or ""

	    # Web images: entries without a URL are dropped; titles are numbered from 1
	    # by position in the raw list (dropped entries still consume a number).
	    web_images = [
	        WebImage(
	            url=source_url,
	            title=f"[Image {position}]",
	            alt=get_nested_value(entry, [0, 4], ""),
	            proxy=self.proxy,
	            client=self.client,
	        )
	        for position, entry in enumerate(
	            get_nested_value(candidate_data, [12, 1], []), start=1
	        )
	        if (source_url := get_nested_value(entry, [0, 0, 0]))
	    ]

	    # Generated images: titles and fallback ids use the zero-based position.
	    generated_images = []
	    generated_entries = get_nested_value(candidate_data, [12, 7, 0], [])
	    for slot, entry in enumerate(generated_entries):
	        image_url = get_nested_value(entry, [0, 3, 3])
	        if not image_url:
	            continue

	        # Fall back to a synthetic placeholder id when the entry carries none.
	        image_id = (
	            get_nested_value(entry, [1, 0])
	            or f"http://googleusercontent.com/image_generation_content/{slot}"
	        )
	        generated_images.append(
	            GeneratedImage(
	                url=image_url,
	                title=f"[Generated Image {slot}]",
	                alt=get_nested_value(entry, [0, 3, 2], ""),
	                proxy=self.proxy,
	                client=self.client,
	                client_ref=self,
	                cid=cid,
	                rid=rid,
	                rcid=rcid,
	                image_id=image_id,
	            )
	        )

	    # Generated videos: an entry needs at least two URLs, used as
	    # (thumbnail, video) in that order.
	    generated_videos = []
	    for video_root in get_nested_value(candidate_data, [12, 59, 0], []):
	        video_info = get_nested_value(video_root, [0])
	        if not video_info:
	            continue

	        media_urls = get_nested_value(video_info, [0, 7], [])
	        if len(media_urls) < 2:
	            continue

	        generated_videos.append(
	            GeneratedVideo(
	                url=media_urls[1],
	                thumbnail=media_urls[0],
	                cid=cid,
	                rid=rid,
	                rcid=rcid,
	                client_ref=self,
	                proxy=self.proxy,
	            )
	        )

	    return body_text, reasoning, web_images, generated_images, generated_videos

	async def _get_image_full_size(
	    self, cid: str, rid: str, rcid: str, image_id: str
	) -> str | None:
	    """
	    Ask the `GRPC.IMAGE_FULL_SIZE` RPC for the full size URL of an image.

	    Returns the first element of the decoded response body, or `None` when the
	    request or the parsing raises (the failure is only logged at debug level).
	    """
	    try:
	        image_request = [
	            [None, None, None, [None, None, None, None, None, ""]],
	            [image_id, 0],
	            None,
	            [19, ""],
	            None,
	            None,
	            None,
	            None,
	            None,
	            "",
	        ]
	        turn_reference = [rid, rcid, cid, None, ""]
	        payload = [image_request, turn_reference, 1, 0, 1]

	        rpc_call = RPCData(
	            rpcid=GRPC.IMAGE_FULL_SIZE,
	            payload=json.dumps(payload).decode("utf-8"),
	        )
	        response = await self._batch_execute([rpc_call])

	        response_data = extract_json_from_response(response.text)
	        # The body at [0, 2] is itself a JSON string; "[]" stands in when it is missing.
	        body = json.loads(get_nested_value(response_data, [0, 2], "[]"))
	        return get_nested_value(body, [0])
	    except Exception:
	        logger.debug(
	            "[_get_image_full_size] Could not retrieve full size URL via RPC."
	        )
	        return None

	@running(retry=2)
	async def _batch_execute(self, payloads: list[RPCData], **kwargs) -> Response:
	    """
	    Execute a batch of requests to Gemini API.

	    Each call consumes the current `self._reqid` and advances it by 100000.

	    Parameters
	    ----------
	    payloads: `list[RPCData]`
	        List of `gemini_webapi.types.RPCData` objects to be executed.
	    kwargs: `dict`, optional
	        Additional arguments which will be passed to the post request.
	        Refer to `curl_cffi.requests.AsyncSession.request` for more information.

	    Returns
	    -------
	    :class:`curl_cffi.requests.Response`
	        Response object containing the result of the batch execution.

	    Raises
	    ------
	    `TimeoutError`
	        If the underlying request raised `ReadTimeout`.
	    `APIError`
	        If the response status code is not 200; the client is closed first.
	    """

	    request_id = self._reqid
	    self._reqid = request_id + 100000

	    try:
	        query: dict[str, Any] = {
	            "rpcids": ",".join(p.rpcid for p in payloads),
	            "_reqid": request_id,
	            "rt": "c",
	            "source-path": "/app",
	        }
	        # Optional query parameters are only sent when they hold a truthy value.
	        for key, value in (("bl", self.build_label), ("f.sid", self.session_id)):
	            if value:
	                query[key] = value

	        response = await self.client.post(
	            Endpoint.BATCH_EXEC,
	            params=query,
	            data={
	                "at": self.access_token,
	                "f.req": json.dumps(
	                    [[payload.serialize() for payload in payloads]]
	                ).decode("utf-8"),
	            },
	            **kwargs,
	        )
	        if self.verbose:
	            logger.debug(
	                f"HTTP Request: POST {Endpoint.BATCH_EXEC} [{response.status_code}]"
	            )
	    except ReadTimeout:
	        raise TimeoutError(
	            "The request timed out while waiting for Gemini to respond. This often happens with very long prompts "
	            "or complex file analysis. Try increasing the 'timeout' value when initializing GeminiClient."
	        )

	    if response.status_code == 200:
	        return response

	    await self.close()
	    raise APIError(
	        f"Batch execution failed with status code {response.status_code}"
	    )


	class ChatSession:
	    """
	    Chat data to retrieve conversation history. Only if all 3 ids are provided will the conversation history be retrieved.

	    The ids are stored in a private metadata list (a copy of `_DEFAULT_METADATA`);
	    `cid`, `rid` and `rcid` are views onto its first three slots.

	    Parameters
	    ----------
	    geminiclient: `GeminiClient`
	        Async requests client interface for gemini.google.com.
	    metadata: `list[str]`, optional
	        List of chat metadata `[cid, rid, rcid]`, can be shorter than 3 elements, like `[cid, rid]` or `[cid]` only.
	    cid: `str`, optional
	        Chat id, if provided together with metadata, will override the first value in it.
	    rid: `str`, optional
	        Reply id, if provided together with metadata, will override the second value in it.
	    rcid: `str`, optional
	        Reply candidate id, if provided together with metadata, will override the third value in it.
	    model: `Model | str | dict`, optional
	        Specify the model to use for generation.
	        Pass either a `gemini_webapi.constants.Model` enum or a model name string to use predefined models.
	        Pass a dictionary to use custom model header strings ("model_name" and "model_header" keys must be provided).
	    gem: `Gem | str`, optional
	        Specify a gem to use as system prompt for the chat session.
	        Pass either a `gemini_webapi.types.Gem` object or a gem id string.
	    """

	    __slots__ = [
	        "__metadata",
	        "geminiclient",
	        "last_output",
	        "model",
	        "gem",
	    ]

	    def __init__(
	        self,
	        geminiclient: GeminiClient,
	        metadata: list[str | None] | None = None,
	        cid: str = "",  # chat id
	        rid: str = "",  # reply id
	        rcid: str = "",  # reply candidate id
	        model: Model | str | dict = Model.UNSPECIFIED,
	        gem: Gem | str | None = None,
	    ):
	        # Start from a private copy so the shared default list is never mutated.
	        self.__metadata: list[Any] = list(_DEFAULT_METADATA)
	        self.geminiclient: GeminiClient = geminiclient
	        self.last_output: ModelOutput | None = None
	        self.model: Model | str | dict = model
	        self.gem: Gem | str | None = gem

	        # Explicit ids are applied after `metadata`, so they take precedence.
	        if metadata:
	            self.metadata = metadata
	        if cid:
	            self.cid = cid
	        if rid:
	            self.rid = rid
	        if rcid:
	            self.rcid = rcid

	    def __str__(self):
	        return f"ChatSession(cid='{self.cid}', rid='{self.rid}', rcid='{self.rcid}')"

	    __repr__ = __str__

	    def __setattr__(self, name: str, value: Any) -> None:
	        super().__setattr__(name, value)
	        # update conversation history when last output is updated
	        if name == "last_output" and isinstance(value, ModelOutput):
	            self.metadata = value.metadata
	            self.rcid = value.rcid

	    async def send_message(
	        self,
	        prompt: str,
	        files: list[str | Path | bytes | io.BytesIO] | None = None,
	        temporary: bool = False,
	        **kwargs,
	    ) -> ModelOutput:
	        """
	        Generates contents with prompt.
	        Use as a shortcut for `GeminiClient.generate_content(prompt, files, self)`.

	        Parameters
	        ----------
	        prompt: `str`
	            Text prompt provided by user.
	        files: `list[str | Path | bytes | io.BytesIO]`, optional
	            List of file paths or byte streams to be attached.
	        temporary: `bool`, optional
	            If set to `True`, the ongoing conversation will not show up in Gemini history.
	            Switching temporary mode within a chat session will clear the previous context
	            and create a new chat session under the hood.
	        kwargs: `dict`, optional
	            Additional arguments which will be passed to the post request.
	            Refer to `curl_cffi.requests.AsyncSession.request` for more information.

	        Returns
	        -------
	        :class:`ModelOutput`
	            Output data from gemini.google.com.

	        Raises
	        ------
	        `AssertionError`
	            If prompt is empty.
	        `gemini_webapi.TimeoutError`
	            If request timed out.
	        `gemini_webapi.GeminiError`
	            If no reply candidate found in response.
	        `gemini_webapi.APIError`
	            - If request failed with status code other than 200.
	            - If response structure is invalid and failed to parse.
	        """

	        return await self.geminiclient.generate_content(
	            prompt=prompt,
	            files=files,
	            model=self.model,
	            gem=self.gem,
	            chat=self,
	            temporary=temporary,
	            **kwargs,
	        )

	    async def send_message_stream(
	        self,
	        prompt: str,
	        files: list[str | Path | bytes | io.BytesIO] | None = None,
	        temporary: bool = False,
	        **kwargs,
	    ) -> AsyncGenerator[ModelOutput, None]:
	        """
	        Generates contents with prompt in streaming mode within this chat session.

	        This is a shortcut for `GeminiClient.generate_content_stream(prompt, files, self)`.
	        The session's metadata and conversation history are automatically managed.

	        Parameters
	        ----------
	        prompt: `str`
	            Text prompt provided by user.
	        files: `list[str | Path | bytes | io.BytesIO]`, optional
	            List of file paths or byte streams to be attached.
	        temporary: `bool`, optional
	            If set to `True`, the ongoing conversation will not show up in Gemini history.
	            Switching temporary mode within a chat session will clear the previous context
	            and create a new chat session under the hood.
	        kwargs: `dict`, optional
	            Additional arguments passed to the streaming request.

	        Yields
	        ------
	        :class:`ModelOutput`
	            Partial output data containing text deltas.
	        """

	        async for output in self.geminiclient.generate_content_stream(
	            prompt=prompt,
	            files=files,
	            model=self.model,
	            gem=self.gem,
	            chat=self,
	            temporary=temporary,
	            **kwargs,
	        ):
	            yield output

	    def choose_candidate(self, index: int) -> ModelOutput:
	        """
	        Choose a candidate from the last `ModelOutput` to control the ongoing conversation flow.

	        Parameters
	        ----------
	        index: `int`
	            Index of the candidate to choose, starting from 0. The index must satisfy
	            `-len(candidates) <= index < len(candidates)`.

	        Returns
	        -------
	        :class:`ModelOutput`
	            Output data of the chosen candidate.

	        Raises
	        ------
	        `ValueError`
	            If no previous output data found in this chat session, or if index is outside
	            the range of candidates in last model output.
	        """

	        if not self.last_output:
	            raise ValueError("No previous output data found in this chat session.")

	        # Validate both bounds before touching `chosen`, so an out-of-range
	        # negative index cannot leave `last_output` pointing at a missing candidate.
	        candidate_count = len(self.last_output.candidates)
	        if not -candidate_count <= index < candidate_count:
	            raise ValueError(
	                f"Index {index} exceeds the number of candidates in last model output."
	            )

	        self.last_output.chosen = index
	        self.rcid = self.last_output.rcid
	        return self.last_output

	    async def read_history(self, limit: int = 10) -> ChatHistory | None:
	        """
	        Fetch the conversation history for this session.

	        Parameters
	        ----------
	        limit: `int`, optional
	            The maximum number of turns to fetch, by default 10.

	        Returns
	        -------
	        :class:`ChatHistory` | None
	            The conversation history, or None if reading failed or cid is missing.
	        """
	        if not self.cid:
	            return None
	        return await self.geminiclient.read_chat(self.cid, limit=limit)

	    @property
	    def metadata(self):
	        return self.__metadata

	    @metadata.setter
	    def metadata(self, value: list[str]):
	        # Anything that is not a list is ignored rather than rejected.
	        if not isinstance(value, list):
	            return

	        # Update only non-None elements to preserve existing CID/RID/RCID/Context;
	        # entries beyond the backing list's length are dropped.
	        slot_count = len(self.__metadata)
	        for i, val in enumerate(value):
	            if i < slot_count and val is not None:
	                self.__metadata[i] = val

	    @property
	    def cid(self):
	        return self.__metadata[0]

	    @cid.setter
	    def cid(self, value: str):
	        self.__metadata[0] = value

	    @property
	    def rcid(self):
	        return self.__metadata[2]

	    @rcid.setter
	    def rcid(self, value: str):
	        self.__metadata[2] = value

	    @property
	    def rid(self):
	        return self.__metadata[1]

	    @rid.setter
	    def rid(self, value: str):
	        self.__metadata[1] = value