ML_Hyper

Running

ML_Hyper / comfy_api_nodes /nodes_pika.py

DegMaTsu

Initial commit ComfyUI-Reactor-Video-Face-Swap-Hyperswap

359fa44 5 months ago

23.8 kB

	"""
	Pika x ComfyUI API Nodes

	Pika API docs: https://pika-827374fb.mintlify.app/api-reference
	"""
	from __future__ import annotations

	from io import BytesIO
	import logging
	from typing import Optional, TypeVar

	import torch

	from typing_extensions import override
	from comfy_api.latest import ComfyExtension, IO
	from comfy_api.input_impl.video_types import VideoCodec, VideoContainer, VideoInput
	from comfy_api_nodes.apis import pika_defs
	from comfy_api_nodes.apis.client import (
	ApiEndpoint,
	EmptyRequest,
	HttpMethod,
	PollingOperation,
	SynchronousOperation,
	)
	from comfy_api_nodes.util import validate_string, download_url_to_video_output, tensor_to_bytesio

	# Type variable used as the first type argument of SynchronousOperation in
	# execute_task's signature.
	R = TypeVar("R")

	# Version segment embedded in the versioned generation routes below.
	PIKA_API_VERSION = "2.2"
	_VERSIONED_GENERATE_PREFIX = f"/proxy/pika/generate/{PIKA_API_VERSION}"

	# Generation routes that carry the API version in their path.
	PATH_TEXT_TO_VIDEO = f"{_VERSIONED_GENERATE_PREFIX}/t2v"
	PATH_IMAGE_TO_VIDEO = f"{_VERSIONED_GENERATE_PREFIX}/i2v"
	PATH_PIKAFRAMES = f"{_VERSIONED_GENERATE_PREFIX}/pikaframes"
	PATH_PIKASCENES = f"{_VERSIONED_GENERATE_PREFIX}/pikascenes"

	# Generation routes without a version segment.
	PATH_PIKADDITIONS = "/proxy/pika/generate/pikadditions"
	PATH_PIKASWAPS = "/proxy/pika/generate/pikaswaps"
	PATH_PIKAFFECTS = "/proxy/pika/generate/pikaffects"

	# Route polled (with the video id appended) to follow a generation task.
	PATH_VIDEO_GET = "/proxy/pika/videos"


	async def execute_task(
	    initial_operation: SynchronousOperation[R, pika_defs.PikaGenerateResponse],
	    auth_kwargs: Optional[dict[str, str]] = None,
	    node_id: Optional[str] = None,
	) -> IO.NodeOutput:
	    """Submit a Pika generation request and wait for its video.

	    Executes ``initial_operation`` to obtain a video id, polls
	    ``PATH_VIDEO_GET/<video id>`` until the status is ``finished``
	    (``failed`` and ``cancelled`` are registered as failure statuses), and
	    then downloads the video from the URL of the final response.

	    Args:
	        initial_operation: Operation whose response exposes ``video_id``.
	        auth_kwargs: Passed through to the polling operation.
	        node_id: Passed through to the polling operation.

	    Returns:
	        An ``IO.NodeOutput`` built from the result of
	        ``download_url_to_video_output``.

	    Raises:
	        Exception: If the final polling response has no ``url``.
	    """
	    generation = await initial_operation.execute()
	    task_id = generation.video_id

	    def _status_of(response):
	        # A response without a status yields None rather than raising.
	        return response.status.value if response.status else None

	    status_endpoint = ApiEndpoint(
	        path=f"{PATH_VIDEO_GET}/{task_id}",
	        method=HttpMethod.GET,
	        request_model=EmptyRequest,
	        response_model=pika_defs.PikaVideoResponse,
	    )
	    poller = PollingOperation(
	        poll_endpoint=status_endpoint,
	        completed_statuses=["finished"],
	        failed_statuses=["failed", "cancelled"],
	        status_extractor=_status_of,
	        progress_extractor=lambda response: getattr(response, "progress", None),
	        result_url_extractor=lambda response: getattr(response, "url", None),
	        auth_kwargs=auth_kwargs,
	        node_id=node_id,
	        estimated_duration=60,
	        max_poll_attempts=240,
	    )
	    final_response: pika_defs.PikaVideoResponse = await poller.execute()

	    video_url = final_response.url
	    if not video_url:
	        error_msg = f"Pika task {task_id} succeeded but no video data found in response:\n{final_response}"
	        logging.error(error_msg)
	        raise Exception(error_msg)

	    logging.info("Pika task %s succeeded. Video URL: %s", task_id, video_url)
	    return IO.NodeOutput(await download_url_to_video_output(video_url))


	def get_base_inputs_types() -> list[IO.Input]:
	    """Build the prompt, seed, resolution and duration inputs shared by several Pika nodes.

	    A new list with newly constructed input objects is returned on each call,
	    in the order: prompt_text, negative_prompt, seed, resolution, duration.
	    """
	    prompt_input = IO.String.Input("prompt_text", multiline=True)
	    negative_prompt_input = IO.String.Input("negative_prompt", multiline=True)
	    seed_input = IO.Int.Input("seed", min=0, max=0xFFFFFFFF, control_after_generate=True)
	    resolution_input = IO.Combo.Input("resolution", options=["1080p", "720p"], default="1080p")
	    duration_input = IO.Combo.Input("duration", options=[5, 10], default=5)
	    return [
	        prompt_input,
	        negative_prompt_input,
	        seed_input,
	        resolution_input,
	        duration_input,
	    ]


	class PikaImageToVideo(IO.ComfyNode):
	    """Node that sends one image and a prompt to the Pika 2.2 image-to-video route."""

	    @classmethod
	    def define_schema(cls) -> IO.Schema:
	        """Declare the node: an image input followed by the shared base inputs."""
	        node_inputs = [
	            IO.Image.Input("image", tooltip="The image to convert to video"),
	            *get_base_inputs_types(),
	        ]
	        hidden_inputs = [
	            IO.Hidden.auth_token_comfy_org,
	            IO.Hidden.api_key_comfy_org,
	            IO.Hidden.unique_id,
	        ]
	        return IO.Schema(
	            node_id="PikaImageToVideoNode2_2",
	            display_name="Pika Image to Video",
	            description="Sends an image and prompt to the Pika API v2.2 to generate a video.",
	            category="api node/video/Pika",
	            inputs=node_inputs,
	            outputs=[IO.Video.Output()],
	            hidden=hidden_inputs,
	            is_api_node=True,
	        )

	    @classmethod
	    async def execute(
	        cls,
	        image: torch.Tensor,
	        prompt_text: str,
	        negative_prompt: str,
	        seed: int,
	        resolution: str,
	        duration: int,
	    ) -> IO.NodeOutput:
	        """Upload the image with the generation settings and return the finished video.

	        The image is posted as a multipart file named ``image.png``; the
	        remaining arguments populate the request model. The request is then
	        handed to ``execute_task``.
	        """
	        request_model = pika_defs.PikaBodyGenerate22I2vGenerate22I2vPost

	        upload = {"image": ("image.png", tensor_to_bytesio(image), "image/png")}
	        payload = request_model(
	            promptText=prompt_text,
	            negativePrompt=negative_prompt,
	            seed=seed,
	            resolution=resolution,
	            duration=duration,
	        )
	        auth = {
	            "auth_token": cls.hidden.auth_token_comfy_org,
	            "comfy_api_key": cls.hidden.api_key_comfy_org,
	        }
	        endpoint = ApiEndpoint(
	            path=PATH_IMAGE_TO_VIDEO,
	            method=HttpMethod.POST,
	            request_model=request_model,
	            response_model=pika_defs.PikaGenerateResponse,
	        )
	        submit = SynchronousOperation(
	            endpoint=endpoint,
	            request=payload,
	            files=upload,
	            content_type="multipart/form-data",
	            auth_kwargs=auth,
	        )
	        return await execute_task(submit, auth_kwargs=auth, node_id=cls.hidden.unique_id)


	class PikaTextToVideoNode(IO.ComfyNode):
	    """Node that sends a text prompt to the Pika 2.2 text-to-video route."""

	    @classmethod
	    def define_schema(cls) -> IO.Schema:
	        """Declare the node: the shared base inputs plus an aspect-ratio float."""
	        aspect_ratio_input = IO.Float.Input(
	            "aspect_ratio",
	            step=0.001,
	            min=0.4,
	            max=2.5,
	            default=1.7777777777777777,
	            tooltip="Aspect ratio (width / height)",
	        )
	        hidden_inputs = [
	            IO.Hidden.auth_token_comfy_org,
	            IO.Hidden.api_key_comfy_org,
	            IO.Hidden.unique_id,
	        ]
	        return IO.Schema(
	            node_id="PikaTextToVideoNode2_2",
	            display_name="Pika Text to Video",
	            description="Sends a text prompt to the Pika API v2.2 to generate a video.",
	            category="api node/video/Pika",
	            inputs=[*get_base_inputs_types(), aspect_ratio_input],
	            outputs=[IO.Video.Output()],
	            hidden=hidden_inputs,
	            is_api_node=True,
	        )

	    @classmethod
	    async def execute(
	        cls,
	        prompt_text: str,
	        negative_prompt: str,
	        seed: int,
	        resolution: str,
	        duration: int,
	        aspect_ratio: float,
	    ) -> IO.NodeOutput:
	        """Post the prompt and settings as a URL-encoded form and return the finished video.

	        No files are attached; the request is handed to ``execute_task``.
	        """
	        request_model = pika_defs.PikaBodyGenerate22T2vGenerate22T2vPost

	        auth = {
	            "auth_token": cls.hidden.auth_token_comfy_org,
	            "comfy_api_key": cls.hidden.api_key_comfy_org,
	        }
	        endpoint = ApiEndpoint(
	            path=PATH_TEXT_TO_VIDEO,
	            method=HttpMethod.POST,
	            request_model=request_model,
	            response_model=pika_defs.PikaGenerateResponse,
	        )
	        payload = request_model(
	            promptText=prompt_text,
	            negativePrompt=negative_prompt,
	            seed=seed,
	            resolution=resolution,
	            duration=duration,
	            aspectRatio=aspect_ratio,
	        )
	        submit = SynchronousOperation(
	            endpoint=endpoint,
	            request=payload,
	            auth_kwargs=auth,
	            content_type="application/x-www-form-urlencoded",
	        )
	        return await execute_task(submit, auth_kwargs=auth, node_id=cls.hidden.unique_id)


	class PikaScenes(IO.ComfyNode):
	    """Node that sends up to five ingredient images to the Pika 2.2 pikascenes route."""

	    @classmethod
	    def define_schema(cls) -> IO.Schema:
	        """Declare the node: base inputs, ingredients mode, aspect ratio, five optional images."""
	        ingredients_mode_input = IO.Combo.Input(
	            "ingredients_mode",
	            options=["creative", "precise"],
	            default="creative",
	        )
	        aspect_ratio_input = IO.Float.Input(
	            "aspect_ratio",
	            step=0.001,
	            min=0.4,
	            max=2.5,
	            default=1.7777777777777777,
	            tooltip="Aspect ratio (width / height)",
	        )
	        # Five identically configured optional image slots, numbered 1 to 5.
	        ingredient_inputs = [
	            IO.Image.Input(
	                f"image_ingredient_{slot}",
	                optional=True,
	                tooltip="Image that will be used as ingredient to create a video.",
	            )
	            for slot in range(1, 6)
	        ]
	        hidden_inputs = [
	            IO.Hidden.auth_token_comfy_org,
	            IO.Hidden.api_key_comfy_org,
	            IO.Hidden.unique_id,
	        ]
	        return IO.Schema(
	            node_id="PikaScenesV2_2",
	            display_name="Pika Scenes (Video Image Composition)",
	            description="Combine your images to create a video with the objects in them. Upload multiple images as ingredients and generate a high-quality video that incorporates all of them.",
	            category="api node/video/Pika",
	            inputs=[
	                *get_base_inputs_types(),
	                ingredients_mode_input,
	                aspect_ratio_input,
	                *ingredient_inputs,
	            ],
	            outputs=[IO.Video.Output()],
	            hidden=hidden_inputs,
	            is_api_node=True,
	        )

	    @classmethod
	    async def execute(
	        cls,
	        prompt_text: str,
	        negative_prompt: str,
	        seed: int,
	        resolution: str,
	        duration: int,
	        ingredients_mode: str,
	        aspect_ratio: float,
	        image_ingredient_1: Optional[torch.Tensor] = None,
	        image_ingredient_2: Optional[torch.Tensor] = None,
	        image_ingredient_3: Optional[torch.Tensor] = None,
	        image_ingredient_4: Optional[torch.Tensor] = None,
	        image_ingredient_5: Optional[torch.Tensor] = None,
	    ) -> IO.NodeOutput:
	        """Upload the supplied ingredient images with the settings and return the finished video.

	        Ingredients left as ``None`` are skipped. The remaining ones are sent
	        under the repeated multipart field ``images`` with file names
	        ``image_0.png``, ``image_1.png``, ... numbered in the order they were
	        kept. The request is then handed to ``execute_task``.
	        """
	        request_model = pika_defs.PikaBodyGenerate22C2vGenerate22PikascenesPost

	        candidates = (
	            image_ingredient_1,
	            image_ingredient_2,
	            image_ingredient_3,
	            image_ingredient_4,
	            image_ingredient_5,
	        )
	        encoded_images = [
	            tensor_to_bytesio(candidate) for candidate in candidates if candidate is not None
	        ]
	        uploads = [
	            ("images", (f"image_{index}.png", encoded, "image/png"))
	            for index, encoded in enumerate(encoded_images)
	        ]

	        payload = request_model(
	            ingredientsMode=ingredients_mode,
	            promptText=prompt_text,
	            negativePrompt=negative_prompt,
	            seed=seed,
	            resolution=resolution,
	            duration=duration,
	            aspectRatio=aspect_ratio,
	        )
	        auth = {
	            "auth_token": cls.hidden.auth_token_comfy_org,
	            "comfy_api_key": cls.hidden.api_key_comfy_org,
	        }
	        endpoint = ApiEndpoint(
	            path=PATH_PIKASCENES,
	            method=HttpMethod.POST,
	            request_model=request_model,
	            response_model=pika_defs.PikaGenerateResponse,
	        )
	        submit = SynchronousOperation(
	            endpoint=endpoint,
	            request=payload,
	            files=uploads,
	            content_type="multipart/form-data",
	            auth_kwargs=auth,
	        )
	        return await execute_task(submit, auth_kwargs=auth, node_id=cls.hidden.unique_id)


	class PikAdditionsNode(IO.ComfyNode):
	    """Node that sends a video and an image to the Pika pikadditions route."""

	    @classmethod
	    def define_schema(cls) -> IO.Schema:
	        """Declare the node: video, image, prompt, negative prompt and seed inputs."""
	        seed_input = IO.Int.Input(
	            "seed",
	            min=0,
	            max=0xFFFFFFFF,
	            control_after_generate=True,
	        )
	        node_inputs = [
	            IO.Video.Input("video", tooltip="The video to add an image to."),
	            IO.Image.Input("image", tooltip="The image to add to the video."),
	            IO.String.Input("prompt_text", multiline=True),
	            IO.String.Input("negative_prompt", multiline=True),
	            seed_input,
	        ]
	        hidden_inputs = [
	            IO.Hidden.auth_token_comfy_org,
	            IO.Hidden.api_key_comfy_org,
	            IO.Hidden.unique_id,
	        ]
	        return IO.Schema(
	            node_id="Pikadditions",
	            display_name="Pikadditions (Video Object Insertion)",
	            description="Add any object or image into your video. Upload a video and specify what you'd like to add to create a seamlessly integrated result.",
	            category="api node/video/Pika",
	            inputs=node_inputs,
	            outputs=[IO.Video.Output()],
	            hidden=hidden_inputs,
	            is_api_node=True,
	        )

	    @classmethod
	    async def execute(
	        cls,
	        video: VideoInput,
	        image: torch.Tensor,
	        prompt_text: str,
	        negative_prompt: str,
	        seed: int,
	    ) -> IO.NodeOutput:
	        """Upload the video and image with the prompt settings and return the finished video.

	        The video is saved into an in-memory buffer as H.264 in an MP4
	        container and posted as ``video.mp4``; the image is posted as
	        ``image.png``. The request is then handed to ``execute_task``.
	        """
	        request_model = pika_defs.PikaBodyGeneratePikadditionsGeneratePikadditionsPost

	        video_buffer = BytesIO()
	        video.save_to(video_buffer, format=VideoContainer.MP4, codec=VideoCodec.H264)
	        # Rewind so the upload reads the buffer from its beginning.
	        video_buffer.seek(0)
	        image_buffer = tensor_to_bytesio(image)

	        uploads = {
	            "video": ("video.mp4", video_buffer, "video/mp4"),
	            "image": ("image.png", image_buffer, "image/png"),
	        }
	        payload = request_model(
	            promptText=prompt_text,
	            negativePrompt=negative_prompt,
	            seed=seed,
	        )
	        auth = {
	            "auth_token": cls.hidden.auth_token_comfy_org,
	            "comfy_api_key": cls.hidden.api_key_comfy_org,
	        }
	        endpoint = ApiEndpoint(
	            path=PATH_PIKADDITIONS,
	            method=HttpMethod.POST,
	            request_model=request_model,
	            response_model=pika_defs.PikaGenerateResponse,
	        )
	        submit = SynchronousOperation(
	            endpoint=endpoint,
	            request=payload,
	            files=uploads,
	            content_type="multipart/form-data",
	            auth_kwargs=auth,
	        )
	        return await execute_task(submit, auth_kwargs=auth, node_id=cls.hidden.unique_id)


	class PikaSwapsNode(IO.ComfyNode):
	    """Node that sends a video, with optional image and mask, to the Pika pikaswaps route."""

	    @classmethod
	    def define_schema(cls) -> IO.Schema:
	        """Declare the node: a required video plus optional image, mask, prompts, seed and region."""
	        image_input = IO.Image.Input(
	            "image",
	            tooltip="The image used to replace the masked object in the video.",
	            optional=True,
	        )
	        mask_input = IO.Mask.Input(
	            "mask",
	            tooltip="Use the mask to define areas in the video to replace.",
	            optional=True,
	        )
	        region_input = IO.String.Input(
	            "region_to_modify",
	            multiline=True,
	            optional=True,
	            tooltip="Plaintext description of the object / region to modify.",
	        )
	        node_inputs = [
	            IO.Video.Input("video", tooltip="The video to swap an object in."),
	            image_input,
	            mask_input,
	            IO.String.Input("prompt_text", multiline=True, optional=True),
	            IO.String.Input("negative_prompt", multiline=True, optional=True),
	            IO.Int.Input("seed", min=0, max=0xFFFFFFFF, control_after_generate=True, optional=True),
	            region_input,
	        ]
	        hidden_inputs = [
	            IO.Hidden.auth_token_comfy_org,
	            IO.Hidden.api_key_comfy_org,
	            IO.Hidden.unique_id,
	        ]
	        return IO.Schema(
	            node_id="Pikaswaps",
	            display_name="Pika Swaps (Video Object Replacement)",
	            description="Swap out any object or region of your video with a new image or object. Define areas to replace either with a mask or coordinates.",
	            category="api node/video/Pika",
	            inputs=node_inputs,
	            outputs=[IO.Video.Output()],
	            hidden=hidden_inputs,
	            is_api_node=True,
	        )

	    @classmethod
	    async def execute(
	        cls,
	        video: VideoInput,
	        image: Optional[torch.Tensor] = None,
	        mask: Optional[torch.Tensor] = None,
	        prompt_text: str = "",
	        negative_prompt: str = "",
	        seed: int = 0,
	        region_to_modify: str = "",
	    ) -> IO.NodeOutput:
	        """Upload the video and any optional attachments, then return the finished video.

	        The video is saved into an in-memory buffer as H.264 in an MP4
	        container and posted as ``video.mp4``. When given, the mask is posted
	        under ``modifyRegionMask`` and the image under ``image``. An empty
	        ``region_to_modify`` is sent as ``None``. The request is then handed
	        to ``execute_task``.
	        """
	        request_model = pika_defs.PikaBodyGeneratePikaswapsGeneratePikaswapsPost

	        video_buffer = BytesIO()
	        video.save_to(video_buffer, format=VideoContainer.MP4, codec=VideoCodec.H264)
	        # Rewind so the upload reads the buffer from its beginning.
	        video_buffer.seek(0)

	        uploads = {"video": ("video.mp4", video_buffer, "video/mp4")}
	        if mask is not None:
	            uploads["modifyRegionMask"] = ("mask.png", tensor_to_bytesio(mask), "image/png")
	        if image is not None:
	            uploads["image"] = ("image.png", tensor_to_bytesio(image), "image/png")

	        payload = request_model(
	            promptText=prompt_text,
	            negativePrompt=negative_prompt,
	            seed=seed,
	            modifyRegionRoi=region_to_modify or None,
	        )
	        auth = {
	            "auth_token": cls.hidden.auth_token_comfy_org,
	            "comfy_api_key": cls.hidden.api_key_comfy_org,
	        }
	        endpoint = ApiEndpoint(
	            path=PATH_PIKASWAPS,
	            method=HttpMethod.POST,
	            request_model=request_model,
	            response_model=pika_defs.PikaGenerateResponse,
	        )
	        submit = SynchronousOperation(
	            endpoint=endpoint,
	            request=payload,
	            files=uploads,
	            content_type="multipart/form-data",
	            auth_kwargs=auth,
	        )
	        return await execute_task(submit, auth_kwargs=auth, node_id=cls.hidden.unique_id)


	class PikaffectsNode(IO.ComfyNode):
	    """Node that sends an image and a chosen Pikaffect to the Pika pikaffects route."""

	    @classmethod
	    def define_schema(cls) -> IO.Schema:
	        """Declare the node: image, Pikaffect choice, prompt, negative prompt and seed inputs."""
	        effect_input = IO.Combo.Input(
	            "pikaffect", options=pika_defs.Pikaffect, default="Cake-ify"
	        )
	        node_inputs = [
	            IO.Image.Input("image", tooltip="The reference image to apply the Pikaffect to."),
	            effect_input,
	            IO.String.Input("prompt_text", multiline=True),
	            IO.String.Input("negative_prompt", multiline=True),
	            IO.Int.Input("seed", min=0, max=0xFFFFFFFF, control_after_generate=True),
	        ]
	        hidden_inputs = [
	            IO.Hidden.auth_token_comfy_org,
	            IO.Hidden.api_key_comfy_org,
	            IO.Hidden.unique_id,
	        ]
	        return IO.Schema(
	            node_id="Pikaffects",
	            display_name="Pikaffects (Video Effects)",
	            description="Generate a video with a specific Pikaffect. Supported Pikaffects: Cake-ify, Crumble, Crush, Decapitate, Deflate, Dissolve, Explode, Eye-pop, Inflate, Levitate, Melt, Peel, Poke, Squish, Ta-da, Tear",
	            category="api node/video/Pika",
	            inputs=node_inputs,
	            outputs=[IO.Video.Output()],
	            hidden=hidden_inputs,
	            is_api_node=True,
	        )

	    @classmethod
	    async def execute(
	        cls,
	        image: torch.Tensor,
	        pikaffect: str,
	        prompt_text: str,
	        negative_prompt: str,
	        seed: int,
	    ) -> IO.NodeOutput:
	        """Upload the image with the effect and prompt settings and return the finished video.

	        The image is posted as a multipart file named ``image.png``. The
	        request is then handed to ``execute_task``.
	        """
	        request_model = pika_defs.PikaBodyGeneratePikaffectsGeneratePikaffectsPost

	        auth = {
	            "auth_token": cls.hidden.auth_token_comfy_org,
	            "comfy_api_key": cls.hidden.api_key_comfy_org,
	        }
	        endpoint = ApiEndpoint(
	            path=PATH_PIKAFFECTS,
	            method=HttpMethod.POST,
	            request_model=request_model,
	            response_model=pika_defs.PikaGenerateResponse,
	        )
	        payload = request_model(
	            pikaffect=pikaffect,
	            promptText=prompt_text,
	            negativePrompt=negative_prompt,
	            seed=seed,
	        )
	        upload = {"image": ("image.png", tensor_to_bytesio(image), "image/png")}
	        submit = SynchronousOperation(
	            endpoint=endpoint,
	            request=payload,
	            files=upload,
	            content_type="multipart/form-data",
	            auth_kwargs=auth,
	        )
	        return await execute_task(submit, auth_kwargs=auth, node_id=cls.hidden.unique_id)


	class PikaStartEndFrameNode(IO.ComfyNode):
	    """Node that sends a start and an end image to the Pika 2.2 pikaframes route."""

	    @classmethod
	    def define_schema(cls) -> IO.Schema:
	        """Declare the node: start image, end image, then the shared base inputs."""
	        node_inputs = [
	            IO.Image.Input("image_start", tooltip="The first image to combine."),
	            IO.Image.Input("image_end", tooltip="The last image to combine."),
	            *get_base_inputs_types(),
	        ]
	        hidden_inputs = [
	            IO.Hidden.auth_token_comfy_org,
	            IO.Hidden.api_key_comfy_org,
	            IO.Hidden.unique_id,
	        ]
	        return IO.Schema(
	            node_id="PikaStartEndFrameNode2_2",
	            display_name="Pika Start and End Frame to Video",
	            description="Generate a video by combining your first and last frame. Upload two images to define the start and end points, and let the AI create a smooth transition between them.",
	            category="api node/video/Pika",
	            inputs=node_inputs,
	            outputs=[IO.Video.Output()],
	            hidden=hidden_inputs,
	            is_api_node=True,
	        )

	    @classmethod
	    async def execute(
	        cls,
	        image_start: torch.Tensor,
	        image_end: torch.Tensor,
	        prompt_text: str,
	        negative_prompt: str,
	        seed: int,
	        resolution: str,
	        duration: int,
	    ) -> IO.NodeOutput:
	        """Upload both key frames with the settings and return the finished video.

	        ``prompt_text`` is checked first with ``validate_string`` using
	        ``min_length=1``. Both images are posted under the repeated multipart
	        field ``keyFrames``, start frame first. The request is then handed to
	        ``execute_task``.
	        """
	        validate_string(prompt_text, field_name="prompt_text", min_length=1)

	        request_model = pika_defs.PikaBodyGenerate22KeyframeGenerate22PikaframesPost

	        start_frame = ("image_start.png", tensor_to_bytesio(image_start), "image/png")
	        end_frame = ("image_end.png", tensor_to_bytesio(image_end), "image/png")
	        key_frames = [("keyFrames", start_frame), ("keyFrames", end_frame)]

	        auth = {
	            "auth_token": cls.hidden.auth_token_comfy_org,
	            "comfy_api_key": cls.hidden.api_key_comfy_org,
	        }
	        endpoint = ApiEndpoint(
	            path=PATH_PIKAFRAMES,
	            method=HttpMethod.POST,
	            request_model=request_model,
	            response_model=pika_defs.PikaGenerateResponse,
	        )
	        payload = request_model(
	            promptText=prompt_text,
	            negativePrompt=negative_prompt,
	            seed=seed,
	            resolution=resolution,
	            duration=duration,
	        )
	        submit = SynchronousOperation(
	            endpoint=endpoint,
	            request=payload,
	            files=key_frames,
	            content_type="multipart/form-data",
	            auth_kwargs=auth,
	        )
	        return await execute_task(submit, auth_kwargs=auth, node_id=cls.hidden.unique_id)


	class PikaApiNodesExtension(ComfyExtension):
	    """Extension that exposes the Pika node classes defined in this module."""

	    @override
	    async def get_node_list(self) -> list[type[IO.ComfyNode]]:
	        """Return the seven Pika node classes, in their declaration order."""
	        pika_nodes: list[type[IO.ComfyNode]] = [
	            PikaImageToVideo,
	            PikaTextToVideoNode,
	            PikaScenes,
	            PikAdditionsNode,
	            PikaSwapsNode,
	            PikaffectsNode,
	            PikaStartEndFrameNode,
	        ]
	        return pika_nodes


	async def comfy_entrypoint() -> PikaApiNodesExtension:
	    """Create and return a new ``PikaApiNodesExtension`` instance."""
	    extension = PikaApiNodesExtension()
	    return extension