mirror of
https://github.com/comfyanonymous/ComfyUI.git
synced 2025-06-07 20:12:57 +08:00

* Add Ideogram generate node. * Add staging api. * Add API_NODE and common error for missing auth token (#5) * Add Minimax Video Generation + Async Task queue polling example (#6) * [Minimax] Show video preview and embed workflow in ouput (#7) * Remove uv.lock * Remove polling operations. * Revert "Remove polling operations." * Update stubs. * Added Ideogram and Minimax back in. * Added initial BFL Flux 1.1 [pro] Ultra node (#11) * Add --comfy-api-base launch arg (#13) * Add instructions for staging development. (#14) * remove validation to make it easier to run against LAN copies of the API * Manually add BFL polling status response schema (#15) * Add function for uploading files. (#18) * Add Luma nodes (#16) * Refactor util functions (#20) * Add VIDEO type (#21) * Add rest of Luma node functionality (#19) * Fix image_luma_ref not working (#28) * [Bug] Remove duplicated option T2V-01 in MinimaxTextToVideoNode (#31) * Add utils to map from pydantic model fields to comfy node inputs (#30) * add veo2, bump av req (#32) * Add Recraft nodes (#29) * Add Kling Nodes (#12) * Add Camera Concepts (luma_concepts) to Luma Video nodes (#33) * Add Runway nodes (#17) * Convert Minimax node to use VIDEO output type (#34) * Standard `CATEGORY` system for api nodes (#35) * Set `Content-Type` header when uploading files (#36) * add better error propagation to veo2 (#37) * Add Realistic Image and Logo Raster styles for Recraft v3 (#38) * Fix runway image upload and progress polling (#39) * Fix image upload for Luma: only include `Content-Type` header field if it's set explicitly (#40) * Moved Luma nodes to nodes_luma.py (#47) * Moved Recraft nodes to nodes_recraft.py (#48) * Add Pixverse nodes (#46) * Move and fix BFL nodes to node_bfl.py (#49) * Move and edit Minimax node to nodes_minimax.py (#50) * Add Minimax Image to Video node + Cleanup (#51) * Add Recraft Text to Vector node, add Save SVG node to handle its output (#53) * Added pixverse_template support to Pixverse Text to 
Video node (#54) * Added Recraft Controls + Recraft Color RGB nodes (#57) * split remaining nodes out of nodes_api, make utility lib, refactor ideogram (#61) * Add types and doctstrings to utils file (#64) * Fix: `PollingOperation` progress bar update progress by absolute value (#65) * Use common download function in kling nodes module (#67) * Fix: Luma video nodes in `api nodes/image` category (#68) * Set request type explicitly (#66) * Add `control_after_generate` to all seed inputs (#69) * Fix bug: deleting `Content-Type` when property does not exist (#73) * Add preview to Save SVG node (#74) * change default poll interval (#76), rework veo2 * Add Pixverse and updated Kling types (#75) * Added Pixverse Image to VIdeo node (#77) * Add Pixverse Transition Video node (#79) * Proper ray-1-6 support as fix has been applied in backend (#80) * Added Recraft Style - Infinite Style Library node (#82) * add ideogram v3 (#83) * [Kling] Split Camera Control config to its own node (#81) * Add Pika i2v and t2v nodes (#52) * Temporary Fix for Runway (#87) * Added Stability Stable Image Ultra node (#86) * Remove Runway nodes (#88) * Fix: Prompt text can't be validated in Kling nodes when using primitive nodes (#90) * Fix: typo in node name "Stabiliy" => "Stability" (#91) * Add String (Multiline) node (#93) * Update Pika Duration and Resolution options (#94) * Change base branch to master. Not main. 
(#95) * Fix UploadRequest file_name param (#98) * Removed Infinite Style Library until later (#99) * fix ideogram style types (#100) * fix multi image return (#101) * add metadata saving to SVG (#102) * Bump templates version to include API node template workflows (#104) * Fix: `download_url_to_video_output` return type (#103) * fix 4o generation bug (#106) * Serve SVG files directly (#107) * Add a bunch of nodes, 3 ready to use, the rest waiting for endpoint support (#108) * Revert "Serve SVG files directly" (#111) * Expose 4 remaining Recraft nodes (#112) * [Kling] Add `Duration` and `Video ID` outputs (#105) * Fix: datamodel-codegen sets string#binary type to non-existent `bytes_aliased` variable (#114) * Fix: Dall-e 2 not setting request content-type dynamically (#113) * Default request timeout: one hour. (#116) * Add Kling nodes: camera control, start-end frame, lip-sync, video extend (#115) * Add 8 nodes - 4 BFL, 4 Stability (#117) * Fix error for Recraft ImageToImage error for nonexistent random_seed param (#118) * Add remaining Pika nodes (#119) * Make controls input work for Recraft Image to Image node (#120) * Use upstream PR: Support saving Comfy VIDEO type to buffer (#123) * Use Upstream PR: "Fix: Error creating video when sliced audio tensor chunks are non-c-contiguous" (#127) * Improve audio upload utils (#128) * Fix: Nested `AnyUrl` in request model cannot be serialized (Kling, Runway) (#129) * Show errors and API output URLs to the user (change log levels) (#131) * Fix: Luma I2I fails when weight is <=0.01 (#132) * Change category of `LumaConcepts` node from image to video (#133) * Fix: `image.shape` accessed before `image` is null-checked (#134) * Apply small fixes and most prompt validation (if needed to avoid API error) (#135) * Node name/category modifications (#140) * Add back Recraft Style - Infinite Style Library node (#141) * Fixed Kling: Check attributes of pydantic types. 
(#144) * Bump `comfyui-workflow-templates` version (#142) * [Kling] Print response data when error validating response (#146) * Fix: error validating Kling image response, trying to use `"key" in` on Pydantic class instance (#147) * [Kling] Fix: Correct/verify supported subset of input combos in Kling nodes (#149) * [Kling] Fix typo in node description (#150) * [Kling] Fix: CFG min/max not being enforced (#151) * Rebase launch-rebase (private) on prep-branch (public copy of master) (#153) * Bump templates version (#154) * Fix: Kling image gen nodes don't return entire batch when `n` > 1 (#152) * Remove pixverse_template from PixVerse Transition Video node (#155) * Invert image_weight value on Luma Image to Image node (#156) * Invert and resize mask for Ideogram V3 node to match masking conventions (#158) * [Kling] Fix: image generation nodes not returning Tuple (#159) * [Bug] [Kling] Fix Kling camera control (#161) * Kling Image Gen v2 + improve node descriptions for Flux/OpenAI (#160) * [Kling] Don't return video_id from dual effect video (#162) * Bump frontend to 1.18.8 (#163) * Use 3.9 compat syntax (#164) * Use Python 3.10 * add example env var * Update templates to 0.1.11 * Bump frontend to 1.18.9 --------- Co-authored-by: Robin Huang <robin.j.huang@gmail.com> Co-authored-by: Christian Byrne <cbyrne@comfy.org> Co-authored-by: thot experiment <94414189+thot-experiment@users.noreply.github.com>
284 lines
9.7 KiB
Python
284 lines
9.7 KiB
Python
import io
|
|
import logging
|
|
import base64
|
|
import requests
|
|
import torch
|
|
|
|
from comfy.comfy_types.node_typing import IO, ComfyNodeABC
|
|
from comfy_api.input_impl.video_types import VideoFromFile
|
|
from comfy_api_nodes.apis import (
|
|
Veo2GenVidRequest,
|
|
Veo2GenVidResponse,
|
|
Veo2GenVidPollRequest,
|
|
Veo2GenVidPollResponse
|
|
)
|
|
from comfy_api_nodes.apis.client import (
|
|
ApiEndpoint,
|
|
HttpMethod,
|
|
SynchronousOperation,
|
|
PollingOperation,
|
|
)
|
|
|
|
from comfy_api_nodes.apinode_utils import (
|
|
downscale_image_tensor,
|
|
tensor_to_base64_string
|
|
)
|
|
|
|
def convert_image_to_base64(image: torch.Tensor):
    """Encode an image tensor as a base64 string.

    The tensor is first passed through ``downscale_image_tensor`` with a
    ``total_pixels`` budget of 2048*2048, and the result is handed to
    ``tensor_to_base64_string``.

    Args:
        image: Image tensor to encode, or ``None``.

    Returns:
        Whatever ``tensor_to_base64_string`` produces for the downscaled
        tensor, or ``None`` when ``image`` is ``None``.
    """
    if image is not None:
        pixel_budget = 2048 * 2048
        return tensor_to_base64_string(
            downscale_image_tensor(image, total_pixels=pixel_budget)
        )
    return None
|
|
|
|
class VeoVideoGenerationNode(ComfyNodeABC):
    """
    Generates videos from text prompts using Google's Veo API.

    This node can create videos from text descriptions and optional image inputs,
    with control over parameters like aspect ratio, duration, and more.

    ``generate_video`` submits the request to ``/proxy/veo/generate``, polls
    ``/proxy/veo/poll`` until the operation reports ``done``, validates the
    final response and returns the first video as a ``VideoFromFile``.
    """

    # (connect, read) timeout in seconds for downloading a video by URL.
    # NOTE(review): values are a conservative choice, not an API requirement;
    # the read timeout bounds inactivity between chunks, not the whole transfer.
    _DOWNLOAD_TIMEOUT = (10.0, 300.0)

    @classmethod
    def INPUT_TYPES(s):
        """Declare the required, optional and hidden inputs of the node."""
        return {
            "required": {
                "prompt": (
                    IO.STRING,
                    {
                        "multiline": True,
                        "default": "",
                        "tooltip": "Text description of the video",
                    },
                ),
                "aspect_ratio": (
                    IO.COMBO,
                    {
                        "options": ["16:9", "9:16"],
                        "default": "16:9",
                        "tooltip": "Aspect ratio of the output video",
                    },
                ),
            },
            "optional": {
                "negative_prompt": (
                    IO.STRING,
                    {
                        "multiline": True,
                        "default": "",
                        "tooltip": "Negative text prompt to guide what to avoid in the video",
                    },
                ),
                "duration_seconds": (
                    IO.INT,
                    {
                        "default": 5,
                        "min": 5,
                        "max": 8,
                        "step": 1,
                        "display": "number",
                        "tooltip": "Duration of the output video in seconds",
                    },
                ),
                "enhance_prompt": (
                    IO.BOOLEAN,
                    {
                        "default": True,
                        "tooltip": "Whether to enhance the prompt with AI assistance",
                    },
                ),
                "person_generation": (
                    IO.COMBO,
                    {
                        "options": ["ALLOW", "BLOCK"],
                        "default": "ALLOW",
                        "tooltip": "Whether to allow generating people in the video",
                    },
                ),
                "seed": (
                    IO.INT,
                    {
                        "default": 0,
                        "min": 0,
                        "max": 0xFFFFFFFF,
                        "step": 1,
                        "display": "number",
                        "control_after_generate": True,
                        "tooltip": "Seed for video generation (0 for random)",
                    },
                ),
                "image": (IO.IMAGE, {
                    "default": None,
                    "tooltip": "Optional reference image to guide video generation",
                }),
            },
            "hidden": {
                "auth_token": "AUTH_TOKEN_COMFY_ORG",
            },
        }

    RETURN_TYPES = (IO.VIDEO,)
    FUNCTION = "generate_video"
    CATEGORY = "api node/video/Veo"
    DESCRIPTION = "Generates videos from text prompts using Google's Veo API"
    API_NODE = True

    def generate_video(
        self,
        prompt,
        aspect_ratio="16:9",
        negative_prompt="",
        duration_seconds=5,
        enhance_prompt=True,
        person_generation="ALLOW",
        seed=0,
        image=None,
        auth_token=None,
    ):
        """Start a Veo generation, wait for it to finish and return the video.

        Args:
            prompt: Text description of the video.
            aspect_ratio: Sent as the ``aspectRatio`` parameter.
            negative_prompt: Sent as ``negativePrompt`` only when non-empty.
            duration_seconds: Sent as the ``durationSeconds`` parameter.
            enhance_prompt: Sent as the ``enhancePrompt`` parameter.
            person_generation: Sent as the ``personGeneration`` parameter.
            seed: Sent as ``seed`` only when greater than 0.
            image: Optional image tensor; when given it is attached to the
                request as base64 with MIME type ``image/png``.
            auth_token: Token forwarded to both API operations.

        Returns:
            A one-element tuple holding a ``VideoFromFile`` built from the
            bytes of the first returned video.

        Raises:
            Exception: If the poll response carries an error, content was
                filtered, or no usable video data was returned.
            requests.RequestException: If the video has to be downloaded by
                URL and the download fails, times out or returns an HTTP
                error status.
        """
        # Prepare the single instance for the request
        instance = {"prompt": prompt}

        # Add image if provided
        if image is not None:
            image_base64 = convert_image_to_base64(image)
            if image_base64:
                instance["image"] = {
                    "bytesBase64Encoded": image_base64,
                    "mimeType": "image/png",
                }

        # Create parameters dictionary
        parameters = {
            "aspectRatio": aspect_ratio,
            "personGeneration": person_generation,
            "durationSeconds": duration_seconds,
            "enhancePrompt": enhance_prompt,
        }

        # Add optional parameters if provided
        if negative_prompt:
            parameters["negativePrompt"] = negative_prompt
        if seed > 0:
            parameters["seed"] = seed

        # Initial request to start video generation
        initial_operation = SynchronousOperation(
            endpoint=ApiEndpoint(
                path="/proxy/veo/generate",
                method=HttpMethod.POST,
                request_model=Veo2GenVidRequest,
                response_model=Veo2GenVidResponse,
            ),
            request=Veo2GenVidRequest(
                instances=[instance],
                parameters=parameters,
            ),
            auth_token=auth_token,
        )

        initial_response = initial_operation.execute()
        operation_name = initial_response.name

        logging.info(f"Veo generation started with operation name: {operation_name}")

        def status_extractor(response):
            # Only report "completed" once the operation is done, regardless of
            # success or failure; errors are checked after polling completes.
            return "completed" if response.done else "pending"

        def progress_extractor(response):
            # Could be enhanced if the API provides progress information
            return None

        # Define the polling operation
        poll_operation = PollingOperation(
            poll_endpoint=ApiEndpoint(
                path="/proxy/veo/poll",
                method=HttpMethod.POST,
                request_model=Veo2GenVidPollRequest,
                response_model=Veo2GenVidPollResponse,
            ),
            completed_statuses=["completed"],
            failed_statuses=[],  # No failed statuses, we'll handle errors after polling
            status_extractor=status_extractor,
            progress_extractor=progress_extractor,
            request=Veo2GenVidPollRequest(
                operationName=operation_name
            ),
            auth_token=auth_token,
            poll_interval=5.0,
        )

        # Execute the polling operation
        poll_response = poll_operation.execute()

        # Now check for errors in the final response, then pull out the video
        self._raise_on_failure(poll_response)
        video_data = self._extract_video_bytes(poll_response)

        if not video_data:
            raise Exception("No video data was returned")

        logging.info("Video generation completed successfully")

        # Wrap the raw bytes in a file-like object for VideoFromFile
        return (VideoFromFile(io.BytesIO(video_data)),)

    def _raise_on_failure(self, poll_response):
        """Raise if the finished poll response reports an error or filtered content."""
        error = getattr(poll_response, "error", None)
        if error:
            error_message = f"Veo API error: {error.message} (code: {error.code})"
            logging.error(error_message)
            raise Exception(error_message)

        # Check for RAI filtered content. The count attribute can exist but be
        # None (unset optional field), so normalise to 0 before comparing;
        # comparing None > 0 would raise TypeError.
        result = getattr(poll_response, "response", None)
        filtered_count = getattr(result, "raiMediaFilteredCount", None) or 0
        if filtered_count > 0:
            # Extract reason message if available
            reasons = getattr(result, "raiMediaFilteredReasons", None)
            if reasons:
                reason = reasons[0]
                error_message = f"Content filtered by Google's Responsible AI practices: {reason} ({filtered_count} videos filtered.)"
            else:
                error_message = f"Content filtered by Google's Responsible AI practices ({filtered_count} videos filtered.)"

            logging.error(error_message)
            raise Exception(error_message)

    def _extract_video_bytes(self, poll_response):
        """Return the bytes of the first video, from inline base64 or by URL download."""
        result = getattr(poll_response, "response", None)
        videos = getattr(result, "videos", None) if result else None
        if not videos:
            raise Exception("Video generation completed but no video was returned")

        video = videos[0]

        # Video is provided either as inline base64 or as a URL
        encoded = getattr(video, "bytesBase64Encoded", None)
        if encoded:
            return base64.b64decode(encoded)

        video_url = getattr(video, "gcsUri", None)
        if video_url:
            video_response = requests.get(video_url, timeout=self._DOWNLOAD_TIMEOUT)
            # Without this an HTTP error page would be returned as "video" bytes
            video_response.raise_for_status()
            return video_response.content

        raise Exception("Video returned but no data or URL was provided")
|
|
|
|
|
|
# Register the node: identifier -> implementing class.
NODE_CLASS_MAPPINGS = {"VeoVideoGenerationNode": VeoVideoGenerationNode}

# Same identifier -> human-readable display name.
NODE_DISPLAY_NAME_MAPPINGS = {"VeoVideoGenerationNode": "Google Veo2 Video Generation"}
|