feat: Add ImageResizeMode for GenerateVideos

matthew29tang · copybara-github · commit 152209c11c5a · 2026-04-09T19:06:43.000-07:00
PiperOrigin-RevId: 869306823
diff --git a/google/genai/models.py b/google/genai/models.py
@@ -2115,6 +2115,9 @@ def _GenerateVideosConfig_to_mldev(
   if getv(from_object, ['labels']) is not None:
     raise ValueError('labels parameter is not supported in Gemini API.')
 
+  if getv(from_object, ['resize_mode']) is not None:
+    raise ValueError('resize_mode parameter is not supported in Gemini API.')
+
   return to_object
 
 
@@ -2241,6 +2244,13 @@ def _GenerateVideosConfig_to_vertex(
   if getv(from_object, ['labels']) is not None:
     setv(parent_object, ['labels'], getv(from_object, ['labels']))
 
+  if getv(from_object, ['resize_mode']) is not None:
+    setv(
+        parent_object,
+        ['parameters', 'resizeMode'],
+        getv(from_object, ['resize_mode']),
+    )
+
   return to_object
 
 
diff --git a/google/genai/tests/models/test_generate_videos.py b/google/genai/tests/models/test_generate_videos.py
@@ -304,6 +304,8 @@ def test_text_and_image_to_video_poll(client):
       image=GCS_IMAGE if client.vertexai else LOCAL_IMAGE,
       config=types.GenerateVideosConfig(
           output_gcs_uri=OUTPUT_GCS_URI if client.vertexai else None,
+          resize_mode=(types.ImageResizeMode.CROP
+                       if client.vertexai else None),
       ),
   )
   while not operation.done:
diff --git a/google/genai/types.py b/google/genai/types.py
@@ -1006,6 +1006,17 @@ class VideoCompressionQuality(_common.CaseInSensitiveEnum):
       with a larger file size."""
 
 
+class ImageResizeMode(_common.CaseInSensitiveEnum):
+  """Resize mode for the image input for video generation."""
+
+  CROP = 'CROP'
+  """Crop the image to fit the correct aspect ratio (so we lose parts
+      of the image in the process)."""
+  PAD = 'PAD'
+  """Pad the image to fit the correct aspect ratio (so we don't lose
+      any parts of the image in the process)."""
+
+
 class TuningMethod(_common.CaseInSensitiveEnum):
   """Enum representing the tuning method."""
 
@@ -11159,6 +11170,10 @@ class GenerateVideosConfig(_common.BaseModel):
       default=None,
       description="""User specified labels to track billing usage.""",
   )
+  resize_mode: Optional[ImageResizeMode] = Field(
+      default=None,
+      description="""Resize mode of the image input for video generation.""",
+  )
 
 
 class GenerateVideosConfigDict(TypedDict, total=False):
@@ -11231,6 +11246,9 @@ class GenerateVideosConfigDict(TypedDict, total=False):
   labels: Optional[dict[str, str]]
   """User specified labels to track billing usage."""
 
+  resize_mode: Optional[ImageResizeMode]
+  """Resize mode of the image input for video generation."""
+
 
 GenerateVideosConfigOrDict = Union[
     GenerateVideosConfig, GenerateVideosConfigDict

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -304,6 +304,8 @@ def test_text_and_image_to_video_poll(client):` |
| `304` | `304` | `image=GCS_IMAGE if client.vertexai else LOCAL_IMAGE,` |
| `305` | `305` | `config=types.GenerateVideosConfig(` |
| `306` | `306` | `output_gcs_uri=OUTPUT_GCS_URI if client.vertexai else None,` |
| | `307` | `+ resize_mode=(types.ImageResizeMode.CROP` |
| | `308` | `+ if client.vertexai else None),` |
| `307` | `309` | `),` |
| `308` | `310` | `)` |
| `309` | `311` | `while not operation.done:` |