[data] gemma3 plugin pan and scan (#7294)

* gemma3 pan and scan * add test case * fix test
2025-03-13 23:29:23 +08:00
parent 0be0d7796a
commit 93e6184cbe
5 changed files with 65 additions and 4 deletions
--- a/src/llamafactory/hparams/model_args.py
+++ b/src/llamafactory/hparams/model_args.py
@@ -218,6 +218,10 @@ class ProcessorArguments:
        default=32 * 32,
        metadata={"help": "The minimum number of pixels of image inputs."},
    )
+    image_do_pan_and_scan: bool = field(
+        default=False,
+        metadata={"help": "Use pan and scan to process image for gemma3."},
+    )
    video_max_pixels: int = field(
        default=256 * 256,
        metadata={"help": "The maximum number of pixels of video inputs."},
@@ -235,6 +239,13 @@ class ProcessorArguments:
        metadata={"help": "The maximum number of sampled frames for video inputs."},
    )

+    def __post_init__(self):
+        if self.image_max_pixels < self.image_min_pixels:
+            raise ValueError("`image_max_pixels` cannot be smaller than `image_min_pixels`.")
+
+        if self.video_max_pixels < self.video_min_pixels:
+            raise ValueError("`video_max_pixels` cannot be smaller than `video_min_pixels`.")
+

@dataclass
 class ExportArguments:
@@ -342,6 +353,7 @@ class ModelArguments(VllmArguments, ExportArguments, ProcessorArguments, Quantiz

    def __post_init__(self):
        BaseModelArguments.__post_init__(self)
+        ProcessorArguments.__post_init__(self)
        ExportArguments.__post_init__(self)
        VllmArguments.__post_init__(self)