From 7f1a97bae36e2d106175995931a506b3f735854d Mon Sep 17 00:00:00 2001
From: Mikhail Moskovchenko <43753582+simonreise@users.noreply.github.com>
Date: Fri, 9 May 2025 19:51:46 +0400
Subject: [PATCH] Fix reduce-labels in BEIT Fast Image Processor (#38042)

* Fixed reduce-labels

* Little doc fix

* Change docstring
---
 docs/source/en/model_doc/beit.md                   |  1 +
 docs/source/ja/model_doc/beit.md                   |  1 +
 .../models/beit/image_processing_beit_fast.py      | 14 ++++++++++++--
 3 files changed, 14 insertions(+), 2 deletions(-)

diff --git a/docs/source/en/model_doc/beit.md b/docs/source/en/model_doc/beit.md
index e40fbdc9c8..7d29780260 100644
--- a/docs/source/en/model_doc/beit.md
+++ b/docs/source/en/model_doc/beit.md
@@ -150,6 +150,7 @@ If you're interested in submitting a resource to be included here, please feel f
 [[autodoc]] BeitImageProcessor
     - preprocess
     - post_process_semantic_segmentation
+
 ## BeitImageProcessorFast
 
 [[autodoc]] BeitImageProcessorFast
diff --git a/docs/source/ja/model_doc/beit.md b/docs/source/ja/model_doc/beit.md
index e0b94693a3..948c3bad70 100644
--- a/docs/source/ja/model_doc/beit.md
+++ b/docs/source/ja/model_doc/beit.md
@@ -105,6 +105,7 @@ BEiT の使用を開始するのに役立つ公式 Hugging Face およびコミ
 
 [[autodoc]] BeitImageProcessor
     - preprocess
+    - post_process_semantic_segmentation
 
 ## BeitImageProcessorFast
 
diff --git a/src/transformers/models/beit/image_processing_beit_fast.py b/src/transformers/models/beit/image_processing_beit_fast.py
index 5f090b9276..ce3a9707b8 100644
--- a/src/transformers/models/beit/image_processing_beit_fast.py
+++ b/src/transformers/models/beit/image_processing_beit_fast.py
@@ -137,12 +137,22 @@ class BeitImageProcessorFast(BaseImageProcessorFast):
         processed_images = torch.stack(processed_images, dim=0) if return_tensors else processed_images
         return processed_images
 
+    def _preprocess_images(
+        self,
+        images,
+        **kwargs,
+    ):
+        """Preprocesses images."""
+        kwargs["do_reduce_labels"] = False
+        processed_images = self._preprocess(images=images, **kwargs)
+        return processed_images
+
     def _preprocess_segmentation_maps(
         self,
         segmentation_maps,
         **kwargs,
     ):
-        """Preprocesses a single segmentation map."""
+        """Preprocesses segmentation maps."""
         processed_segmentation_maps = []
         for segmentation_map in segmentation_maps:
             segmentation_map = self._process_image(
@@ -215,7 +225,7 @@ class BeitImageProcessorFast(BaseImageProcessorFast):
         kwargs.pop("default_to_square")
         kwargs.pop("data_format")
 
-        images = self._preprocess(
+        images = self._preprocess_images(
             images=images,
             **kwargs,
         )