Kwai-Keye committed on
Commit
a964671
·
verified ·
1 Parent(s): a88b27e

fix preprocessor

Browse files
image_processing_keye.py CHANGED
@@ -129,7 +129,7 @@ def smart_resize(
129
  width: int,
130
  factor: int = 28,
131
  min_pixels: int = 28 * 28 * 130,
132
- max_pixels: int = 28 * 28 * 1670,
133
  ):
134
  """Rescales the image so that the following conditions are met:
135
 
@@ -223,7 +223,7 @@ class SiglipImageProcessor(BaseImageProcessor):
223
  image_std: Optional[Union[float, List[float]]] = None,
224
  do_convert_rgb: bool = True,
225
  min_pixels: int = 28 * 28 * 130,
226
- max_pixels: int = 28 * 28 * 1670,
227
  patch_size: int = 14,
228
  temporal_patch_size: int = 1,
229
  merge_size: int = 2,
@@ -357,7 +357,6 @@ class SiglipImageProcessor(BaseImageProcessor):
357
  processed_images = []
358
 
359
  for image in images:
360
- # image = self.mvit_rescale(image, merge_size=self.merge_size)
361
  if do_resize:
362
  resized_height, resized_width = smart_resize(
363
  height,
@@ -385,7 +384,6 @@ class SiglipImageProcessor(BaseImageProcessor):
385
  std=image_std,
386
  input_data_format=input_data_format,
387
  )
388
-
389
  image = to_channel_dimension_format(
390
  image, data_format, input_channel_dim=input_data_format
391
  )
 
129
  width: int,
130
  factor: int = 28,
131
  min_pixels: int = 28 * 28 * 130,
132
+ max_pixels: int = 28 * 28 * 1280,
133
  ):
134
  """Rescales the image so that the following conditions are met:
135
 
 
223
  image_std: Optional[Union[float, List[float]]] = None,
224
  do_convert_rgb: bool = True,
225
  min_pixels: int = 28 * 28 * 130,
226
+ max_pixels: int = 28 * 28 * 1280,
227
  patch_size: int = 14,
228
  temporal_patch_size: int = 1,
229
  merge_size: int = 2,
 
357
  processed_images = []
358
 
359
  for image in images:
 
360
  if do_resize:
361
  resized_height, resized_width = smart_resize(
362
  height,
 
384
  std=image_std,
385
  input_data_format=input_data_format,
386
  )
 
387
  image = to_channel_dimension_format(
388
  image, data_format, input_channel_dim=input_data_format
389
  )
preprocessor_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "min_pixels": 101920,
3
- "max_pixels": 1309280,
4
  "patch_size": 14,
5
  "temporal_patch_size": 1,
6
  "merge_size": 2,
@@ -15,4 +15,4 @@
15
  "AutoProcessor": "processing_keye.KeyeProcessor",
16
  "AutoImageProcessor": "image_processing_keye.SiglipImageProcessor"
17
  }
18
- }
 
1
  {
2
+ "min_pixels": 102400,
3
+ "max_pixels": 1003520,
4
  "patch_size": 14,
5
  "temporal_patch_size": 1,
6
  "merge_size": 2,
 
15
  "AutoProcessor": "processing_keye.KeyeProcessor",
16
  "AutoImageProcessor": "image_processing_keye.SiglipImageProcessor"
17
  }
18
+ }