mirror of
https://github.com/ostris/ai-toolkit.git
synced 2026-02-20 04:13:57 +00:00
Change pixtral to crop based on number of pixels instead of largest dimension
This commit is contained in:
@@ -1,3 +1,4 @@
|
||||
import math
|
||||
from typing import List, Optional, Tuple, Any, Union
|
||||
import os
|
||||
import torch
|
||||
@@ -461,7 +462,12 @@ class PixtralVisionImagePreprocessor:
|
||||
|
||||
w, h = img.shape[-1], img.shape[-2]
|
||||
|
||||
ratio = max(h / self.max_image_size, w / self.max_image_size)
|
||||
# Originally, Pixtral used the larger of the two dimensions, but we
|
||||
# use a base size derived from the pixel count: sqrt(width * height).
|
||||
# ratio = max(h / self.max_image_size, w / self.max_image_size) # original
|
||||
|
||||
base_size = int(math.sqrt(w * h))
|
||||
ratio = base_size / self.max_image_size
|
||||
if ratio > 1:
|
||||
w = round(w / ratio)
|
||||
h = round(h / ratio)
|
||||
|
||||
Reference in New Issue
Block a user