Ë
    
­œiœ<  ã                   óN  — d Z ddlmZ ddlZddlmZmZmZ ddl	m
Z
mZmZ ddlmZmZmZmZmZmZmZmZmZ ddlmZ dd	lmZmZmZmZmZ dd
lm Z   e«       rddl!Z! e«       rddl"Z" ejF                  e$«      Z% G d„ ded¬«      Z&d„ Z'd„ Z( e d¬«       G d„ de«      «       Z)dgZ*y)z#Image processor class for ImageGPT.é    )ÚUnionNé   )ÚBaseImageProcessorÚBatchFeatureÚget_size_dict)ÚrescaleÚresizeÚto_channel_dimension_format)	ÚChannelDimensionÚ
ImageInputÚPILImageResamplingÚinfer_channel_dimension_formatÚis_scaled_imageÚmake_list_of_imagesÚto_numpy_arrayÚvalid_imagesÚvalidate_preprocess_arguments)ÚImagesKwargs)Ú
TensorTypeÚfilter_out_non_signature_kwargsÚis_torch_availableÚis_vision_availableÚlogging)Úrequiresc                   óX   — e Zd ZU dZeej                  eee      df   dz  e	d<   e
e	d<   y)ÚImageGPTImageProcessorKwargsa  
    clusters (`np.ndarray` or `list[list[int]]` or `torch.Tensor`, *optional*):
        The color clusters to use, of shape `(n_clusters, 3)` when color quantizing. Can be overridden by `clusters`
        in `preprocess`.
    do_color_quantize (`bool`, *optional*, defaults to `True`):
        Controls whether to apply color quantization to convert continuous pixel values to discrete cluster indices.
        When True, each pixel is assigned to its nearest color cluster, enabling ImageGPT's discrete token modeling.
    ztorch.TensorNÚclustersÚdo_color_quantize)Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   ÚnpÚndarrayÚlistÚintÚ__annotations__Úbool© ó    úr/mnt/e/genesis-system/.venv/lib/python3.12/site-packages/transformers/models/imagegpt/image_processing_imagegpt.pyr   r   /   s2   … ñð B—J‘J  T¨#¡Y¡°Ð?Ñ@À4ÑGÓGØÔr*   r   F)Útotalc                 ó$  — |j                   }t        j                  t        j                  | «      d¬«      }t        j                  t        j                  |«      d¬«      }t        j                  | |«      }|d d …d f   d|z  z
  |d d d …f   z   }|S )Né   ©Úaxisr   é   )ÚTr#   ÚsumÚsquareÚmatmul)ÚaÚbÚa2Úb2ÚabÚds         r+   Úsquared_euclidean_distancer<   =   sr   € Ø	‰€AÜ	‰”—	‘	˜!“ 1Ô	%€BÜ	‰”—	‘	˜!“ 1Ô	%€BÜ	‰1a‹€BØ
Š1ˆdˆ7‰a˜"‘fÑ˜r $ª '™{Ñ*€AØ€Hr*   c                 ól   — | j                  dd«      } t        | |«      }t        j                  |d¬«      S )Néÿÿÿÿr   r.   r/   )Úreshaper<   r#   Úargmin)Úxr   r;   s      r+   Úcolor_quantizerB   F   s/   € Ø		‰	"aÓ€AÜ" 1 hÓ/€AÜ9‰9Q˜QÔÐr*   )Úvision)Úbackendsc                   ó¦  ‡ — e Zd ZdZdgZeZdddej                  ddfde	e	e
      ej                  z  dz  dedeee
f   dz  ded	ed
eddfˆ fd„Zej                  ddfdej                  deee
f   dedeez  dz  deez  dz  dej                  fd„Z	 	 ddej                  deez  dz  deez  dz  dej                  fd„Z e«       dddddddej*                  df	dededz  deee
f   dz  dedz  d	edz  d
edz  de	e	e
      ej                  z  dz  deez  dz  deez  dz  deez  dz  dej2                  j2                  fd„«       Zˆ fd„Zˆ xZS )ÚImageGPTImageProcessora®  
    Constructs a ImageGPT image processor. This image processor can be used to resize images to a smaller resolution
    (such as 32x32 or 64x64), normalize them and finally color quantize them to obtain sequences of "pixel values"
    (color clusters).

    Args:
        clusters (`np.ndarray` or `list[list[int]]`, *optional*):
            The color clusters to use, of shape `(n_clusters, 3)` when color quantizing. Can be overridden by `clusters`
            in `preprocess`.
        do_resize (`bool`, *optional*, defaults to `True`):
            Whether to resize the image's dimensions to `(size["height"], size["width"])`. Can be overridden by
            `do_resize` in `preprocess`.
        size (`dict[str, int]` *optional*, defaults to `{"height": 256, "width": 256}`):
            Size of the image after resizing. Can be overridden by `size` in `preprocess`.
        resample (`PILImageResampling`, *optional*, defaults to `Resampling.BILINEAR`):
            Resampling filter to use if resizing the image. Can be overridden by `resample` in `preprocess`.
        do_normalize (`bool`, *optional*, defaults to `True`):
            Whether to normalize the image pixel value to between [-1, 1]. Can be overridden by `do_normalize` in
            `preprocess`.
        do_color_quantize (`bool`, *optional*, defaults to `True`):
            Whether to color quantize the image. Can be overridden by `do_color_quantize` in `preprocess`.
    Úpixel_valuesNTr   Ú	do_resizeÚsizeÚresampleÚdo_normalizer   Úreturnc                 óÎ   •— t        ‰|   di |¤Ž ||ndddœ}t        |«      }|t        j                  |«      nd | _        || _        || _        || _        || _	        || _
        y )Né   )ÚheightÚwidthr)   )ÚsuperÚ__init__r   r#   Úarrayr   rH   rI   rJ   rK   r   )	Úselfr   rH   rI   rJ   rK   r   ÚkwargsÚ	__class__s	           €r+   rR   zImageGPTImageProcessor.__init__h   sl   ø€ ô 	‰ÑÑ"˜6Ò"ØÐ'‰t¸ÀcÑ-JˆÜ˜TÓ"ˆØ.6Ð.BœŸ™ Ô*ÈˆŒØ"ˆŒØˆŒ	Ø ˆŒØ(ˆÔØ!2ˆÕr*   ÚimageÚdata_formatÚinput_data_formatc                 ó–   — t        |«      }d|vsd|vrt        d|j                  «       › «      ‚|d   |d   f}t        |f||||dœ|¤ŽS )a  
        Resize an image to `(size["height"], size["width"])`.

        Args:
            image (`np.ndarray`):
                Image to resize.
            size (`dict[str, int]`):
                Dictionary in the format `{"height": int, "width": int}` specifying the size of the output image.
            resample (`PILImageResampling`, *optional*, defaults to `PILImageResampling.BILINEAR`):
                `PILImageResampling` filter to use when resizing the image e.g. `PILImageResampling.BILINEAR`.
            data_format (`ChannelDimension` or `str`, *optional*):
                The channel dimension format for the output image. If unset, the channel dimension format of the input
                image is used. Can be one of:
                - `"channels_first"` or `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                - `"channels_last"` or `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                - `"none"` or `ChannelDimension.NONE`: image in (height, width) format.
            input_data_format (`ChannelDimension` or `str`, *optional*):
                The channel dimension format for the input image. If unset, the channel dimension format is inferred
                from the input image. Can be one of:
                - `"channels_first"` or `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                - `"channels_last"` or `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                - `"none"` or `ChannelDimension.NONE`: image in (height, width) format.

        Returns:
            `np.ndarray`: The resized image.
        rO   rP   zFThe `size` dictionary must contain the keys `height` and `width`. Got )rI   rJ   rX   rY   )r   Ú
ValueErrorÚkeysr	   )rT   rW   rI   rJ   rX   rY   rU   Úoutput_sizes           r+   r	   zImageGPTImageProcessor.resize~   sy   € ôF ˜TÓ"ˆØ˜4Ñ 7°$Ñ#6ÜÐeÐfj×foÑfoÓfqÐerÐsÓtÐtØ˜H‘~ t¨G¡}Ð5ˆÜØð
àØØ#Ø/ñ
ð ñ
ð 	
r*   c                 ó.   — t        |d||¬«      }|dz
  }|S )a  
        Normalizes an images' pixel values to between [-1, 1].

        Args:
            image (`np.ndarray`):
                Image to normalize.
            data_format (`str` or `ChannelDimension`, *optional*):
                The channel dimension format of the image. If not provided, it will be the same as the input image.
            input_data_format (`ChannelDimension` or `str`, *optional*):
                The channel dimension format of the input image. If not provided, it will be inferred.
        g€?)rW   ÚscalerX   rY   r.   )r   )rT   rW   rX   rY   s       r+   Ú	normalizez ImageGPTImageProcessor.normalize®   s#   € ô" ˜e¨9À+ÐarÔsˆØ˜‘	ˆØˆr*   ÚimagesÚreturn_tensorsc           	      ó\  — ||n| j                   }||n| j                  }t        |«      }||n| j                  }||n| j                  }||n| j
                  }||n| j                  }t        j                  |«      }t        |«      }t        |«      st        d«      ‚t        |||¬«       |r|€t        d«      ‚|D cg c]  }t        |«      ‘Œ }}|r#t        |d   «      rt        j!                  d«       |
€t#        |d   «      }
|r"|D cg c]  }| j%                  ||||
¬«      ‘Œ }}|r |D cg c]  }| j'                  ||
¬«      ‘Œ }}|r–|D cg c]  }t)        |t*        j,                  |
«      ‘Œ }}t        j                  |«      }t/        ||«      j1                  |j2                  dd	 «      }|j2                  d   }|j1                  |d	«      }t5        |«      }d
|i}n|D cg c]  }t)        ||	|
«      ‘Œ }}d|i}t7        ||¬«      S c c}w c c}w c c}w c c}w c c}w )aœ
  
        Preprocess an image or batch of images.

        Args:
            images (`ImageInput`):
                Image to preprocess. Expects a single or batch of images with pixel values ranging from 0 to 255. If
                passing in images with pixel values between 0 and 1, set `do_normalize=False`.
            do_resize (`bool`, *optional*, defaults to `self.do_resize`):
                Whether to resize the image.
            size (`dict[str, int]`, *optional*, defaults to `self.size`):
                Size of the image after resizing.
            resample (`int`, *optional*, defaults to `self.resample`):
                Resampling filter to use if resizing the image. This can be one of the enum `PILImageResampling`, Only
                has an effect if `do_resize` is set to `True`.
            do_normalize (`bool`, *optional*, defaults to `self.do_normalize`):
                Whether to normalize the image
            do_color_quantize (`bool`, *optional*, defaults to `self.do_color_quantize`):
                Whether to color quantize the image.
            clusters (`np.ndarray` or `list[list[int]]`, *optional*, defaults to `self.clusters`):
                Clusters used to quantize the image of shape `(n_clusters, 3)`. Only has an effect if
                `do_color_quantize` is set to `True`.
            return_tensors (`str` or `TensorType`, *optional*):
                The type of tensors to return. Can be one of:
                    - Unset: Return a list of `np.ndarray`.
                    - `TensorType.PYTORCH` or `'pt'`: Return a batch of type `torch.Tensor`.
                    - `TensorType.NUMPY` or `'np'`: Return a batch of type `np.ndarray`.
            data_format (`ChannelDimension` or `str`, *optional*, defaults to `ChannelDimension.FIRST`):
                The channel dimension format for the output image. Can be one of:
                    - `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                    - `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                Only has an effect if `do_color_quantize` is set to `False`.
            input_data_format (`ChannelDimension` or `str`, *optional*):
                The channel dimension format for the input image. If unset, the channel dimension format is inferred
                from the input image. Can be one of:
                - `"channels_first"` or `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                - `"channels_last"` or `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                - `"none"` or `ChannelDimension.NONE`: image in (height, width) format.
        NzSInvalid image type. Must be of type PIL.Image.Image, numpy.ndarray, or torch.Tensor)rH   rI   rJ   z8Clusters must be specified if do_color_quantize is True.r   z®It looks like you are trying to rescale already rescaled images. If you wish to do this, make sure to set `do_normalize` to `False` and that pixel values are between [-1, 1].)rW   rI   rJ   rY   )rW   rY   r>   Ú	input_idsrG   )ÚdataÚtensor_type)rH   rI   r   rJ   rK   r   r   r#   rS   r   r   r[   r   r   r   ÚloggerÚwarning_oncer   r	   r`   r
   r   ÚLASTrB   r?   Úshaper%   r   )rT   ra   rH   rI   rJ   rK   r   r   rb   rX   rY   rW   Ú
batch_sizere   s                 r+   Ú
preprocessz!ImageGPTImageProcessor.preprocessÃ   sY  € ðh "+Ð!6‘I¸D¿N¹Nˆ	ØÐ'‰t¨T¯Y©YˆÜ˜TÓ"ˆØ'Ð3‘8¸¿¹ˆØ'3Ð'?‘|ÀT×EVÑEVˆØ1BÐ1NÑ-ÐTX×TjÑTjÐØ'Ð3‘8¸¿¹ˆÜ—8‘8˜HÓ%ˆä$ VÓ,ˆä˜FÔ#ÜÐrÓsÐsô 	&ØØØõ	
ñ  Ð!1ÜÐWÓXÐXð 6<Ö<¨E”. Õ'Ð<ˆÐ<áœO¨F°1©IÔ6Ü×Ñðhôð
 Ð$ä >¸vÀa¹yÓ IÐáð $öàð —‘ %¨d¸XÐYjÕkðˆFð ñ
 ØdjÖkÐ[`d—n‘n¨5ÐDUnÕVÐkˆFÐkáØpvÖwÐglÔ1°%Ô9I×9NÑ9NÐPaÕbÐwˆFÐwä—X‘X˜fÓ%ˆFÜ# F¨HÓ5×=Ñ=¸f¿l¹lÈ3ÈBÐ>OÓPˆFð  Ÿ™ a™ˆJØ—^‘^ J°Ó3ˆFô ˜&“\ˆFØ Ð(‰DàflÖmÐ]bÔ1°%¸ÐFWÕXÐmˆFÐmØ" FÐ+ˆDÜ °>ÔBÐBùòK =ùòùò lùò xùò ns   ÃHÄHÄ6HÅ"H$Ç.H)c                 óÖ   •— t         ‰|   «       }|j                  d«      3t        |d   t        j
                  «      r|d   j                  «       |d<   g d¢}|D ]  }||v sŒd ||<   Œ |S )Nr   )Ú
image_meanÚ	image_stdÚrescale_factorÚ
do_rescale)rQ   Úto_dictÚgetÚ
isinstancer#   r$   Útolist)rT   ÚoutputÚmissing_keysÚkeyrV   s       €r+   rr   zImageGPTImageProcessor.to_dict8  sv   ø€ Ü‘‘Ó"ˆà:‰:jÓ!Ð-´*¸VÀJÑ=OÔQS×Q[ÑQ[Ô2\Ø!'¨
Ñ!3×!:Ñ!:Ó!<ˆF:ÑâRˆØò 	#ˆCØfŠ}Ø"s’ð	#ð ˆr*   )NN)r   r    r!   r"   Úmodel_input_namesr   Úvalid_kwargsr   ÚBILINEARr%   r&   r#   r$   r(   ÚdictÚstrrR   r   r	   r`   r   ÚFIRSTr   r   ÚPILÚImagerl   rr   Ú__classcell__)rV   s   @r+   rF   rF   L   s  ø„ ñð. (Ð(ÐØ/€Lð
 9=ØØ&*Ø'9×'BÑ'BØ!Ø"&ñ3ð t˜C‘y‘/ B§J¡JÑ.°Ñ5ð3ð ð	3ð
 3˜8‰n˜tÑ#ð3ð %ð3ð ð3ð  ð3ð 
õ3ð4 (:×'BÑ'BØ59Ø;?ñ.
àz‰zð.
ð 3˜8‰nð.
ð %ð	.
ð
 Ð+Ñ+¨dÑ2ð.
ð Ð!1Ñ1°DÑ8ð.
ð 
‰ó.
ðf 6:Ø;?ñ	àz‰zðð Ð+Ñ+¨dÑ2ðð Ð!1Ñ1°DÑ8ð	ð
 
‰óñ* %Ó&ð "&Ø&*Ø.2Ø$(Ø)-Ø8<Ø26Ø5E×5KÑ5KØ;?ñrCàðrCð ˜$‘;ðrCð 3˜8‰n˜tÑ#ð	rCð
 % tÑ+ðrCð ˜T‘kðrCð   $™;ðrCð t˜C‘y‘/ B§J¡JÑ.°Ñ5ðrCð ˜jÑ(¨4Ñ/ðrCð Ð+Ñ+¨dÑ2ðrCð Ð!1Ñ1°DÑ8ðrCð 
‰‰òrCó 'ðrC÷hð r*   rF   )+r"   Útypingr   Únumpyr#   Úimage_processing_utilsr   r   r   Úimage_transformsr   r	   r
   Úimage_utilsr   r   r   r   r   r   r   r   r   Úprocessing_utilsr   Úutilsr   r   r   r   r   Úutils.import_utilsr   r   ÚtorchÚ
get_loggerr   rg   r   r<   rB   rF   Ú__all__r)   r*   r+   ú<module>r      s¦   ðñ *å ã ç UÑ Uß LÑ L÷
÷ 
õ 
õ -ß rÕ rÝ *ñ ÔÛáÔÛà	ˆ×	Ñ	˜HÓ	%€ô <°uõ òò ñ 
;ÔôvÐ/ó vó  ðvðr $Ð
$r*   