
    sg|                         d dl mZ ddlmZmZ ddlmZmZmZ  e       rddl	m
Z
  e ed      d	       G d
 de             Zy)    )Dict   )add_end_docstringsis_vision_available   )GenericTensorPipelinebuild_pipeline_init_args)
load_imageT)has_image_processora  
        image_processor_kwargs (`dict`, *optional*):
                Additional dictionary of keyword arguments passed along to the image processor e.g.
                {"size": {"height": 100, "width": 100}}
        pool (`bool`, *optional*, defaults to `False`):
            Whether or not to return the pooled output. If `False`, the model will return the raw hidden states.
    c                   P     e Zd ZdZddZd	deeef   fdZd Z	d
dZ
 fdZ xZS )ImageFeatureExtractionPipelinea+  
    Image feature extraction pipeline uses no model head. This pipeline extracts the hidden states from the base
    transformer, which can be used as features in downstream tasks.

    Example:

    ```python
    >>> from transformers import pipeline

    >>> extractor = pipeline(model="google/vit-base-patch16-224", task="image-feature-extraction")
    >>> result = extractor("https://huggingface.co/datasets/Narsil/image_dummy/raw/main/parrots.png", return_tensors=True)
    >>> result.shape  # This is a tensor of shape [1, sequence_lenth, hidden_dimension] representing the input image.
    torch.Size([1, 197, 768])
    ```

    Learn more about the basics of using a pipeline in the [pipeline tutorial](../pipeline_tutorial)

    This image feature extraction pipeline can currently be loaded from [`pipeline`] using the task identifier:
    `"image-feature-extraction"`.

    All vision models may be used for this pipeline. See a list of all models, including community-contributed models on
    [huggingface.co/models](https://huggingface.co/models).
    c                 P    |i n|}i }|||d<   |||d<   d|v r|d   |d<   |i |fS )Npoolreturn_tensorstimeout )selfimage_processor_kwargsr   r   kwargspreprocess_paramspostprocess_paramss          b/var/www/html/venv/lib/python3.12/site-packages/transformers/pipelines/image_feature_extraction.py_sanitize_parametersz3ImageFeatureExtractionPipeline._sanitize_parameters.   s_    "8"@BF\)-v&%3A/0+1)+<i( "&888    returnc                     t        ||      } | j                  |fd| j                  i|}| j                  dk(  r|j                  | j                        }|S )N)r   r   pt)r   image_processor	frameworktotorch_dtype)r   imager   r   model_inputss        r   
preprocessz)ImageFeatureExtractionPipeline.preprocess<   sU    5'2+t++Ek$..kTjk>>T!'??4+;+;<Lr   c                 *     | j                   di |}|S )Nr   )model)r   r$   model_outputss      r   _forwardz'ImageFeatureExtractionPipeline._forwardC   s    "

2\2r   c                     ||nd}|rd|vrt        d      |d   }n|d   }|r|S | j                  dk(  r|j                         S | j                  dk(  r|j                         j                         S y )NFpooler_outputzeNo pooled output was returned. Make sure the model has a `pooler` layer when using the `pool` option.r   r   tf)
ValueErrorr    tolistnumpy)r   r(   r   r   outputss        r   postprocessz*ImageFeatureExtractionPipeline.postprocessG   s    'tUm3 {  $O4G $A&GN>>T!>>##^^t#==?))++ $r   c                 "    t        |   |i |S )a  
        Extract the features of the input(s).

        Args:
            images (`str`, `List[str]`, `PIL.Image` or `List[PIL.Image]`):
                The pipeline handles three types of images:

                - A string containing a http link pointing to an image
                - A string containing a local path to an image
                - An image loaded in PIL directly

                The pipeline accepts either a single image or a batch of images, which must then be passed as a string.
                Images in a batch must all be in the same format: all as http links, all as local paths, or all as PIL
                images.
            timeout (`float`, *optional*, defaults to None):
                The maximum time in seconds to wait for fetching images from the web. If None, no timeout is used and
                the call may block forever.
        Return:
            A nested list of `float`: The features computed by the model.
        )super__call__)r   argsr   	__class__s      r   r4   z'ImageFeatureExtractionPipeline.__call__[   s    * w000r   )NNN)N)NF)__name__
__module____qualname____doc__r   r   strr   r%   r)   r1   r4   __classcell__)r6   s   @r   r   r      s9    094PSUbPbKc ,(1 1r   r   N)typingr   utilsr   r   baser   r	   r
   image_utilsr   r   r   r   r   <module>rA      sL     ; C C ( 6	[1X [1	[1r   