
    bi&                        d dl mZmZmZ d dlZddlmZmZm	Z	m
Z
mZ ddlmZmZ  e	            rd dlmZ ddlmZ  e            rdd	lmZmZmZmZ  e
j        e          Z e ed
                     G d de                      ZdS )    )AnyUnionoverloadN   )add_end_docstringsis_torch_availableis_vision_availableloggingrequires_backends   )Pipelinebuild_pipeline_init_args)Image)
load_image)*MODEL_FOR_IMAGE_SEGMENTATION_MAPPING_NAMES-MODEL_FOR_INSTANCE_SEGMENTATION_MAPPING_NAMES-MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPING_NAMES.MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPING_NAMEST)has_image_processorc                       e Zd ZdZdZdZdZdZ fdZd Z	e
deedf         d	ed
eeeef                  fd            Ze
dee         ed         z  d	ed
eeeeef                           fd            Zdeedee         ed         f         d	ed
eeeef                  eeeeef                           z  f fdZddZd Z	 ddZ xZS )ImageSegmentationPipelinea  
    Image segmentation pipeline using any `AutoModelForXXXSegmentation`. This pipeline predicts masks of objects and
    their classes.

    Example:

    ```python
    >>> from transformers import pipeline

    >>> segmenter = pipeline(model="facebook/detr-resnet-50-panoptic")
    >>> segments = segmenter("https://huggingface.co/datasets/Narsil/image_dummy/raw/main/parrots.png")
    >>> len(segments)
    2

    >>> segments[0]["label"]
    'bird'

    >>> segments[1]["label"]
    'bird'

    >>> type(segments[0]["mask"])  # This is a black and white mask showing where is the bird on the original image.
    <class 'PIL.Image.Image'>

    >>> segments[0]["mask"].size
    (768, 512)
    ```


    This image segmentation pipeline can currently be loaded from [`pipeline`] using the following task identifier:
    `"image-segmentation"`.

    See the list of available models on
    [huggingface.co/models](https://huggingface.co/models?filter=image-segmentation).
    FTNc                 F    t                      j        |i | t          | d           t          j                    }|                    t                     |                    t                     |                    t                     | 	                    |           d S )Nvision)
super__init__r   r   copyupdater   r   r   check_model_type)selfargskwargsmapping	__class__s       d/root/projects/butler/venv/lib/python3.11/site-packages/transformers/pipelines/image_segmentation.pyr   z"ImageSegmentationPipeline.__init__D   s    $)&)))$)))<ACCDEEEDEEEEFFFg&&&&&    c                     i }i }d|v r|d         |d<   |d         |d<   d|v r|d         |d<   d|v r|d         |d<   d|v r|d         |d<   d|v r|d         |d<   |i |fS )Nsubtask	thresholdmask_thresholdoverlap_mask_area_thresholdtimeout )r   r!   preprocess_kwargspostprocess_kwargss       r$   _sanitize_parametersz.ImageSegmentationPipeline._sanitize_parametersN   s    ,29,=y)+1)+<i(&  .4[.A{+v%%39:J3K/0(F22@FGd@e<=+1)+<i( "&888r%   inputszImage.Imager!   returnc                     d S Nr,   r   r0   r!   s      r$   __call__z"ImageSegmentationPipeline.__call___   s    beber%   c                     d S r3   r,   r4   s      r$   r5   z"ImageSegmentationPipeline.__call__b   s    nqnqr%   c                     d|v r|                     d          }|t          d           t                      j        |fi |S )a	  
        Perform segmentation (detect masks & classes) in the image(s) passed as inputs.

        Args:
            inputs (`str`, `list[str]`, `PIL.Image` or `list[PIL.Image]`):
                The pipeline handles three types of images:

                - A string containing an HTTP(S) link pointing to an image
                - A string containing a local path to an image
                - An image loaded in PIL directly

                The pipeline accepts either a single image or a batch of images. Images in a batch must all be in the
                same format: all as HTTP(S) links, all as local paths, or all as PIL images.
            subtask (`str`, *optional*):
                Segmentation task to be performed, choose [`semantic`, `instance` and `panoptic`] depending on model
                capabilities. If not set, the pipeline will attempt tp resolve in the following order:
                  `panoptic`, `instance`, `semantic`.
            threshold (`float`, *optional*, defaults to 0.9):
                Probability threshold to filter out predicted masks.
            mask_threshold (`float`, *optional*, defaults to 0.5):
                Threshold to use when turning the predicted masks into binary values.
            overlap_mask_area_threshold (`float`, *optional*, defaults to 0.5):
                Mask overlap threshold to eliminate small, disconnected segments.
            timeout (`float`, *optional*, defaults to None):
                The maximum time in seconds to wait for fetching images from the web. If None, no timeout is set and
                the call may block forever.

        Return:
            If the input is a single image, will return a list of dictionaries, if the input is a list of several images,
            will return a list of list of dictionaries corresponding to each image.

            The dictionaries contain the mask, label and score (where applicable) of each detected object and contains
            the following keys:

            - **label** (`str`) -- The class label identified by the model.
            - **mask** (`PIL.Image`) -- A binary mask of the detected object as a Pil Image of shape (width, height) of
              the original image. Returns a mask filled with zeros if no object is found.
            - **score** (*optional* `float`) -- Optionally, when the model is capable of estimating a confidence of the
              "object" described by the label and the mask.
        imagesNzICannot call the image-classification pipeline without an inputs argument!)pop
ValueErrorr   r5   )r   r0   r!   r#   s      r$   r5   z"ImageSegmentationPipeline.__call__e   sU    X vZZ))F>hiiiuww11&111r%   c                    t          ||          }|j        |j        fg}| j        j        j        j        dk    rm|i }nd|gi} | j        d
|gdd|}|                    | j	                  }| 
                    |d         d| j        j        j        d          d         |d<   n2|                     |gd          }|                    | j	                  }||d	<   |S )N)r+   OneFormerConfigtask_inputspt)r8   return_tensors
max_length)paddingr@   r?   	input_idstarget_sizer,   )r   heightwidthmodelconfigr#   __name__image_processortodtype	tokenizertask_seq_len)r   imager'   r+   rC   r!   r0   s          r$   
preprocessz$ImageSegmentationPipeline.preprocess   s
   5'222ek23:&/3DDD''3)T)X%XXQWXXFYYtz**F$(NN}%$:,9#	 %3 % %
 %F=!! ))%)NNFYYtz**F +}r%   c                 T    |                     d          } | j        di |}||d<   |S )NrC   r,   )r9   rF   )r   model_inputsrC   model_outputss       r$   _forwardz"ImageSegmentationPipeline._forward   s<    "&&}55"
22\22'2m$r%   ?      ?c                 6   d }|dv r"t          | j        d          r| j        j        }n%|dv r!t          | j        d          r| j        j        }| ||||||d                   d         }g }|d         }	|d	         D ]}
|	|
d
         k    dz  }t	          j        |                                                    t          j	                  d          }| j
        j        j        |
d                  }|
d         }|                    |||d           n|dv rt          | j        d          r| j                            ||d                   d         }g }|                                }	t          j        |	          }|D ]n}|	|k    dz  }t	          j        |                    t          j	                  d          }| j
        j        j        |         }|                    d ||d           on't!          d| dt#          | j
                             |S )N>   Npanoptic"post_process_panoptic_segmentation>   Ninstance"post_process_instance_segmentationrC   )r(   r)   r*   target_sizesr   segmentationsegments_infoid   L)modelabel_idscore)rc   labelmask>   Nsemantic"post_process_semantic_segmentation)r[   zSubtask z is not supported for model )hasattrrI   rX   rZ   r   	fromarraynumpyastypenpuint8rF   rG   id2labelappendrg   uniquer:   type)r   rR   r'   r(   r)   r*   fnoutputs
annotationr\   segmentre   rd   rc   labelss                  r$   postprocessz%ImageSegmentationPipeline.postprocess   sh    (((WT5IKo-p-p(%HBB***wt7KMq/r/r*%HB>b#-,G*=9   G J">2L"?3 R R$5<tzz||':':28'D'D3OOO
)27:3FG(!!EE4"P"PQQQQR ***wt7KMq/r/r**MMM-,H N  G J"==??LY|,,F Q Q$-4t{{28'<'<3GGG
)259!!D5$"O"OPPPP	Q ___TRVR\M]M]__```r%   )NN)NrT   rU   rU   )rH   
__module____qualname____doc___load_processor_load_image_processor_load_feature_extractor_load_tokenizerr   r/   r   r   strr   listdictr5   rO   rS   rw   __classcell__)r#   s   @r$   r   r      s       ! !F O #O' ' ' ' '9 9 9" euS-%78eCeDQUVY[^V^Q_L`eee XeqtCy4+>>q#qRVW[\`adfiai\jWkRlqqq Xq02CS	4;NNO02[^02	d38n	T$sCx.%9 :	:02 02 02 02 02 02d   ,   kn, , , , , , , ,r%   r   )typingr   r   r   rj   rl   utilsr   r   r	   r
   r   baser   r   PILr   image_utilsr   models.auto.modeling_autor   r   r   r   
get_loggerrH   loggerr   r,   r%   r$   <module>r      so   ' ' ' ' ' ' ' ' ' '     k k k k k k k k k k k k k k 4 4 4 4 4 4 4 4  )((((((             
	H	%	% ,,FFFGGD D D D D D D HGD D Dr%   