
    Ig                        d dl Z d dlmZmZmZmZ ddlmZmZm	Z	m
Z
mZ ddlmZmZ  e	       rddlmZ  e       rd dlZddlmZmZ  e
j*                  e      Zeeef   Zee   Z e ed	
             G d de             Zy)    N)AnyDictListUnion   )add_end_docstringsis_torch_availableis_vision_availableloggingrequires_backends   )Pipelinebuild_pipeline_init_args)
load_image)(MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMES,MODEL_FOR_TOKEN_CLASSIFICATION_MAPPING_NAMEST)has_image_processorc                   x     e Zd ZdZ fdZd Zdeeee	   f   f fdZ
ddZd ZddZd	d
deeef   fdZ xZS )ObjectDetectionPipelinea  
    Object detection pipeline using any `AutoModelForObjectDetection`. This pipeline predicts bounding boxes of objects
    and their classes.

    Example:

    ```python
    >>> from transformers import pipeline

    >>> detector = pipeline(model="facebook/detr-resnet-50")
    >>> detector("https://huggingface.co/datasets/Narsil/image_dummy/raw/main/parrots.png")
    [{'score': 0.997, 'label': 'bird', 'box': {'xmin': 69, 'ymin': 171, 'xmax': 396, 'ymax': 507}}, {'score': 0.999, 'label': 'bird', 'box': {'xmin': 398, 'ymin': 105, 'xmax': 767, 'ymax': 507}}]

    >>> # x, y  are expressed relative to the top left hand corner.
    ```

    Learn more about the basics of using a pipeline in the [pipeline tutorial](../pipeline_tutorial)

    This object detection pipeline can currently be loaded from [`pipeline`] using the following task identifier:
    `"object-detection"`.

    See the list of available models on [huggingface.co/models](https://huggingface.co/models?filter=object-detection).
    c                     t        |   |i | | j                  dk(  rt        d| j                   d      t        | d       t        j                         }|j                  t               | j                  |       y )NtfzThe z is only available in PyTorch.vision)super__init__	framework
ValueError	__class__r   r   copyupdater   check_model_type)selfargskwargsmappingr   s       d/var/www/html/answerous/venv/lib/python3.12/site-packages/transformers/pipelines/object_detection.pyr   z ObjectDetectionPipeline.__init__5   sn    $)&)>>T!tDNN#33QRSS$):??ACDg&    c                 x    i }d|v r"t        j                  dt               |d   |d<   i }d|v r|d   |d<   |i |fS )NtimeoutzUThe `timeout` argument is deprecated and will be removed in version 5 of Transformers	threshold)warningswarnFutureWarning)r!   r#   preprocess_paramspostprocess_kwargss       r%   _sanitize_parametersz,ObjectDetectionPipeline._sanitize_parameters@   s`    MMgiv ,2)+<i(& .4[.A{+ "&888r&   returnc                 Z    d|v rd|vr|j                  d      |d<   t        |   |i |S )a  
        Detect objects (bounding boxes & classes) in the image(s) passed as inputs.

        Args:
            inputs (`str`, `List[str]`, `PIL.Image` or `List[PIL.Image]`):
                The pipeline handles three types of images:

                - A string containing an HTTP(S) link pointing to an image
                - A string containing a local path to an image
                - An image loaded in PIL directly

                The pipeline accepts either a single image or a batch of images. Images in a batch must all be in the
                same format: all as HTTP(S) links, all as local paths, or all as PIL images.
            threshold (`float`, *optional*, defaults to 0.5):
                The probability necessary to make a prediction.

        Return:
            A list of dictionaries or a list of list of dictionaries containing the result. If the input is a single
            image, will return a list of dictionaries, if the input is a list of several images, will return a list of
            list of dictionaries corresponding to each image.

            The dictionaries contain the following keys:

            - **label** (`str`) -- The class label identified by the model.
            - **score** (`float`) -- The score attributed by the model for that label.
            - **box** (`List[Dict[str, int]]`) -- The bounding box of detected object in image's original size.
        imagesinputs)popr   __call__)r!   r"   r#   r   s      r%   r5   z ObjectDetectionPipeline.__call__L   s<    : v(&"8%zz(3F8w000r&   c                 J   t        ||      }t        j                  |j                  |j                  gg      }| j                  |gd      }| j                  dk(  r|j                  | j                        }| j                  | j                  |d   |d   d      }||d<   |S )N)r(   pt)r2   return_tensorswordsboxes)textr:   r8   target_size)
r   torch	IntTensorheightwidthimage_processorr   totorch_dtype	tokenizer)r!   imager(   r<   r3   s        r%   
preprocessz"ObjectDetectionPipeline.preprocessm   s    5'2ooekk'B&CD%%eWT%J>>T!YYt//0F>>%^^w`d^eF +}r&   c                     |j                  d      } | j                  di |}|j                  d|i|      }| j                  |d   |d<   |S )Nr<   bbox )r4   modelr   rD   )r!   model_inputsr<   outputsmodel_outputss        r%   _forwardz ObjectDetectionPipeline._forwardx   s^    "&&}5$**,|,))=+*Q*QR>>%$0$8M&!r&   c           	      6    |d   } j                   |d   j                         \   fd}|d   j                  d      j                  d      j	                  d      \  }}|j                         D cg c]%  } j
                  j                  j                  |   ' }}|d   j                  d      D 	cg c]
  }	 ||	       }
}	g d}t        |j                         ||
      D cg c]   }|d   |kD  st        t        ||            " }}|S  j                  j                  |||      }|d   }|d	   }|d
   }|d   }
|j                         |d	<   |D cg c]3  } j
                  j                  j                  |j                            5 c}|d
<   |
D cg c]  } j                  |       c}|d<   g d}t        |d	   |d
   |d         D cg c]  }t        t        ||             }}|S c c}w c c}	w c c}w c c}w c c}w c c}w )Nr<   r   c           
          j                  t        j                  | d   z  dz  | d   z  dz  | d   z  dz  | d   z  dz  g            S )Nr   i  r   r      )_get_bounding_boxr=   Tensor)rH   r?   r!   r@   s    r%   unnormalizez8ObjectDetectionPipeline.postprocess.<locals>.unnormalize   si    --LL"T!W_t3#d1g-4"T!W_t3#d1g-4		 	r&   logits)dimrH   )scorelabelboxscoreslabelsr:   )rD   tolistsqueezesoftmaxmaxrJ   configid2labelzipdictrA   post_process_object_detectionitemrR   )r!   rM   r)   r<   rT   r[   classes
predictionr\   rH   r:   keysvals
annotationraw_annotationsraw_annotationrY   rZ   r?   r@   s   `                 @@r%   postprocessz#ObjectDetectionPipeline.postprocess   s$   #M2>>% (N113MFE
 ,H5==a@HHRHPTTY[T\OFGOV~~O_`djj''00<`F`3@3H3P3PQR3ST4[&TET,D<?QWY^<_wDcghicjmvcv$s4/wJw( # #22PPQ^`ikvwO,Q/N#H-F#H-F"7+E'-}}N8$^d'eUZ

(9(9(B(B5::<(P'eN8$NS&Tst'='=c'B&TN7# -D  x 8.:RTbcjTkl St_%J 
 / aTw (f&Ts*   <*G=>H0H>H!8H#HHrZ   ztorch.Tensorc                     | j                   dk7  rt        d      |j                         j                         \  }}}}||||d}|S )a%  
        Turns list [xmin, xmax, ymin, ymax] into dict { "xmin": xmin, ... }

        Args:
            box (`torch.Tensor`): Tensor containing the coordinates in corners format.

        Returns:
            bbox (`Dict[str, int]`): Dict containing the coordinates in corners format.
        r7   z9The ObjectDetectionPipeline is only available in PyTorch.)xminyminxmaxymax)r   r   intr]   )r!   rZ   rp   rq   rr   rs   rH   s          r%   rR   z)ObjectDetectionPipeline._get_bounding_box   sS     >>T!XYY!$!1!1!3dD$	
 r&   )N)g      ?)__name__
__module____qualname____doc__r   r/   r   Predictionsr   
Predictionr5   rF   rN   rn   r   strrt   rR   __classcell__)r   s   @r%   r   r      sY    0	'
915d:>N1N+O 1B	+Z^ S#X r&   r   )r*   typingr   r   r   r   utilsr   r	   r
   r   r   baser   r   image_utilsr   r=   models.auto.modeling_autor   r   
get_loggerru   loggerr{   rz   ry   r   rI   r&   r%   <module>r      s     ) ) k k 4 ( 
 
		H	% #s(^
: ,FGdh d Hdr&   