
    g                         d Z ddlZddlmZmZmZ ddlmZ ddlm	Z	 ddl
mZmZmZmZmZ ddlmZ  G d	 d
e	          ZdS )z&
Image/Text processor class for FLAVA
    N)ListOptionalUnion   )
ImageInput)ProcessorMixin)BatchEncodingPaddingStrategyPreTokenizedInput	TextInputTruncationStrategy)
TensorTypec            (           e Zd ZdZddgZdZdZd# fd	Z	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 d$dee	         dee
eeee         ee         f                  dede
eeef         de
eeef         dee         dedee         dee         dee         dee         dee         dedededededee
eef                  f$dZd Zd Zed              Zed!             Zed"             Z xZS )%FlavaProcessora  
    Constructs a FLAVA processor which wraps a FLAVA image processor and a FLAVA tokenizer into a single processor.

    [`FlavaProcessor`] offers all the functionalities of [`FlavaImageProcessor`] and [`BertTokenizerFast`]. See the
    [`~FlavaProcessor.__call__`] and [`~FlavaProcessor.decode`] for more information.

    Args:
        image_processor ([`FlavaImageProcessor`], *optional*): The image processor is a required input.
        tokenizer ([`BertTokenizerFast`], *optional*): The tokenizer is a required input.
    image_processor	tokenizerFlavaImageProcessor)BertTokenizerBertTokenizerFastNc                    d }d|v r/t          j        dt                     |                    d          }||n|}|t	          d          |t	          d          t                                          ||           | j        | _        d S )Nfeature_extractorzhThe `feature_extractor` argument is deprecated and will be removed in v5, use `image_processor` instead.z)You need to specify an `image_processor`.z"You need to specify a `tokenizer`.)	warningswarnFutureWarningpop
ValueErrorsuper__init__r   current_processor)selfr   r   kwargsr   	__class__s        f/var/www/html/ai-engine/env/lib/python3.11/site-packages/transformers/models/flava/processing_flava.pyr   zFlavaProcessor.__init__,   s     &((M  
 !'

+> ? ?-<-H//N_"HIIIABBB)444!%!5    TFr   imagestextadd_special_tokenspadding
truncation
max_lengthstridepad_to_multiple_ofreturn_image_maskreturn_codebook_pixelsreturn_token_type_idsreturn_attention_maskreturn_overflowing_tokensreturn_special_tokens_maskreturn_offsets_mappingreturn_lengthverbosereturn_tensorsc                    ||t          d          | | j        d|||||||||||||||d|}| | j        |f|	|
|d|}|||                    |           |S ||S t	          t          di ||          S )a  
        This method uses [`FlavaImageProcessor.__call__`] method to prepare image(s) for the model, and
        [`BertTokenizerFast.__call__`] to prepare text for the model.

        Please refer to the docstring of the above two methods for more information.
        Nz?You have to specify either text or images. Both cannot be none.)r&   r'   r(   r)   r*   r+   r,   r/   r0   r1   r2   r3   r4   r5   r6   )r-   r.   r6   )datatensor_type )r   r   r   updater	   dict)r    r%   r&   r'   r(   r)   r*   r+   r,   r-   r.   r/   r0   r1   r2   r3   r4   r5   r6   r!   encodingimage_featuress                         r#   __call__zFlavaProcessor.__call__?   s   : <FN^___%t~ #5%%#5&;&;*C+E'=+-   ! H$ 1T1"3'=-	 
  N  2OON+++OO d&<&<^&<&<.YYYYr$   c                 &     | j         j        |i |S )z
        This method forwards all its arguments to BertTokenizerFast's [`~PreTrainedTokenizer.batch_decode`]. Please
        refer to the docstring of this method for more information.
        )r   batch_decoder    argsr!   s      r#   rA   zFlavaProcessor.batch_decode   s    
 +t~*D;F;;;r$   c                 &     | j         j        |i |S )z
        This method forwards all its arguments to BertTokenizerFast's [`~PreTrainedTokenizer.decode`]. Please refer to
        the docstring of this method for more information.
        )r   decoderB   s      r#   rE   zFlavaProcessor.decode   s    
 %t~$d5f555r$   c                     | j         j        }| j        j        }t          t                              ||z                       S )N)r   model_input_namesr   listr<   fromkeys)r    tokenizer_input_namesimage_processor_input_namess      r#   rG   z FlavaProcessor.model_input_names   s:     $ @&*&:&L#DMM"7:U"UVVWWWr$   c                 D    t          j        dt                     | j        S )Nzg`feature_extractor_class` is deprecated and will be removed in v5. Use `image_processor_class` instead.)r   r   r   image_processor_classr    s    r#   feature_extractor_classz&FlavaProcessor.feature_extractor_class   s'    u	
 	
 	
 ))r$   c                 D    t          j        dt                     | j        S )Nz[`feature_extractor` is deprecated and will be removed in v5. Use `image_processor` instead.)r   r   r   r   rN   s    r#   r   z FlavaProcessor.feature_extractor   s'    i	
 	
 	
 ##r$   )NN)NNTFFNr   NNNNNFFFFTN)__name__
__module____qualname____doc__
attributesrM   tokenizer_classr   r   r   r   r   r   r   boolstrr
   r   intr   r?   rA   rE   propertyrG   rO   r   __classcell__)r"   s   @r#   r   r      sd       	 	 $[1J1<O6 6 6 6 6 6* (,hl#'5:;@$(,0,0150404*/+0',#;?'BZ BZ$BZ uY(94	?DQbLccdeBZ !	BZ
 tS/12BZ $%778BZ SMBZ BZ %SMBZ $D>BZ !)BZ  (~BZ  (~BZ $(BZ %)BZ  !%!BZ" #BZ$ %BZ& !sJ!78'BZ BZ BZ BZH< < <6 6 6 X X XX
 * * X* $ $ X$ $ $ $ $r$   r   )rT   r   typingr   r   r   image_utilsr   processing_utilsr   tokenization_utils_baser	   r
   r   r   r   utilsr   r   r:   r$   r#   <module>ra      s      ( ( ( ( ( ( ( ( ( ( % % % % % % . . . . . . w w w w w w w w w w w w w w      I$ I$ I$ I$ I$^ I$ I$ I$ I$ I$r$   