o
    h??                     @   s  d Z ddlZddlZddlZddlZddlZddlmZ ddlm	Z	 ddl
mZmZ ddlmZ ddlmZ dd	lmZ dd
lmZmZmZ ddlmZ ddlmZmZmZmZ ddlmZ ddl m!Z! ddl"m#Z# e$e%Z&eg dZ'eee'Z(de)fddZ*G dd dZ+dS )z AutoProcessor class.    N)OrderedDict   )PretrainedConfig)get_class_from_dynamic_moduleresolve_trust_remote_code)FeatureExtractionMixin)ImageProcessingMixin)TOKENIZER_CONFIG_FILE)FEATURE_EXTRACTOR_NAMEget_file_from_repologging   )_LazyAutoMapping)CONFIG_MAPPING_NAMES
AutoConfigmodel_type_to_module_name!replace_list_option_in_docstrings)AutoFeatureExtractor)AutoImageProcessor)AutoTokenizer)1)alignAlignProcessor)altclipAltCLIPProcessor)barkBarkProcessor)blipBlipProcessor)zblip-2Blip2Processor)bridgetowerBridgeTowerProcessor)chinese_clipChineseCLIPProcessor)clapClapProcessor)clipCLIPProcessor)clipsegCLIPSegProcessor)clvpClvpProcessor)flavaFlavaProcessor)fuyuFuyuProcessor)gitGitProcessor)groupvitr&   )hubertWav2Vec2Processor)ideficsIdeficsProcessor)instructblipInstructBlipProcessor)zkosmos-2Kosmos2Processor)
layoutlmv2LayoutLMv2Processor)
layoutlmv3LayoutLMv3Processor)llavaLlavaProcessor)markuplmMarkupLMProcessor)mctctMCTCTProcessor)zmgp-strMgpstrProcessor)	oneformerOneFormerProcessor)owlv2Owlv2Processor)owlvitOwlViTProcessor)
pix2structPix2StructProcessor)	pop2pianoPop2PianoProcessor)samSamProcessor)seamless_m4tSeamlessM4TProcessor)sewr3   )zsew-dr3   )speech_to_textSpeech2TextProcessor)speech_to_text_2Speech2Text2Processor)speecht5SpeechT5Processor)trocrTrOCRProcessor)tvltTvltProcessor)tvpTvpProcessor)	unispeechr3   )zunispeech-satr3   )viltViltProcessor)zvision-text-dual-encoderVisionTextDualEncoderProcessor)wav2vec2r3   )zwav2vec2-conformerr3   )wavlmr3   )whisperWhisperProcessor)xclipXCLIPProcessor
class_namec              	   C   s   t  D ]'\}}| |v r+t|}td| d}zt|| W   S  ty*   Y qw qtj	 D ]}t|dd | kr?|  S q1td}t
|| rOt|| S d S )N.ztransformers.models__name__transformers)PROCESSOR_MAPPING_NAMESitemsr   	importlibimport_modulegetattrAttributeErrorPROCESSOR_MAPPING_extra_contentvalueshasattr)ri   module_name
processorsmodule	processormain_module r|   ^/var/www/html/ai/venv/lib/python3.10/site-packages/transformers/models/auto/processing_auto.pyprocessor_class_from_namee   s$   	


r~   c                   @   s:   e Zd ZdZdd Zeeedd Ze	d
ddZ
d	S )AutoProcessora  
    This is a generic processor class that will be instantiated as one of the processor classes of the library when
    created with the [`AutoProcessor.from_pretrained`] class method.

    This class cannot be instantiated directly using `__init__()` (throws an error).
    c                 C   s   t d)Nz}AutoProcessor is designed to be instantiated using the `AutoProcessor.from_pretrained(pretrained_model_name_or_path)` method.)EnvironmentError)selfr|   r|   r}   __init__   s   zAutoProcessor.__init__c                    s|    dd}|dur tdt  dddurtd| d<   dd}  dd}d d	< d}d} fd
dttj	
 D }t|tfi |}	|	durotj|fi  \}
}|
dd}d|
di v ro|
d d }|	dur|du rtj|fi  \}
}|
dd}d|
di v r|
d d }|du rt|tfi |}|durt|dd}t|}
W d   n1 sw   Y  |
dd}d|
di v r|
d d }|du rt|tstj|fd|i }t|dd}t|drd|jv r|jd }|durt|}|du}|dupt|tv }t||||}|rI|rIt||fi  }  dd}t j!"|r>|#  |j|fd|i S |durY|j|fd|i S t|tv rmtt| j|fi  S zt$j|fd|i W S  t%y   zt&j|fd|i W  Y S  t%y   Y nw zt'j|fd|i W  Y S  t%y   Y nw Y nw td| d)a  
        Instantiate one of the processor classes of the library from a pretrained model vocabulary.

        The processor class to instantiate is selected based on the `model_type` property of the config object (either
        passed as an argument or loaded from `pretrained_model_name_or_path` if possible):

        List options

        Params:
            pretrained_model_name_or_path (`str` or `os.PathLike`):
                This can be either:

                - a string, the *model id* of a pretrained feature_extractor hosted inside a model repo on
                  huggingface.co. Valid model ids can be located at the root-level, like `bert-base-uncased`, or
                  namespaced under a user or organization name, like `dbmdz/bert-base-german-cased`.
                - a path to a *directory* containing a processor files saved using the `save_pretrained()` method,
                  e.g., `./my_model_directory/`.
            cache_dir (`str` or `os.PathLike`, *optional*):
                Path to a directory in which a downloaded pretrained model feature extractor should be cached if the
                standard cache should not be used.
            force_download (`bool`, *optional*, defaults to `False`):
                Whether or not to force to (re-)download the feature extractor files and override the cached versions
                if they exist.
            resume_download (`bool`, *optional*, defaults to `False`):
                Whether or not to delete incompletely received file. Attempts to resume the download if such a file
                exists.
            proxies (`Dict[str, str]`, *optional*):
                A dictionary of proxy servers to use by protocol or endpoint, e.g., `{'http': 'foo.bar:3128',
                'http://hostname': 'foo.bar:4012'}.` The proxies are used on each request.
            token (`str` or *bool*, *optional*):
                The token to use as HTTP bearer authorization for remote files. If `True`, will use the token generated
                when running `huggingface-cli login` (stored in `~/.huggingface`).
            revision (`str`, *optional*, defaults to `"main"`):
                The specific model version to use. It can be a branch name, a tag name, or a commit id, since we use a
                git-based system for storing models and other artifacts on huggingface.co, so `revision` can be any
                identifier allowed by git.
            return_unused_kwargs (`bool`, *optional*, defaults to `False`):
                If `False`, then this function returns just the final feature extractor object. If `True`, then this
                functions returns a `Tuple(feature_extractor, unused_kwargs)` where *unused_kwargs* is a dictionary
                consisting of the key/value pairs whose keys are not feature extractor attributes: i.e., the part of
                `kwargs` which has not been used to update `feature_extractor` and is otherwise ignored.
            trust_remote_code (`bool`, *optional*, defaults to `False`):
                Whether or not to allow for custom models defined on the Hub in their own modeling files. This option
                should only be set to `True` for repositories you trust and in which you have read the code, as it will
                execute code present on the Hub on your local machine.
            kwargs (`Dict[str, Any]`, *optional*):
                The values in kwargs of any keys which are feature extractor attributes will be used to override the
                loaded values. Behavior concerning key/value pairs whose keys are *not* feature extractor attributes is
                controlled by the `return_unused_kwargs` keyword parameter.

        <Tip>

        Passing `token=True` is required when you want to use a private model.

        </Tip>

        Examples:

        ```python
        >>> from transformers import AutoProcessor

        >>> # Download processor from huggingface.co and cache.
        >>> processor = AutoProcessor.from_pretrained("facebook/wav2vec2-base-960h")

        >>> # If processor files are in a directory (e.g. processor was saved using *save_pretrained('./test/saved_model/')*)
        >>> # processor = AutoProcessor.from_pretrained("./test/saved_model/")
        ```use_auth_tokenNzrThe `use_auth_token` argument is deprecated and will be removed in v5 of Transformers. Please use `token` instead.tokenzV`token` and `use_auth_token` are both specified. Please set only the argument `token`.configtrust_remote_codeT
_from_autoc                    s   i | ]}| v r| | qS r|   r|   ).0keykwargsr|   r}   
<dictcomp>   s    z1AutoProcessor.from_pretrained.<locals>.<dictcomp>processor_classr   auto_mapzutf-8)encodingcode_revisionz!Unrecognized processing class in z. Can't instantiate a processor, a tokenizer, an image processor or a feature extractor for this model. Make sure the repository contains the files of at least one of those processing classes.)(popwarningswarnFutureWarningget
ValueErrorinspect	signaturer   
parameterskeysr
   r   get_image_processor_dictr   get_feature_extractor_dictr	   openjsonload
isinstancer   r   from_pretrainedrq   rv   r   r~   typers   r   r   ospathisdirregister_for_auto_classr   	Exceptionr   r   )clspretrained_model_name_or_pathr   r   r   r   r   processor_auto_mapget_file_from_repo_kwargspreprocessor_config_fileconfig_dict_tokenizer_config_filereaderhas_remote_codehas_local_coder|   r   r}   r      s   F





zAutoProcessor.from_pretrainedFc                 C   s   t j| ||d dS )a  
        Register a new processor for this class.

        Args:
            config_class ([`PretrainedConfig`]):
                The configuration corresponding to the model to register.
            processor_class ([`FeatureExtractorMixin`]): The processor to register.
        )exist_okN)rs   register)config_classr   r   r|   r|   r}   r   I  s   
zAutoProcessor.registerN)F)rk   
__module____qualname____doc__r   classmethodr   rm   r   staticmethodr   r|   r|   r|   r}   r   }   s     =r   ),r   ro   r   r   r   r   collectionsr   configuration_utilsr   dynamic_module_utilsr   r   feature_extraction_utilsr   image_processing_utilsr   tokenization_utilsr	   utilsr
   r   r   auto_factoryr   configuration_autor   r   r   r   feature_extraction_autor   image_processing_autor   tokenization_autor   
get_loggerrk   loggerrm   rs   strr~   r   r|   r|   r|   r}   <module>   s2   

6