o
    eiyR                     @   s8  d Z ddlZddlZddlZddlmZ ddlmZ ddlm	Z	m
Z
 ddlmZ ddlmZ dd	lmZ dd
lmZ ddlmZmZmZmZmZ ddlmZ ddlmZ ddlmZmZm Z m!Z! ddl"m#Z# ddl$m%Z% ddl&m'Z' ddl(m)Z) e*e+Z,eg dZ-eee-Z.de/fddZ0G dd dZ1ddgZ2dS )zAutoProcessor class.    N)OrderedDict   )PreTrainedConfig)get_class_from_dynamic_moduleresolve_trust_remote_code)FeatureExtractionMixin)ImageProcessingMixin)ProcessorMixin)TOKENIZER_CONFIG_FILE)FEATURE_EXTRACTOR_NAMEPROCESSOR_NAMEVIDEO_PROCESSOR_NAMEcached_filelogging)BaseVideoProcessor   )_LazyAutoMapping)CONFIG_MAPPING_NAMES
AutoConfigmodel_type_to_module_name!replace_list_option_in_docstrings)AutoFeatureExtractor)AutoImageProcessor)AutoTokenizer)AutoVideoProcessor)})aimv2CLIPProcessor)alignAlignProcessor)altclipAltCLIPProcessor)ariaAriaProcessor)audioflamingo3AudioFlamingo3Processor)
aya_visionAyaVisionProcessor)barkBarkProcessor)blipBlipProcessor)zblip-2Blip2Processor)bridgetowerBridgeTowerProcessor)	chameleonChameleonProcessor)chinese_clipChineseCLIPProcessor)clapClapProcessor)clipr   )clipsegCLIPSegProcessor)clvpClvpProcessor)cohere2_visionCohere2VisionProcessor)colpaliColPaliProcessor)colqwen2ColQwen2Processor)deepseek_vlDeepseekVLProcessor)deepseek_vl_hybridDeepseekVLHybridProcessor)diaDiaProcessor)edgetamSam2Processor)emu3Emu3Processor)ernie4_5_vl_moeErnie4_5_VL_MoeProcessor)evollaEvollaProcessor)flavaFlavaProcessor)	florence2Florence2Processor)fuyuFuyuProcessor)gemma3Gemma3Processor)gemma3nGemma3nProcessor)gitGitProcessor)glm46vGlm46VProcessor)glm4vGlm4vProcessor)	glm4v_moer\   )	glm_imager\   )glmasrGlmAsrProcessor)got_ocr2GotOcr2Processor)granite_speechGraniteSpeechProcessor)zgrounding-dinoGroundingDinoProcessor)groupvitr   )hubertWav2Vec2Processor)ideficsIdeficsProcessor)idefics2Idefics2Processor)idefics3Idefics3Processor)instructblipInstructBlipProcessor)instructblipvideoInstructBlipVideoProcessor)internvlInternVLProcessor)janusJanusProcessor)zkosmos-2Kosmos2Processor)z
kosmos-2.5Kosmos2_5Processor)kyutai_speech_to_textKyutaiSpeechToTextProcessor)lasr_ctcLasrProcessor)lasr_encoderr|   )
layoutlmv2LayoutLMv2Processor)
layoutlmv3LayoutLMv3Processor)	layoutxlmLayoutXLMProcessor)lfm2_vlLfm2VlProcessor)lighton_ocrLightOnOcrProcessor)llama4Llama4Processor)llavaLlavaProcessor)
llava_nextLlavaNextProcessor)llava_next_videoLlavaNextVideoProcessor)llava_onevisionLlavaOnevisionProcessor)markuplmMarkupLMProcessor)
metaclip_2r   )zmgp-strMgpstrProcessor)mistral3PixtralProcessor)mllamaMllamaProcessor)zmm-grounding-dinore   )	moonshinerh   )moonshine_streamingMoonshineStreamingProcessor)zomdet-turboOmDetTurboProcessor)	oneformerOneFormerProcessor)ovis2Ovis2Processor)owlv2Owlv2Processor)owlvitOwlViTProcessor)paddleocr_vlPaddleOCRVLProcessor)	paligemmaPaliGemmaProcessor)perception_lmPerceptionLMProcessor)phi4_multimodalPhi4MultimodalProcessor)
pix2structPix2StructProcessor)pixtralr   )	pop2pianoPop2PianoProcessor)qwen2_5_omniQwen2_5OmniProcessor)
qwen2_5_vlQwen2_5_VLProcessor)qwen2_audioQwen2AudioProcessor)qwen2_vlQwen2VLProcessor)qwen3_5Qwen3VLProcessor)qwen3_5_moer   )qwen3_omni_moeQwen3OmniMoeProcessor)qwen3_vlr   )qwen3_vl_moer   )samSamProcessor)sam2rF   )sam3Sam3Processor)sam_hqSamHQProcessor)seamless_m4tSeamlessM4TProcessor)sewrh   )zsew-drh   )shieldgemma2ShieldGemma2Processor)siglipSiglipProcessor)siglip2Siglip2Processor)smolvlmSmolVLMProcessor)speech_to_textSpeech2TextProcessor)speecht5SpeechT5Processor)t5gemma2rT   )t5gemma2_encoderrT   )trocrTrOCRProcessor)tvpTvpProcessor)udopUdopProcessor)	unispeechrh   )zunispeech-satrh   )video_llavaVideoLlavaProcessor)viltViltProcessor)vipllavar   )zvision-text-dual-encoderVisionTextDualEncoderProcessor)voxtralVoxtralProcessor)voxtral_realtimeVoxtralRealtimeProcessor)wav2vec2rh   )zwav2vec2-bertrh   )zwav2vec2-conformerrh   )wavlmrh   )whisperWhisperProcessor)xclipXCLIPProcessor
class_namec              	   C   s   t  D ]'\}}| |v r+t|}td| d}zt|| W   S  ty*   Y qw qtj	 D ]}t|dd | kr?|  S q1td}t
|| rOt|| S d S )N.ztransformers.models__name__transformers)PROCESSOR_MAPPING_NAMESitemsr   	importlibimport_modulegetattrAttributeErrorPROCESSOR_MAPPING_extra_contentvalueshasattr)r   module_name
processorsmodule	processormain_module r  f/home/ubuntu/transcripts/venv/lib/python3.10/site-packages/transformers/models/auto/processing_auto.pyprocessor_class_from_name   s$   	


r  c                   @   s:   e Zd ZdZdd Zeeedd Ze	d
ddZ
d	S )AutoProcessora  
    This is a generic processor class that will be instantiated as one of the processor classes of the library when
    created with the [`AutoProcessor.from_pretrained`] class method.

    This class cannot be instantiated directly using `__init__()` (throws an error).
    c                 C   s   t d)Nz}AutoProcessor is designed to be instantiated using the `AutoProcessor.from_pretrained(pretrained_model_name_or_path)` method.)OSError)selfr  r  r  __init__   s   zAutoProcessor.__init__c              	      s    dd}  dd}d d< d}d} fddttjD }|dddd	 t|tfi |}|durUtj|fi  \}	}
|		d
}d|		di v rU|	d d }|du rt|t
fi |}|durtj|fi  \}	}
|		d
d}d|		di v r|	d d }|du rt|tfi |}|durtj|fi  \}	}
|		d
d}d|		di v r|	d d }|du rt|t
fi |}|dur|du rtj|fi  \}	}
|		d
d}d|		di v r|	d d }|du r-t|tfi |}|dur-t|dd}t|}	W d   n	1 sw   Y  |		d
d}d|		di v r-|	d d }|du rgz*t|tsDtj|fd|i }t|d
d}t|dr[d|jv r[|jd }W n
 tyf   Y nw |durpt|}|du}|dup~t|t v }|rd|v r|!dd }nd}t"|||||}|r|rt#||fi  }  dd}
|$  |j|fd|i S |dur|j|fd|i S t|t v rt t| j|fi  S t%t&t't(fD ]}z|j|fd|i W   S  t)y   Y qw td| d)a3  
        Instantiate one of the processor classes of the library from a pretrained model vocabulary.

        The processor class to instantiate is selected based on the `model_type` property of the config object (either
        passed as an argument or loaded from `pretrained_model_name_or_path` if possible):

        List options

        Params:
            pretrained_model_name_or_path (`str` or `os.PathLike`):
                This can be either:

                - a string, the *model id* of a pretrained feature_extractor hosted inside a model repo on
                  huggingface.co.
                - a path to a *directory* containing a processor files saved using the `save_pretrained()` method,
                  e.g., `./my_model_directory/`.
            cache_dir (`str` or `os.PathLike`, *optional*):
                Path to a directory in which a downloaded pretrained model feature extractor should be cached if the
                standard cache should not be used.
            force_download (`bool`, *optional*, defaults to `False`):
                Whether or not to force to (re-)download the feature extractor files and override the cached versions
                if they exist.
            proxies (`dict[str, str]`, *optional*):
                A dictionary of proxy servers to use by protocol or endpoint, e.g., `{'http': 'foo.bar:3128',
                'http://hostname': 'foo.bar:4012'}.` The proxies are used on each request.
            token (`str` or *bool*, *optional*):
                The token to use as HTTP bearer authorization for remote files. If `True`, will use the token generated
                when running `hf auth login` (stored in `~/.huggingface`).
            revision (`str`, *optional*, defaults to `"main"`):
                The specific model version to use. It can be a branch name, a tag name, or a commit id, since we use a
                git-based system for storing models and other artifacts on huggingface.co, so `revision` can be any
                identifier allowed by git.
            return_unused_kwargs (`bool`, *optional*, defaults to `False`):
                If `False`, then this function returns just the final feature extractor object. If `True`, then this
                functions returns a `Tuple(feature_extractor, unused_kwargs)` where *unused_kwargs* is a dictionary
                consisting of the key/value pairs whose keys are not feature extractor attributes: i.e., the part of
                `kwargs` which has not been used to update `feature_extractor` and is otherwise ignored.
            trust_remote_code (`bool`, *optional*, defaults to `False`):
                Whether or not to allow for custom models defined on the Hub in their own modeling files. This option
                should only be set to `True` for repositories you trust and in which you have read the code, as it will
                execute code present on the Hub on your local machine.
            kwargs (`dict[str, Any]`, *optional*):
                The values in kwargs of any keys which are feature extractor attributes will be used to override the
                loaded values. Behavior concerning key/value pairs whose keys are *not* feature extractor attributes is
                controlled by the `return_unused_kwargs` keyword parameter.

        <Tip>

        Passing `token=True` is required when you want to use a private model.

        </Tip>

        Examples:

        ```python
        >>> from transformers import AutoProcessor

        >>> # Download processor from huggingface.co and cache.
        >>> processor = AutoProcessor.from_pretrained("facebook/wav2vec2-base-960h")

        >>> # If processor files are in a directory (e.g. processor was saved using *save_pretrained('./test/saved_model/')*)
        >>> # processor = AutoProcessor.from_pretrained("./test/saved_model/")
        ```configNtrust_remote_codeT
_from_autoc                    s   i | ]}| v r| | qS r  r  ).0keykwargsr  r  
<dictcomp>#  s    z1AutoProcessor.from_pretrained.<locals>.<dictcomp>F) _raise_exceptions_for_gated_repo%_raise_exceptions_for_missing_entries'_raise_exceptions_for_connection_errorsprocessor_classr  auto_mapzutf-8)encodingz--r   code_revisionz!Unrecognized processing class in z. Can't instantiate a processor, a tokenizer, an image processor, a video processor or a feature extractor for this model. Make sure the repository contains the files of at least one of those processing classes.)*popinspect	signaturer   
parametersupdater   r	   get_processor_dictgetr   r   get_image_processor_dictr   r   get_video_processor_dictr   get_feature_extractor_dictr
   openjsonload
isinstancer   r   from_pretrainedr   r   r  
ValueErrorr  typer   splitr   r   register_for_auto_classr   r   r   r   	Exception)clspretrained_model_name_or_pathr  r  r  r  processor_auto_mapcached_file_kwargsprocessor_config_fileconfig_dict_preprocessor_config_filetokenizer_config_filereaderhas_remote_codehas_local_codeupstream_repoklassr  r  r  r(     s  B	











zAutoProcessor.from_pretrainedFc                 C   s   t j| ||d dS )a  
        Register a new processor for this class.

        Args:
            config_class ([`PreTrainedConfig`]):
                The configuration corresponding to the model to register.
            processor_class ([`ProcessorMixin`]): The processor to register.
        )exist_okN)r   register)config_classr  r<  r  r  r  r=    s   
zAutoProcessor.registerN)F)r   
__module____qualname____doc__r
  classmethodr   r   r(  staticmethodr=  r  r  r  r  r     s     Pr  r   )3rA  r   r  r%  collectionsr   configuration_utilsr   dynamic_module_utilsr   r   feature_extraction_utilsr   image_processing_utilsr   processing_utilsr	   tokenization_pythonr
   utilsr   r   r   r   r   video_processing_utilsr   auto_factoryr   configuration_autor   r   r   r   feature_extraction_autor   image_processing_autor   tokenization_autor   video_processing_autor   
get_loggerr   loggerr   r   strr  r  __all__r  r  r  r  <module>   s:   
 
 m