Ë
    «q±i*  ã                   ó<   — d dl mZ ddlmZmZ  G d„ de«      ZdgZy)é   )ÚPreTrainedConfigé   )ÚCONFIG_MAPPINGÚ
AutoConfigc                   óJ   ‡ — e Zd ZdZdZeedœZdgZ	 	 	 	 	 	 	 	 	 dˆ fd„	Zˆ xZ	S )ÚGlm46VConfigaÖ  
    This is the configuration class to store the configuration of a [`Glm4vModel`]. It is used to instantiate a
    GLM-4.6V model according to the specified arguments, defining the model architecture. Instantiating a
    configuration with the defaults will yield a similar configuration to that of
    GLM-4.1V-9B-Thinking [zai-org/GLM-4.1V-9B-Thinking](https://huggingface.co/zai-org/GLM-4.1V-9B-Thinking).

    Configuration objects inherit from [`PreTrainedConfig`] and can be used to control the model outputs. Read the
    documentation from [`PreTrainedConfig`] for more information.

    Args:
        text_config (`Union[PreTrainedConfig, dict]`, *optional*, defaults to `Glm4vTextConfig`):
            The config object or dictionary of the text backbone.
        vision_config (`Union[PreTrainedConfig, dict]`,  *optional*, defaults to `Glm4vVisionConfig`):
            The config object or dictionary of the vision backbone.
        image_token_id (`int`, *optional*, defaults to 151343):
            The image token index to encode the image prompt.
        video_token_id (`int`, *optional*, defaults to 151344):
            The video token index to encode the image prompt.
        image_start_token_id (`int`, *optional*, defaults to 151339):
            The image start token index to encode the start of image.
        image_end_token_id (`int`, *optional*, defaults to 151340):
            The image end token index to encode the end of image.
        video_start_token_id (`int`, *optional*, defaults to 151361):
            The video start token index to encode the start of video.
        video_end_token_id (`int`, *optional*, defaults to 151362):
            The video end token index to encode the end of video.
        tie_word_embeddings (`bool`, *optional*, defaults to `False`):
            Whether to tie weight embeddings

    ```python
    >>> from transformers import Glm46VForConditionalGeneration, Glm46VConfig

    >>> # Initializing a GLM-4.6V style configuration
    >>> configuration = Glm46VConfig()

    >>> # Initializing a model from the GLM-4.6V style configuration
    >>> model = Glm4vForConditionalGeneration(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```Úglm46v)Útext_configÚvision_configÚpast_key_valuesc
                 óÆ  •— t        |t        «      r,|j                  dd«      |d<   t        |d      di |¤Ž| _        n|€t        d   «       | _        t        |t        «      r,|j                  dd«      |d<   t        |d      di |¤Ž| _        n|€t        d   «       | _        || _        || _        || _        || _	        || _
        || _        |	| _        t        ‰| 8  di |
¤Ž y )NÚ
model_typeÚglm4v_visionÚ
glm4v_text© )Ú
isinstanceÚdictÚgetr   r   r
   Úimage_token_idÚvideo_token_idÚvideo_start_token_idÚvideo_end_token_idÚimage_start_token_idÚimage_end_token_idÚtie_word_embeddingsÚsuperÚ__init__)Úselfr
   r   r   r   r   r   r   r   r   ÚkwargsÚ	__class__s              €úa/opt/pipecat/venv/lib/python3.12/site-packages/transformers/models/glm46v/configuration_glm46v.pyr   zGlm46VConfig.__init__I   sí   ø€ ô m¤TÔ*Ø*7×*;Ñ*;¸LÈ.Ó*YˆM˜,Ñ'Ü!/°¸lÑ0KÑ!LÑ!]È}Ñ!]ˆDÕØÐ"Ü!/°Ñ!?Ó!AˆDÔäk¤4Ô(Ø(3¯©¸ÀlÓ(SˆK˜Ñ%Ü-¨k¸,Ñ.GÑHÑWÈ;ÑWˆDÕØÐ Ü-¨lÑ;Ó=ˆDÔà,ˆÔØ,ˆÔØ$8ˆÔ!Ø"4ˆÔØ$8ˆÔ!Ø"4ˆÔØ#6ˆÔ ä‰ÑÑ"˜6Ó"ó    )	NNi/O i0O i+O i,O iAO iBO F)
Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   r   Úsub_configsÚkeys_to_ignore_at_inferencer   Ú__classcell__)r    s   @r!   r   r      sJ   ø„ ñ(ðT €JØ",¸zÑJ€KØ#4Ð"5Ðð ØØØØ#Ø!Ø#Ø!Ø!÷!#ñ !#r"   r   N)Úconfiguration_utilsr   Úautor   r   r   Ú__all__r   r"   r!   ú<module>r-      s'   ðõ, 4ß -ôP#Ð#ô P#ðf Ð
r"   