
    qi$                     ,    d dl mZ  G d de      ZdgZy)   )PreTrainedConfigc            1            e Zd ZdZdZ	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 ddee   dz  dee   dz  dee   dz  deded	ed
edededededede	dede	dededededede
dz  dededef0 fdZ xZS )EfficientLoFTRConfigad  
    This is the configuration class to store the configuration of a [`EfficientLoFTRFromKeypointMatching`].
    It is used to instantiate a EfficientLoFTR model according to the specified arguments, defining the model
    architecture. Instantiating a configuration with the defaults will yield a similar configuration to that of the
    EfficientLoFTR [zju-community/efficientloftr](https://huggingface.co/zju-community/efficientloftr) architecture.

    Configuration objects inherit from [`PreTrainedConfig`] and can be used to control the model outputs. Read the
    documentation from [`PreTrainedConfig`] for more information.

    Args:
        stage_num_blocks (`List`, *optional*, defaults to [1, 2, 4, 14]):
            The number of blocks in each stages
        out_features (`List`, *optional*, defaults to [64, 64, 128, 256]):
            The number of channels in each stage
        stage_stride (`List`, *optional*, defaults to [2, 1, 2, 2]):
            The stride used in each stage
        hidden_size (`int`, *optional*, defaults to 256):
            The dimension of the descriptors.
        activation_function (`str`, *optional*, defaults to `"relu"`):
            The activation function used in the backbone
        q_aggregation_kernel_size (`int`, *optional*, defaults to 4):
            The kernel size of the aggregation of query states in the fusion network
        kv_aggregation_kernel_size (`int`, *optional*, defaults to 4):
            The kernel size of the aggregation of key and value states in the fusion network
        q_aggregation_stride (`int`, *optional*, defaults to 4):
            The stride of the aggregation of query states in the fusion network
        kv_aggregation_stride (`int`, *optional*, defaults to 4):
            The stride of the aggregation of key and value states in the fusion network
        num_attention_layers (`int`, *optional*, defaults to 4):
            Number of attention layers in the LocalFeatureTransformer
        num_attention_heads (`int`, *optional*, defaults to 8):
            The number of heads in the GNN layers.
        attention_dropout (`float`, *optional*, defaults to 0.0):
            The dropout ratio for the attention probabilities.
        attention_bias (`bool`, *optional*, defaults to `False`):
            Whether to use a bias in the query, key, value and output projection layers during attention.
        mlp_activation_function (`str`, *optional*, defaults to `"leaky_relu"`):
            Activation function used in the attention mlp layer.
        coarse_matching_skip_softmax (`bool`, *optional*, defaults to `False`):
            Whether to skip softmax or not at the coarse matching step.
        coarse_matching_threshold (`float`, *optional*, defaults to 0.2):
            The threshold for the minimum score required for a match.
        coarse_matching_temperature (`float`, *optional*, defaults to 0.1):
            The temperature to apply to the coarse similarity matrix
        coarse_matching_border_removal (`int`, *optional*, defaults to 2):
            The size of the border to remove during coarse matching
        fine_kernel_size (`int`, *optional*, defaults to 8):
            Kernel size used for the fine feature matching
        batch_norm_eps (`float`, *optional*, defaults to 1e-05):
            The epsilon used by the batch normalization layers
        rope_parameters (`RopeParameters`, *optional*):
            Dictionary containing the configuration parameters for the RoPE embeddings. The dictionary should contain
            a value for `rope_theta` and optionally parameters used for scaling in case you want to use RoPE
            with longer `max_position_embeddings`.
        fine_matching_slice_dim (`int`, *optional*, defaults to 8):
            The size of the slice used to divide the fine features for the first and second fine matching stages.
        fine_matching_regress_temperature (`float`, *optional*, defaults to 10.0):
            The temperature to apply to the fine similarity matrix
        initializer_range (`float`, *optional*, defaults to 0.02):
            The standard deviation of the truncated_normal_initializer for initializing all weight matrices.

    Examples:
        ```python
        >>> from transformers import EfficientLoFTRConfig, EfficientLoFTRForKeypointMatching

        >>> # Initializing a EfficientLoFTR configuration
        >>> configuration = EfficientLoFTRConfig()

        >>> # Initializing a model from the EfficientLoFTR configuration
        >>> model = EfficientLoFTRForKeypointMatching(configuration)

        >>> # Accessing the model configuration
        >>> configuration = model.config
        ```
    efficientloftrNstage_num_blocksout_featuresstage_stridehidden_sizeactivation_functionq_aggregation_kernel_sizekv_aggregation_kernel_sizeq_aggregation_stridekv_aggregation_stridenum_attention_layersnum_attention_headsattention_dropoutattention_biasmlp_activation_functioncoarse_matching_skip_softmaxcoarse_matching_thresholdcoarse_matching_temperaturecoarse_matching_border_removalfine_kernel_sizebatch_norm_epsrope_parametersfine_matching_slice_dim!fine_matching_regress_temperatureinitializer_rangec                    ||ng d| _         ||ng d| _        ||ng d| _        dg| j                  d d z   | _        t	        | j                  | j                         D cg c]  \  }}|gdg|dz
  z  z    c}}| _        t        | j                         D cg c]  \  }}| j                  |   g|z   c}}| _        t        t        | j                               D cg c]%  }| j                  |   g| j                  |   d d z   ' c}| _
        t        t        | j                              d d | _        || _        | j                  | j                  d   k7  r(t        d| j                   d| j                  d          || _        || _        || _        || _        |	| _        |
| _        || _        || _        || _        | j                  dz  | _        || _        || _        || _        || _        || _        || _        || _         || _!        || _"        || _#        || _$        || _%        |jM                  d	d
       tO        |   di | y c c}}w c c}}w c c}w )N)            )r!   r    r!   r!   )@   r$         r    zMhidden_size should be equal to the last value in out_features. hidden_size = z, out_features = r!   partial_rotary_factorg      @ ))r   r	   r   stage_in_channelszipstage_block_stride	enumeratestage_block_out_channelsrangelenstage_block_in_channelslistreversedfine_fusion_dimsr
   
ValueErrorr   r   r   r   r   r   r   r   r   intermediate_sizer   r   r   r   r   r   r   r   r   num_key_value_headsr   r   
setdefaultsuper__init__)selfr   r   r	   r
   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   kwargsstride
num_blocks	stage_idx	__class__s                                q/opt/pipecat/venv/lib/python3.12/site-packages/transformers/models/efficientloftr/configuration_efficientloftr.pyr:   zEfficientLoFTRConfig.__init__a   s   : 5E4P 0Vc,8,DL,,8,DLJ\"#t'8'8"'=!= ILDL]L]_c_t_tHu#
2D&*VHsj1n--#
 V__c_t_tUu)
<QIzTy)*Z7)
%
 #3t'<'<#=>(
 ##I./$2O2OPY2Z[^\^2__(
$ !%Xd.?.?%@ A#2 F&t0044_`d`p`p_q  rC  DH  DU  DU  VX  DY  CZ  [  $7 )B&*D'$8!%:"$8!#6 !2,!%!1!1A!5'>$,H))B&+F(.L+ 0,'>$1R.#6 !2.137"6"[#
)
(
s   $II"*I)NNNr&   relur"   r"   r"   r"   r"      g        F
leaky_reluFg?g?r!   rC   gh㈵>NrC   g      $@g{Gz?)__name__
__module____qualname____doc__
model_typer2   intstrfloatbooldictr:   __classcell__)r@   s   @rA   r   r      s   JX "J .2)-)-#))**+$%%&$%#$#&$'3-2+.-0./ ! $'+'(37#'3P#s)d*P# 3i$&P# 3i$&	P#
 P# !P# $'P# %(P# "P#  #P# "P# !P# !P# P# "%P#  '+!P#" $)#P#$ &+%P#& ),'P#( )P#* +P#, -P#. "%/P#0 ,11P#2 !3P# P#    r   N)configuration_utilsr   r   __all__r)   rP   rA   <module>rS      s$    4_#+ _#D "
"rP   