
    i                     r    d dl mZ ddlmZ ddlmZ ddlmZ  ed      e G d d	e                    Zd	gZ	y
)    )strict   )PreTrainedConfig)RopeParameters)auto_docstringz$mistralai/Ministral-8B-Instruct-2410)
checkpointc                       e Zd ZU dZdZdgZddddddddZdgdgfd	d
gd	gfd	gd	gfdZdZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	dz  e
d<   dZee
d<   dZe	e
d<   dZee
d<   dZee
d <   d!Zee
d"<   dZe	dz  e
d#<   d$Ze	dz  e
d%<   d&Ze	ee	   z  dz  e
d'<   d(Zee
d)<   dZee z  dz  e
d*<   dZ!e	dz  e
d+<   d,Z"ee	z  e
d-<   dZ#ee   dz  e
d.<    fd/Z$ xZ%S )0MinistralConfiga  
    Example:

    ```python
    >>> from transformers import MinistralModel, MinistralConfig

    >>> # Initializing a Ministral 8B style configuration
    >>> configuration = MinistralConfig()

    >>> # Initializing a model from the Ministral 8B style configuration
    >>> model = MinistralModel(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```	ministralpast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi }  
vocab_sizei   hidden_sizei 8  intermediate_size    num_hidden_layersnum_attention_heads   num_key_value_headsNhead_dimsilu
hidden_acti   max_position_embeddingsg{Gz?initializer_rangegư>rms_norm_epsT	use_cachepad_token_id   bos_token_id   eos_token_idFtie_word_embeddingsrope_parameterssliding_windowg        attention_dropoutlayer_typesc                     | j                   | j                  | _         | j                  #| j                  dndg| j                  z  | _        t        |   di | y )Nsliding_attentionfull_attention )r   r   r.   r,   r   super__post_init__)selfkwargs	__class__s     /var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/ministral/configuration_ministral.pyr4   zMinistralConfig.__post_init__X   se    ##+'+'?'?D$#'+':':'F#L\ && 'D 	''    )&__name__
__module____qualname____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r   r   r   r    strr!   r"   floatr#   r$   boolr%   r'   r)   listr*   r+   r   dictr,   r-   r.   r4   __classcell__)r7   s   @r8   r
   r
      s}     J#4"5 &/%.%.%."+ )"+ &(9:#%568IJ!"_$56 JK"s"s!!  HcDjJ#,S,#u#L%It#L#*# L#* +,L#S	/D(, %%48O^d*T18!%NC$J%%(us{($(KcT!(	( 	(r9   r
   N)
huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r2   r9   r8   <module>rO      sL   , / 3 1 # ABB(& B(  CB(J 
r9   