
    i,
                     r    d dl mZ ddlmZ ddlmZ ddlmZ  ed      e G d d	e                    Zd	gZ	y
)    )strict   )PretrainedConfig)RopeParameters)auto_docstringzkarpathy/nanochat-d32)
checkpointc                       e Zd ZU dZdZdgZdddddddZdZee	d<   d	Z
ee	d
<   dZee	d<   dZee	d<   dZee	d<   dZedz  e	d<   dZee	d<   dZee	d<   dZeez  e	d<   dZee	d<   dZee	d<   dZeez  dz  e	d<   dZee	d<   d Zedz  e	d!<   d"Zee	d#<   d$Zedz  e	d%<   d&Zeee   z  dz  e	d'<   d&Z edz  e	d(<   d"Z!ee	d)<    fd*Z" xZ#S )+NanoChatConfiga  
    Example:

    ```python
    >>> from transformers import NanoChatModel, NanoChatConfig

    >>> # Initializing a NanoChat style configuration
    >>> configuration = NanoChatConfig()

    >>> # Initializing a model from the NanoChat style configuration
    >>> model = NanoChatModel(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```nanochatpast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.fc1zlayers.*.mlp.fc2i  
vocab_sizei   hidden_sizei    intermediate_size   num_hidden_layers   num_attention_headsNnum_key_value_headsi   max_position_embeddingsrelu2
hidden_actg        attention_dropoutgư>rms_norm_epsg{Gz?initializer_rangerope_parametersT	use_cacheg      .@final_logit_softcappingFattention_biasr   bos_token_id   eos_token_idpad_token_idtie_word_embeddingsc                 ^    | j                   | j                  | _         t        |   di | y )N )r   r   super__post_init__)selfkwargs	__class__s     /var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/nanochat/configuration_nanochat.pyr)   zNanoChatConfig.__post_init__J   s-    ##+'+'?'?D$''    )$__name__
__module____qualname____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planr   int__annotations__r   r   r   r   r   r   r   strr   floatr   r   r   r   dictr   boolr   r    r!   r#   listr$   r%   r)   __classcell__)r,   s   @r-   r
   r
      s2     J#4"5 &/%.%.%.%% JK!s!s  &*t*#'S'J%(us{(L%#u#48O^d*T18It,0UT\0 ND  L#* +,L#S	/D(, L#*  %%( (r.   r
   N)
huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r'   r.   r-   <module>rC      sH     / 3 1 # 235(% 5(  45(p 
r.   