
    i
                     j    d Z ddlmZ ddlmZ ddlmZ  ed      e G d d	e                    Zd	gZy
)zRWKV configuration    )strict   )PreTrainedConfig)auto_docstringzRWKV/rwkv-4-169m-pile)
checkpointc                        e Zd ZU dZdZddiZdZeed<   dZ	eed<   dZ
eed	<   d
Zeed<   dZedz  ed<   dZedz  ed<   dZeed<   dZedz  ed<   dZeee   z  dz  ed<   dZeed<   dZeed<   dZeed<    fdZ xZS )
RwkvConfiga  
    context_length (`int`, *optional*, defaults to 1024):
        The maximum sequence length that this model can be used with in a single forward (using it in RNN mode
        lets use any sequence length).
    attention_hidden_size (`int`, *optional*):
        Dimensionality of the attention hidden states. Will default to `hidden_size` if unset.
    rescale_every (`int`, *optional*, defaults to 6):
        At inference, the hidden states (and weights of the corresponding output layers) are divided by 2 every
        `rescale_every` layer. If set to 0 or a negative number, no rescale is done.

    Example:

    ```python
    >>> from transformers import RwkvConfig, RwkvModel

    >>> # Initializing a Rwkv configuration
    >>> configuration = RwkvConfig()

    >>> # Initializing a model (with random weights) from the configuration
    >>> model = RwkvModel(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```rwkvmax_position_embeddingscontext_lengthie  
vocab_sizei   i   hidden_size    num_hidden_layersNattention_hidden_sizeintermediate_sizegh㈵>layer_norm_epsilonr   bos_token_ideos_token_id   rescale_everyFtie_word_embeddingsT	use_cachec                     | j                   | j                   n| j                  | _         | j                  | j                  nd| j                  z  | _        t        |   di | y )N    )r   r   r   super__post_init__)selfkwargs	__class__s     |/var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/rwkv/configuration_rwkv.pyr   zRwkvConfig.__post_init__C   sc    *.*D*D*PD&&VZVfVf 	" <@;Q;Q;]!7!7cdgkgwgwcw''    )__name__
__module____qualname____doc__
model_typeattribute_mapr   int__annotations__r   r   r   r   r   r   floatr   r   listr   r   boolr   r   __classcell__)r!   s   @r"   r	   r	      s    2 J.0@AMJNCKs(,3:,$(sTz( $$ L#* +,L#S	/D(,M3 %%It( (r#   r	   N)	r'   huggingface_hub.dataclassesr   configuration_utilsr   utilsr   r	   __all__r   r#   r"   <module>r4      sG     . 3 # 230(! 0(  40(f .r#   