
    i                     v    d Z ddlmZ ddlmZ ddlmZ ddlmZ  ed      e G d	 d
e                    Z	d
gZ
y)zOLMo model configuration    )strict   )PreTrainedConfig)RopeParameters)auto_docstringzallenai/OLMo-7B-hf)
checkpointc                       e Zd ZU dZdZdgZddddddddZdgdgfd	d
gd	gfd	gd	gfdZdZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	dz  e
d<   dZee
d<   dZe	e
d<   dZee
d<   dZee
d<   dZe	dz  e
d <   dZe	dz  e
d!<   d"Ze	ee	   z  dz  e
d#<   d$Zee
d%<   dZeez  dz  e
d&<   d$Zee
d'<   d(Z ee	z  e
d)<   dZ!edz  e
d*<    fd+Z" xZ#S ),
OlmoConfiga(  
    clip_qkv (`float`, *optional*):
        If not `None`, elements of query, key and value attention states are clipped so that their
        absolute value does not exceed this value.

    ```python
    >>> from transformers import OlmoModel, OlmoConfig

    >>> # Initializing a OLMo 7B style configuration
    >>> configuration = OlmoConfig()

    >>> # Initializing a model from the OLMo 7B style configuration
    >>> model = OlmoModel(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```
    olmopast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi  
vocab_sizei   hidden_sizei +  intermediate_size    num_hidden_layersnum_attention_headsNnum_key_value_headssilu
hidden_acti   max_position_embeddingsg{Gz?initializer_rangeT	use_cache   pad_token_idbos_token_idig  eos_token_idFtie_word_embeddingsrope_parametersattention_biasg        attention_dropoutclip_qkvc                 ^    | j                   | j                  | _         t        |   di | y )N )r   r   super__post_init__)selfkwargs	__class__s     |/var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/olmo/configuration_olmo.pyr.   zOlmoConfig.__post_init__V   s-    ##+'+'?'?D$''    )$__name__
__module____qualname____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r   r   r   strr   r    floatr!   boolr#   r$   r%   listr&   r'   r   dictr(   r)   r*   r.   __classcell__)r1   s   @r2   r
   r
      s^   & J#4"5%.%.%.%."+ )"+ &(9:#%568IJ!"_$56 JK"s"s!!&*t*J#'S'#u#It L#* #L#*#+0L#S	/D(0 %%48O^d*T18 ND %(us{(!Hedl!( (r3   r
   N)r7   huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r,   r3   r2   <module>rI      sJ   &  . 3 1 # /0;(! ;(  1;(| .r3   