
    it                     v    d Z ddlmZ ddlmZ ddlmZ ddlmZ  ed      e G d	 d
e                    Z	d
gZ
y)zGranite model configuration    )strict   )PreTrainedConfig)RopeParameters)auto_docstringzibm-granite/granite-3.0-8b-base)
checkpointc                       e Zd ZU dZdZdgZddddddddZdgdgfd	d
gd	gfd	gd	gfdZdZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	e
d<   dZe	dz  e
d<   dZee
d<   dZe	e
d<   dZee
d<   dZee
d<   dZee
d <   dZe	dz  e
d!<   d"Ze	dz  e
d#<   d$Ze	ee	   z  dz  e
d%<   d&Zee
d'<   dZeez  dz  e
d(<   d&Z ee
d)<   d*Z!ee	z  e
d+<   d&Z"ee
d,<   d-Z#ee	z  e
d.<   d-Z$ee	z  e
d/<   d-Z%ee	z  e
d0<   d-Z&ee	z  e
d1<    fd2Z' xZ(S )3GraniteConfiga  
    ```python
    >>> from transformers import GraniteModel, GraniteConfig

    >>> # Initializing a Granite granite-3b style configuration
    >>> configuration = GraniteConfig()

    >>> # Initializing a model from the granite-7b style configuration
    >>> model = GraniteModel(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```
    granitepast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi }  
vocab_sizei   hidden_sizei +  intermediate_size    num_hidden_layersnum_attention_headsNnum_key_value_headssilu
hidden_acti   max_position_embeddingsg{Gz?initializer_rangegư>rms_norm_epsT	use_cachepad_token_id   bos_token_id   eos_token_idFtie_word_embeddingsrope_parametersattention_biasg        attention_dropoutmlp_biasg      ?embedding_multiplierlogits_scalingresidual_multiplierattention_multiplierc                 ^    | j                   | j                  | _         t        |   di | y )N )r   r   super__post_init__)selfkwargs	__class__s     /var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/granite/configuration_granite.pyr4   zGraniteConfig.__post_init__X   s-    ##+'+'?'?D$''    ))__name__
__module____qualname____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r   r   r   strr   r    floatr!   r"   boolr#   r%   r'   listr(   r)   r   dictr*   r+   r,   r-   r.   r/   r0   r4   __classcell__)r7   s   @r8   r
   r
      s    J#4"5 &/%.%.%."+ )"+ &(9:#%568IJ!"_$56 JK"s"s!!&*t*J#'S'#u#L%It#L#*# L#* +,L#S	/D(, %%48O^d*T18 ND %(us{(Hd(+%#++"%NECK%'**(+%#++( (r9   r
   N)r=   huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r2   r9   r8   <module>rO      sK   & " . 3 1 # <=>($ >(  >>(B 
r9   