
    is                        d Z ddlmZ ddlmZmZ ddlmZ ddlm	Z	 ddl
mZmZmZmZ dd	lmZ  ej"                  e      Z ed
      e G d de	                    Z G d de      Z ed
       G d de             Z ed
       G d de             Z ed
       G d de             Z ed
       G d de             Zg dZy)zPyTorch Arcee model.    )strict)auto_docstringlogging   )RopeParameters   )LlamaConfig)LlamaForCausalLMLlamaForQuestionAnsweringLlamaForSequenceClassificationLlamaForTokenClassification)NemotronMLPzarcee-ai/AFM-4.5B)
checkpointc                      e Zd ZU dZdZdddddddZdZeed<   dZ	eed	<   d
Z
eed<   dZeed<   dZeed<   dZedz  ed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZedz  ed<   dZedz  ed<   dZeee   z  dz  ed<   d Zeed!<   dZeez  dz  ed"<   d Zeed#<   d$Zeez  ed%<   d Z eed&<   dZ!edz  ed'<    e"       Z#y)(ArceeConfiga  
    ```python
    >>> from transformers import ArceeModel, ArceeConfig

    >>> # Initializing an Arcee AFM-4.5B-Base style configuration
    >>> configuration = ArceeConfig()

    >>> # Initializing a model from the AFM-4.5B-Base style configuration
    >>> model = ArceeModel(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```arceecolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proji }  
vocab_sizei 
  hidden_sizei H  intermediate_size    num_hidden_layersnum_attention_headsNnum_key_value_headsrelu2
hidden_acti   max_position_embeddingsg{Gz?initializer_rangegh㈵>rms_norm_epsT	use_cachepad_token_idi  bos_token_idi eos_token_idFtie_word_embeddingsrope_parametersattention_biasg        attention_dropoutmlp_biashead_dim)$__name__
__module____qualname____doc__
model_typebase_model_tp_planr   int__annotations__r   r   r   r   r   r   strr   r   floatr    r!   boolr"   r#   r$   listr%   r&   r   dictr'   r(   r)   r*   AttributeErrorpretraining_tp     x/var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/arcee/modular_arcee.pyr   r   "   s-    J%.%.%.%. )"+ JK"s"s!!&*t*J#'S'#u#L%It#L#*#%L#*%+1L#S	/D(1 %%48O^d*T18 ND %(us{(HdHcDj#%Nr;   r   c                       e Zd Zy)ArceeMLPNr+   r,   r-   r:   r;   r<   r>   r>   U   s    r;   r>   c                       e Zd Zy)ArceeForCausalLMNr?   r:   r;   r<   rA   rA   Y       r;   rA   c                       e Zd Zy)ArceeForSequenceClassificationNr?   r:   r;   r<   rD   rD   ^   rB   r;   rD   c                       e Zd Zy)ArceeForQuestionAnsweringNr?   r:   r;   r<   rF   rF   c   rB   r;   rF   c                       e Zd Zy)ArceeForTokenClassificationNr?   r:   r;   r<   rH   rH   h   rB   r;   rH   )r   rA   rF   rD   rH   
ArceeModelArceePreTrainedModelN)r.   huggingface_hub.dataclassesr   transformers.utilsr   r   modeling_rope_utilsr   llama.configuration_llamar	   llama.modeling_llamar
   r   r   r   nemotron.modeling_nemotronr   
get_loggerr+   loggerr   r>   rA   rD   rF   rH   __all__r:   r;   r<   <module>rT      s     . 6 1 3  5 
		H	% ./.&+ .&  0.&b	{ 	 ./	' 	 0	 ./	%C 	 0	 ./	 9 	 0	 ./	"= 	 0	r;   