
    i                     j    d Z ddlmZ ddlmZ ddlmZ  ed      e G d d	e                    Zd	gZy
)zPop2Piano model configuration    )strict   )PreTrainedConfig)auto_docstringzsweetcocoa/pop2piano)
checkpointc                       e Zd ZU dZdZdgZddddZdZee	d	<   d
Z
ee	d<   dZee	d<   dZee	d<   dZee	d<   dZee	d<   dZedz  e	d<   dZee	d<   dZee	d<   dZee	d<   dZeez  e	d<   dZee	d<   dZee	d<   dZee	d <   d!Zee	d"<   d!Zee	d#<   d$Zedz  e	d%<   d&Zeee   z  dz  e	d'<   d(Zee	d)<   d*Z ee	d+<   d!Z!ee	d,<    fd-Z" xZ#S ).Pop2PianoConfiga  
    composer_vocab_size (`int`, *optional*, defaults to 21):
        Denotes the number of composers.
    relative_attention_num_buckets (`int`, *optional*, defaults to 32):
        The number of buckets to use for each attention layer.
    relative_attention_max_distance (`int`, *optional*, defaults to 128):
        The maximum distance of the longer sequences for the bucket separation.
    feed_forward_proj (`string`, *optional*, defaults to `"gated-gelu"`):
        Type of feed forward layer to be used. Should be one of `"relu"` or `"gated-gelu"`.
    dense_act_fn (`string`, *optional*, defaults to `"relu"`):
        Type of Activation Function to be used in `Pop2PianoDenseActDense` and in `Pop2PianoDenseGatedActDense`.
    	pop2pianopast_key_values
num_layersd_model	num_heads)num_hidden_layershidden_sizenum_attention_headsi`	  
vocab_size   composer_vocab_sizei   @   d_kvi   d_ff   Nnum_decoder_layers       relative_attention_num_buckets   relative_attention_max_distanceg?dropout_rategư>layer_norm_epsilong      ?initializer_factorz
gated-gelufeed_forward_projTis_encoder_decoder	use_cacher   pad_token_id   eos_token_idreludense_act_fnF
is_decodertie_word_embeddingsc                     | j                   | j                   n| j                  | _         | j                  j                  d      d   dk(  | _        t        |   di | y )N-r   gated )r   r   r"   splitis_gated_actsuper__post_init__)selfkwargs	__class__s     /var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/pop2piano/configuration_pop2piano.pyr3   zPop2PianoConfig.__post_init__@   sX    =A=T=T=`$"9"9fjfufu 2288=a@GK''    )$__name__
__module____qualname____doc__
model_typekeys_to_ignore_at_inferenceattribute_mapr   int__annotations__r   r   r   r   r   r   r   r   r   r   floatr    r!   r"   strr#   boolr$   r%   r'   listr)   r*   r+   r3   __classcell__)r6   s   @r7   r	   r	      s"    J#4"5*6yituMJ!!GSD#ND#J%)d
)Is*,"C,+.#S. #L%#+# $$ ##)s)##It L#* +,L#S	/D(,L#J $$( (r8   r	   N)	r<   huggingface_hub.dataclassesr   configuration_utilsr   utilsr   r	   __all__r/   r8   r7   <module>rK      sH    $ . 3 # 12+(& +(  3+(\ 
r8   