Ë
    ¥ãiE  ã                   ój   — d Z ddlmZ ddlmZ ddlmZ  ed¬«      e G d„ d	e«      «       «       Zd	gZy
)zFlaubert configurationé    )Ústricté   )ÚPreTrainedConfig)Úauto_docstringzflaubert/flaubert_base_uncased)Ú
checkpointc                   ól  — e Zd ZU dZdZddddddd	d
œZdZeed<   dZ	e
ez  ed<   dZeed<   dZeed<   dZeed<   dZeed<   dZe
ez  ed<   dZe
ez  ed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   d Ze
ed!<   d"Ze
ed#<   d$Ze
ed%<   d&Zeed'<   dZeed(<   d)Zeed*<   d+Zeed,<   d-Z eed.<   dZ!eed/<   d0Z"e#ed1<   dZ$eed2<   d3Z%e#d3z  ed4<   dZ&eed5<   dZ'e
ez  ed6<   d-Z(eed7<   d-Z)eed8<   d&Z*eed9<   d&Z+eed:<   d)Z,ed3z  ed	<   d&Z-ed3z  ed<   dZ.ee/e   z  d3z  ed<   dZ0eed;<   y3)<ÚFlaubertConfigaÚ  
    pre_norm (`bool`, *optional*, defaults to `False`):
        Whether to apply the layer normalization before or after the feed forward layer following the attention in
        each layer (Vaswani et al., Tensor2Tensor for Neural Machine Translation. 2018)
    emb_dim (`int`, *optional*, defaults to 2048):
        The dimensionality of embedding layer.
    gelu_activation (`bool`, *optional*, defaults to True):
        Whether to use GeLU activation function.
    sinusoidal_embeddings (`bool`, *optional*, defaults to `False`):
        Whether or not to use sinusoidal positional embeddings instead of absolute positional embeddings.
    causal (`bool`, *optional*, defaults to `False`):
        Whether or not the model should behave in a causal manner. Causal models use a triangular attention mask in
        order to only attend to the left-side context instead if a bidirectional context.
    asm (`bool`, *optional*, defaults to `False`):
        Whether or not to use an adaptive log softmax projection layer instead of a linear layer for the prediction
        layer.
    n_langs (`int`, *optional*, defaults to 1):
        The number of languages the model handles. Set to 1 for monolingual models.
    use_lang_emb (`bool`, *optional*, defaults to `True`)
        Whether to use language embeddings. Some models use additional language embeddings, see [the multilingual
        models page](http://huggingface.co/transformers/multilingual.html#xlm-language-embeddings) for information
        on how to use them.
    embed_init_std (`float`, *optional*, defaults to 2048^-0.5):
        The standard deviation of the truncated_normal_initializer for initializing the embedding matrices.
    embed_init_std (`float`, *optional*, defaults to `2048**-0.5`):
        Initializer std for embedding layers.
    bos_index (`int`, *optional*, defaults to 0):
        The index of the beginning of sentence token in the vocabulary.
    eos_index (`int`, *optional*, defaults to 1):
        The index of the end of sentence token in the vocabulary.
    pad_index (`int`, *optional*, defaults to 2):
        The index of the padding token in the vocabulary.
    unk_index (`int`, *optional*, defaults to 3):
        The index of the unknown token in the vocabulary.
    mask_index (`int`, *optional*, defaults to 5):
        The index of the masking token in the vocabulary.
    is_encoder (`bool`, *optional*, defaults to True):
        Whether the model is used as an encoder.
    summary_type (`string`, *optional*, defaults to "first"):
        Argument used when doing sequence summary. Used in the sequence classification and multiple choice models.
        Has to be one of the following options:
            - `"last"`: Take the last token hidden state (like XLNet).
            - `"first"`: Take the first token hidden state (like BERT).
            - `"mean"`: Take the mean of all tokens hidden states.
            - `"cls_index"`: Supply a Tensor of classification token position (like GPT/GPT-2).
            - `"attn"`: Not implemented now, use multi-head attention.
    summary_use_proj (`bool`, *optional*, defaults to `True`):
        Argument used when doing sequence summary. Used in the sequence classification and multiple choice models.
        Whether or not to add a projection after the vector extraction.
    summary_activation (`str`, *optional*):
        Argument used when doing sequence summary. Used in the sequence classification and multiple choice models.
        Pass `"tanh"` for a tanh activation to the output, any other value will result in no activation.
    summary_proj_to_labels (`bool`, *optional*, defaults to `True`):
        Used in the sequence classification and multiple choice models.
        Whether the projection outputs should have `config.num_labels` or `config.hidden_size` classes.
    summary_first_dropout (`float`, *optional*, defaults to 0.1):
        Used in the sequence classification and multiple choice models.
        The dropout ratio to be used after the projection and activation.
    start_n_top (`int`, *optional*, defaults to 5):
        Used in the SQuAD evaluation script.
    end_n_top (`int`, *optional*, defaults to 5):
        Used in the SQuAD evaluation script.
    mask_token_id (`int`, *optional*, defaults to 0):
        Model agnostic parameter to identify masked tokens when generating text in an MLM context.
    lang_id (`int`, *optional*, defaults to 1):
        The ID of the language used by the model. This parameter is used when generating text in a given language.
    ÚflaubertÚemb_dimÚn_headsÚn_layersÚ
vocab_sizeÚbos_token_idÚeos_token_idÚpad_token_id)Úhidden_sizeÚnum_attention_headsÚnum_hidden_layersÚn_wordsÚ	bos_indexÚ	eos_indexÚ	pad_indexFÚpre_normg        Ú	layerdropiÁu  i   é   é   gš™™™™™¹?ÚdropoutÚattention_dropoutTÚgelu_activationÚsinusoidal_embeddingsÚcausalÚasmé   Ún_langsÚuse_lang_embi   Úmax_position_embeddingsgÍ;fž –?Úembed_init_stdgê-™—q=Úlayer_norm_epsg{®Gáz”?Úinit_stdr   r   r   é   r   r   Ú	unk_indexé   Ú
mask_indexÚ
is_encoderÚfirstÚsummary_typeÚsummary_use_projNÚsummary_activationÚsummary_proj_to_labelsÚsummary_first_dropoutÚstart_n_topÚ	end_n_topÚmask_token_idÚlang_idÚtie_word_embeddings)1Ú__name__Ú
__module__Ú__qualname__Ú__doc__Ú
model_typeÚattribute_mapr   ÚboolÚ__annotations__r   ÚfloatÚintr   r   r   r   r   r   r   r    r!   r"   r$   r%   r&   r'   r(   r)   r   r   r   r+   r-   r.   r0   Ústrr1   r2   r3   r4   r5   r6   r7   r8   r   r   r   Úlistr9   © ó    ú„/var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/flaubert/configuration_flaubert.pyr	   r	      sÑ  … ñBðH €Jà Ø(Ø'ØØ#Ø#Ø#ñ€Mð €HˆdÓØ €Iˆus‰{Ó Ø€JÓØ€GˆSÓØ€HˆcÓØ€GˆSÓØ€GˆUS‰[ÓØ%(Ðu˜s‘{Ó(Ø €OTÓ Ø"'Ð˜4Ó'Ø€FˆDÓØ€CˆÓØ€GˆSÓØ€L$ÓØ#&Ð˜SÓ&Ø&€NEÓ&Ø!€NEÓ!Ø€HˆeÓØ€IˆsÓØ€IˆsÓØ€IˆsÓØ€IˆsÓØ€JÓØ€JÓØ€L#ÓØ!ÐdÓ!Ø%)Ð˜˜d™
Ó)Ø#'Ð˜DÓ'Ø),Ð˜5 3™;Ó,Ø€KÓØ€IˆsÓØ€M3ÓØ€GˆSÓØ €L#˜‘*Ó Ø €L#˜‘*Ó Ø+,€L#˜˜S™	‘/ DÑ(Ó,Ø $Ð˜Ô$rG   r	   N)	r=   Úhuggingface_hub.dataclassesr   Úconfiguration_utilsr   Úutilsr   r	   Ú__all__rF   rG   rH   ú<module>rM      sK   ðñ å .å 3Ý #ñ Ð;Ô<Øôt%Ð%ó t%ó ó =ðt%ðn Ð
rG   