
    im                     j    d Z ddlmZ ddlmZ ddlmZ  ed      e G d d	e                    Zd	gZy
)zYOSO model configuration    )strict   )PreTrainedConfig)auto_docstringzuw-madison/yoso-4096)
checkpointc                      e Zd ZU dZdZdZeed<   dZeed<   dZ	eed<   dZ
eed	<   d
Zeed<   dZeed<   dZeez  ed<   dZeez  ed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZedz  ed <   dZeed!<   dZeed"<   dZedz  ed#<   d$Zedz  ed%<   d&Zeee   z  dz  ed'<   d(Z eed)<   dZ!eed*<   y)+
YosoConfiga  
    use_expectation (`bool`, *optional*, defaults to `True`):
        Whether or not to use YOSO Expectation. Overrides any effect of num_hash.
    hash_code_len (`int`, *optional*, defaults to 9):
        The length of hashes generated by the hash functions.
    num_hash (`int`, *optional*, defaults to 64):
        Number of hash functions used in [`YosoSelfAttention`].
    conv_window (`int`, *optional*):
        Kernel size of depth-wise convolution.
    use_fast_hash (`bool`, *optional*, defaults to `False`):
        Whether or not to use custom cuda kernels which perform fast random projection via hadamard transform.
    lsh_backward (`bool`, *optional*, defaults to `True`):
        Whether or not to perform backpropagation using Locality Sensitive Hashing.

    Example:

    ```python
    >>> from transformers import YosoConfig, YosoModel

    >>> # Initializing a YOSO uw-madison/yoso-4096 style configuration
    >>> configuration = YosoConfig()

    >>> # Initializing a model (with random weights) from the uw-madison/yoso-4096 style configuration
    >>> model = YosoModel(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```yosoiY  
vocab_sizei   hidden_size   num_hidden_layersnum_attention_headsi   intermediate_sizegelu
hidden_actg?hidden_dropout_probattention_probs_dropout_probi   max_position_embeddings   type_vocab_sizeg{Gz?initializer_rangeg-q=layer_norm_epsTuse_expectation	   hash_code_len@   num_hashNconv_windowuse_fast_hashlsh_backwardpad_token_idr   bos_token_id   eos_token_idFadd_cross_attentiontie_word_embeddings)"__name__
__module____qualname____doc__
model_typer   int__annotations__r   r   r   r   r   strr   floatr   r   r   r   r   r   boolr   r   r   r    r!   r"   r#   r%   listr&   r'        |/var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/yoso/configuration_yoso.pyr	   r	      s   : JJKs!!!s!J'**03 %#+3#'S'OS#u#!NE! OT M3Hc"Kt"M4L$ L#*  L#* +,L#S	/D(, %% $$r4   r	   N)	r+   huggingface_hub.dataclassesr   configuration_utilsr   utilsr   r	   __all__r3   r4   r5   <module>r:      sG     . 3 # 126%! 6%  36%r .r4   