
    i[                         d dl mZ ddlmZ ddlmZ ddlmZ  ed      e G d	 d
e                    Z ed      e G d de                    Z	d
dgZ
y)    )strict   )PreTrainedConfig)auto_docstring   )Qwen2Configzthisisiron/Ovis2-1B-hf)
checkpointc                   B   e Zd ZU dZdZdZeed<   dZeed<   dZ	eed<   d	Z
eed
<   dZeed<   dZeee   z  eeef   z  ed<   dZeee   z  eeef   z  ed<   dZeed<   dZeez  ed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   d Zeed!<   d"Zeed#<   y$)%Ovis2VisionConfigas  
    hidden_stride (`int`, *optional*, defaults to 1):
        The stride of the hidden layer in the Vision Transformer.
    num_visual_indicator_tokens (`int`, *optional*, defaults to 5):
        Number of visual indicator tokens.
    tokenize_function (`str`, *optional*, defaults to `"softmax"`):
        The function used to tokenize the visual indicator tokens.
    vision_configi   hidden_sizei   intermediate_size   num_hidden_layers   num_attention_headsr   num_channels   
image_size   
patch_sizegh㈵>rms_norm_epsg        attention_dropoutFqkv_biasmlp_biassilu
hidden_acti @  
vocab_size   hidden_stride   num_visual_indicator_tokensg{Gz?initializer_rangesoftmaxtokenize_functionN)__name__
__module____qualname____doc__base_config_keyr   int__annotations__r   r   r   r   r   listtupler   r   floatr   r   boolr   r   strr   r    r"   r#   r%        ~/var/www/vps2.regionflexible.com/Desarrollo/venv/lib/python3.12/site-packages/transformers/models/ovis2/configuration_ovis2.pyr   r      s     &OK!s!s  L#47Jd3i%S/1746Jd3i%S/16L%%(us{(HdHdJJM3'((#u#&s&r3   r   c                        e Zd ZU dZdZeedZdZe	e
z  dz  ed<   dZe	e
z  dz  ed<   dZeed<   d	Zee   eed
f   z  ed<   dZeed<   dZeed<   dZeed<    fdZ xZS )Ovis2ConfigaL  
    visual_indicator_token_ids (`List[int]`, *optional*, defaults to `[151666, 151667, 151668, 151669, 151670]`):
        The visual indicator token ids to encode the image prompt.

    ```python
    >>> from transformers import Ovis2ForConditionalGeneration, Ovis2Config

    >>> # Initializing a Ovis2 style configuration
    >>> configuration = Ovis2Config()

    >>> # Initializing a model from the Ovis2-2B style configuration
    >>> model = Ovis2ForConditionalGeneration(configuration)

    >>> # Accessing the model configuration
    >>> configuration = model.config
    ```
    ovis2)text_configr   Nr   r8   iqP image_token_id)irP isP itP iuP ivP .visual_indicator_token_idsi[P r   i   r   Ttie_word_embeddingsc                    t        | j                  t              rt        di | j                  | _        | j                  $t        t	        | j
                              | _        t        | j                  t              rt        di | j                  | _        n| j                  t               | _        t        | $  di | y )N)r"   r2   )

isinstancer   dictr   lenr:   r8   r   super__post_init__)selfkwargs	__class__s     r4   rA   zOvis2Config.__post_init__X   s    d(($/!2!HT5G5G!HD%!2sSWSrSrOs!tDd&&-*>T-=-=>D%*}D''r3   )r&   r'   r(   r)   
model_typer   r   sub_configsr   r>   r   r,   r8   r9   r+   r:   r-   r.   r   r   r;   r0   rA   __classcell__)rD   s   @r4   r6   r6   8   s    $ J"-@QRK48M4**T1826K((4/6 NC >fS	E#s(O ;fJK $$( (r3   r6   N)huggingface_hub.dataclassesr   configuration_utilsr   utilsr   qwen2.configuration_qwen2r   r   r6   __all__r2   r3   r4   <module>rM      st     / 3 # 3 34'( '  5'> 34)(" )(  5)(X 
.r3   