
    Z j                         S SK Jr  SSKJr  SSKJr  SSKJr  SSKJ	r	  SSK
JrJr  \" S	S
9\ " S S\5      5       5       r\" S	S
9\ " S S\5      5       5       rSS/rg)    )strict   )PreTrainedConfig)RopeParameters)auto_docstring)interval   )CONFIG_MAPPING
AutoConfigzrhymes-ai/Aria)
checkpointc                   &  ^  \ rS rSr% SrSrS/rSSSSSSSS.rS/S	/4S
S/S
/4S
/S
/4S.rSr	\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
S-  \S'   Sr\\S'   Sr\
\S'   \" SSS9" SS9r\\S '   S!r\\S"'   S#r\\S$'   S%r\
S-  \S&'   S'r\
S-  \S('   S%r\
\\
   -  S-  \S)'   S'r\
S-  \S*'   S+r\\S,'   Sr \!\"-  S-  \S-'   S+r#\\S.'   Sr$\
\-  S-  \S/'   S+r%\\S0'   Sr&\
S-  \S1'   S2r'S3r(\
\S4'   S%r)\
\S5'   S%r*\
\S6'   U 4S7 jr+S8 r,S9r-U =r.$ ):AriaTextConfig   a%  
moe_num_experts (`int`, *optional*, defaults to 8):
    The number of experts in the MoE layer.
moe_topk (`int`, *optional*, defaults to 2):
    The number of top experts to route to for each token.
moe_num_shared_experts (`int`, *optional*, defaults to 2):
    The number of shared experts.
	aria_textpast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projz%layers.*.mlp.shared_experts.gate_projz#layers.*.mlp.shared_experts.up_projz%layers.*.mlp.shared_experts.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi }  
vocab_sizei   hidden_sizeintermediate_size    num_hidden_layersnum_attention_headsNnum_key_value_headssilu
hidden_acti   max_position_embeddingsg        g      ?)minmax{Gz?)defaultinitializer_rangegư>rms_norm_epsT	use_cacher	   pad_token_id   bos_token_ideos_token_idpretraining_tpFtie_word_embeddingsrope_parametersattention_biasattention_dropoutmlp_biashead_dimtext_config   moe_num_expertsmoe_topkmoe_num_shared_expertsc                    > U R                   c  U R                  U R                  -  U l         U R                  c  U R                  U l        [        TU ]  " S0 UD6  g )N )r6   r   r    r!   super__post_init__)selfkwargs	__class__s     |/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/aria/configuration_aria.pyr?   AriaTextConfig.__post_init__U   sO    ==  ,,0H0HHDM##+'+'?'?D$''    c                     U R                   U R                  -  S:w  a&  [        SU R                    SU R                   S35      eg)zOPart of `@strict`-powered validation. Validates the architecture of the config.r   zThe hidden size (z6) is not a multiple of the number of attention heads (z).N)r   r    
ValueError)r@   s    rC   validate_architecture$AriaTextConfig.validate_architecture]   sS    d666!;#D$4$4#5 622327  <rE   )r6   r!   )/__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r    r!   r#   strr$   r   r)   floatr*   r+   boolr,   r.   r/   listr0   r1   r2   r   dictr3   r4   r5   r6   base_config_keyr9   r:   r;   r?   rH   __static_attributes____classcell__rB   s   @rC   r   r      s    J#4"5%.%.%.%.1:/81: &(9:#%568IJ!"_$56 JK!s!s!!&*t*J#'S''CS9$GuGL%It L#*  L#* +,L#S	/D(,!"NC$J" %%48O^d*T18 ND ,/sU{T)/HdHcDj#OOSHc"#C#( rE   r   c                      ^  \ rS rSr% SrSrSS0r\\S.r	Sr
\\-  S-  \S'   Sr\\-  S-  \S	'   S
r\\\   -  \S'   Sr\S-  \S'   Sr\\S'   Sr\\S'   Sr\\S'   U 4S jrSrU =r$ )
AriaConfigf   ze
projector_patch_to_query_dict (`dict`, *optional*):
    Mapping of patch sizes to query dimensions.
ariaimage_token_idimage_token_index)r7   vision_configNrd   r7   vision_feature_layerprojector_patch_to_query_dict	   r'   r)   Fr1   c                   > U R                   c
  SSS.U l         U R                   R                  5        VVs0 s H  u  p#[        U5      [        U5      _M     snnU l         [        U R                   R	                  5       5      U l        [        U R                  [        5      (       a;  SU R                  S'   [        U R                  S      " S0 U R                  D6U l        O U R                  c  [        S   " 5       U l        [        U R                  [        5      (       a+  SU R                  ;   a  [        S0 U R                  D6U l
        OU R                  c  [        5       U l
        [        TU ]4  " S0 UD6  g s  snnf )N      )i  i$  idefics3_visionrO   r=   )rg   itemsrS   r&   values'max_value_projector_patch_to_query_dict
isinstancerd   rY   r
   r7   r   r>   r?   )r@   rA   kvrB   s       rC   r?   AriaConfig.__post_init__|   sA    --52D. JNIkIkIqIqIs-tIsc!fc!fnIs-t*7:4;];];d;d;f7g4d(($///@D|,!/0B0B<0P!Q!gTXTfTf!gD'!/0A!B!DDd&&--,$BRBR2R-A0@0@AD%-/D'' .us   !E9)ro   rg   r7   rd   )rJ   rK   rL   rM   rN   rO   attribute_mapr   r   sub_configsrd   rY   r   rT   r7   rf   rS   rX   rg   rc   r)   rV   r1   rW   r?   r[   r\   r]   s   @rC   r_   r_   f   s    
 J-M #1:NK48M4**T1804K&-4,.#S	/.15!4$;5s#u# %%( (rE   r_   N)huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   utils.type_validatorsr   autor
   r   r   r_   __all__r=   rE   rC   <module>r}      s   ( / 3 1 # - - +,D% D  -DN +,*(! *(  -*(Z )
*rE   