
    Z j                     x    S SK Jr  SSKJr  SSKJr  SSKJr  SSKJ	r	  \" SS9\ " S	 S
\5      5       5       r
S
/rg)    )strict   )PreTrainedConfig)RopeParameters)auto_docstring)intervalzinceptionai/Jais-2-8B-Chat)
checkpointc                     ^  \ rS rSr% SrSrS/rSSSSSSS.rS/S	/4S
S/S
/4S
/S
/4S.rSr	\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
S-  \S'   Sr\\S'   Sr\
\S'   \" SSS9" S S!9r\\S"'   S#r\\S$'   Sr\
S-  \S%'   S&r\
S-  \S''   S(r\
\\
   -  S-  \S)'   S*r\\S+'   Sr\\ -  S-  \S,'   S#r!\\S-'   Sr"\
\-  S-  \S.'   S#r#\\S/'   Sr$\
S-  \S0'   S1r%\\S2'   U 4S3 jr&S4 r'S5r(U =r)$ )6Jais2Config   aP  
```python
>>> from transformers import Jais2Model, Jais2Config

>>> # Initializing a Jais2 jais2-7b style configuration
>>> configuration = Jais2Config()

>>> # Initializing a model from the jais2-7b style configuration
>>> model = Jais2Model(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```jais2past_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi K 
vocab_sizei   hidden_sizei h  intermediate_size    num_hidden_layers   num_attention_headsNnum_key_value_headsrelu2
hidden_acti    max_position_embeddingsg        g      ?)minmaxg{Gz?)defaultinitializer_rangeT	use_cachepad_token_idr   bos_token_idiJ eos_token_idFtie_word_embeddingsrope_parametersattention_biasattention_dropoutmlp_biashead_dimgh㈵>layer_norm_epsc                    > U R                   c  U R                  U R                  -  U l         U R                  c  U R                  U l        [        TU ]  " S0 UD6  g )N )r0   r   r   r   super__post_init__)selfkwargs	__class__s     ~/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/jais2/configuration_jais2.pyr5   Jais2Config.__post_init__T   sO    ==  ,,0H0HHDM##+'+'?'?D$''    c                     U R                   U R                  -  S:w  a&  [        SU R                    SU R                   S35      eg)zOPart of `@strict`-powered validation. Validates the architecture of the config.r   zThe hidden size (z6) is not a multiple of the number of attention heads (z).N)r   r   
ValueError)r6   s    r9   validate_architecture!Jais2Config.validate_architecture\   sS    d666!;#D$4$4#5 622327  <r;   )r0   r   )*__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r   r   r!   strr"   r   r&   floatr'   boolr(   r)   r*   listr+   r,   r   dictr-   r.   r/   r0   r1   r5   r>   __static_attributes____classcell__)r8   s   @r9   r   r      s    J#4"5%.%.%.%. )"+ &(9:#%568IJ!"_$56 JK"s"s!!&*t*J#'S''CS9$GuGIt#L#*# L#* +1L#S	/D(1 %%48O^d*T18ND,/sU{T)/HdHcDj NE ( r;   r   N)huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   utils.type_validatorsr   r   __all__r3   r;   r9   <module>rX      sM   , / 3 1 # - 78B" B  9BJ /r;   