ó
    Z– jý  ã                   ól   • S SK Jr  SSKJr  SSKJr  SSKJr  \" SS9\ " S S	\5      5       5       rS	/r	g
)é    )Ústricté   )ÚPreTrainedConfig)ÚRopeParameters)Úauto_docstringzCohereForAI/c4ai-command-r-v01)Ú
checkpointc                   óà  ^ • \ rS rSr% SrSrS/rSSSSSSSS.rS/S	/4S
S/S
/4S
/S
/4S.rSr	\
\S'   Sr\
\S'   Sr\
\S'   Sr\\S'   Sr\
\S'   Sr\
\S'   Sr\
S-  \S'   Sr\\S'   Sr\
\S'   Sr\\S'   S r\\S!'   S"r\\S#'   S$r\
S-  \S%'   S&r\
S-  \S''   S(r\
\\
   -  S-  \S)'   S"r\\S*'   Sr\ \!-  S-  \S+'   S,r"\\S-'   S.r#\\
-  \S/'   S0r$\
S-  \S1'   Sr%\\   S-  \S2'   U 4S3 jr&S4r'U =r($ )5ÚCohere2Configé   aÖ  
logit_scale (`float`, *optional*, defaults to 0.0625):
    The scaling factor for the output logits.

```python
>>> from transformers import Cohere2Model, Cohere2Config

>>> # Initializing a Cohere Nextmodel configuration
>>> configuration = Cohere2Config()

>>> # Initializing a model from the Cohere2 configuration
>>> model = Cohere2Model(configuration) # doctest: +SKIP

>>> # Accessing the model configuration
>>> configuration = model.config # doctest: +SKIP
```
Úcohere2Úpast_key_valuesÚcolwiseÚrowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_projÚ	input_idsÚinputs_embedsÚhidden_statesÚattention_mask)Úembed_tokensÚlayersÚnormi è Ú
vocab_sizei    Úhidden_sizei X  Úintermediate_sizeg      °?Úlogit_scaleé(   Únum_hidden_layersé@   Únum_attention_headsNÚnum_key_value_headsÚsiluÚ
hidden_actÚmax_position_embeddingsg{®Gáz”?Úinitializer_rangegñhãˆµøä>Úlayer_norm_epsTÚ	use_cacher   Úpad_token_idé   Úbos_token_idiä Úeos_token_idÚtie_word_embeddingsÚrope_parametersFÚattention_biasg        Úattention_dropouti   Úsliding_windowÚlayer_typesc                 ól  >• U R                   c  U R                  U l         U R                  U R                  -  U l        U R                  cU  UR                  SS5      n[        U R                  5       Vs/ s H  n[        US-   U-  5      (       a  SOSPM     snU l        [        TU ](  " S0 UD6  g s  snf )NÚsliding_window_patterné   é   Úsliding_attentionÚfull_attention© )r   r   r   Úhead_dimr/   ÚpopÚranger   ÚboolÚsuperÚ__post_init__)ÚselfÚkwargsÚ_sliding_window_patternÚiÚ	__class__s       €Ú‚/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/cohere2/configuration_cohere2.pyr<   ÚCohere2Config.__post_init__X   s¶   ø€ Ø×#Ñ#Ñ+Ø'+×'?Ñ'?ˆDÔ$ð ×(Ñ(¨D×,DÑ,DÑDˆŒð ×ÑÑ#à&,§j¡jÐ1IÈ1Ó&MÐ#ô ˜t×5Ñ5Ô6ó â6Aô (,¨Q°©UÐ6MÑ,M×'NÑ'NÑ#ÐTdÒdÙ6ñ ˆDÔô
 	‰ÒÑ' Ó'ùò s   Á4$B1)r7   r/   r   ))Ú__name__Ú
__module__Ú__qualname__Ú__firstlineno__Ú__doc__Ú
model_typeÚkeys_to_ignore_at_inferenceÚbase_model_tp_planÚbase_model_pp_planr   ÚintÚ__annotations__r   r   r   Úfloatr   r   r   r!   Ústrr"   r#   r$   r%   r:   r&   r(   r)   Úlistr*   r+   r   Údictr,   r-   r.   r/   r<   Ú__static_attributes__Ú__classcell__)rA   s   @rB   r
   r
      s…  ø‡ ñð$ €JØ#4Ð"5Ðà%.Ø%.Ø%.Ø%.Ø"+Ø )Ø"+ñÐð &˜¨Ð(9Ð:Ø#Ð%5Ð6¸Ð8IÐJØ!Ð" _Ð$5Ð6ñÐð €JÓØ€KÓØ"ÐsÓ"Ø€KÓØÐsÓØ!Ð˜Ó!Ø&*Ð˜˜t™Ó*Ø€JÓØ#'Ð˜SÓ'Ø#ÐuÓ#Ø €NEÓ Ø€IˆtÓØ €L#˜‘*Ó Ø €L#˜‘*Ó Ø+1€L#˜˜S™	‘/ DÑ(Ó1Ø $Ð˜Ó$Ø48€O^ dÑ*¨TÑ1Ó8Ø €NDÓ Ø%(Ðu˜s‘{Ó(Ø!%€NC˜$‘JÓ%Ø$(€Kc‘˜TÑ!Ó(÷(ó (ó    r
   N)
Úhuggingface_hub.dataclassesr   Úconfiguration_utilsr   Úmodeling_rope_utilsr   Úutilsr   r
   Ú__all__r6   rU   rB   Ú<module>r[      sK   ðõ* /å 3Ý 1Ý #ñ Ð;Ñ<ØôJ(Ð$ó J(ó ó =ðJ(ðZ Ð
rU   