
    Z j                     l    S SK Jr  SSKJr  SSKJr  SSKJr  \" SS9\ " S S	\5      5       5       rS	/r	g
)    )strict   )PreTrainedConfig)RopeParameters)auto_docstringz$mistralai/Ministral-8B-Instruct-2410)
checkpointc                     ^  \ rS rSr% SrSrS/rSSSSSSSS.rS/S	/4S
S/S
/4S
/S
/4S.rSr	\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
S-  \S'   Sr\\S'   Sr\
\S'   Sr\\S'   S r\\S!'   S"r\\S#'   Sr\
S-  \S$'   S%r\
S-  \S&'   S'r\
\\
   -  S-  \S('   S)r\\S*'   Sr\ \!-  S-  \S+'   Sr"\
S-  \S,'   S-r#\\
-  \S.'   Sr$\\   S-  \S/'   U 4S0 jr%S1r&U =r'$ )2MinistralConfig   al  
Example:

```python
>>> from transformers import MinistralModel, MinistralConfig

>>> # Initializing a Ministral 8B style configuration
>>> configuration = MinistralConfig()

>>> # Initializing a model from the Ministral 8B style configuration
>>> model = MinistralModel(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```	ministralpast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi }  
vocab_sizei   hidden_sizei 8  intermediate_size    num_hidden_layersnum_attention_heads   num_key_value_headsNhead_dimsilu
hidden_acti   max_position_embeddingsg{Gz?initializer_rangegư>rms_norm_epsT	use_cachepad_token_id   bos_token_id   eos_token_idFtie_word_embeddingsrope_parameterssliding_windowg        attention_dropoutlayer_typesc                    > U R                   c  U R                  U l         U R                  c$  U R                  b  SOS/U R                  -  U l        [
        TU ]  " S0 UD6  g )Nsliding_attentionfull_attention )r   r   r/   r-   r   super__post_init__)selfkwargs	__class__s     چ/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/ministral/configuration_ministral.pyr5   MinistralConfig.__post_init__X   se    ##+'+'?'?D$#'+':':'F#L\ && 'D 	''    )r/   r   )(__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r   r   r   r!   strr"   r#   floatr$   r%   boolr&   r(   r*   listr+   r,   r   dictr-   r.   r/   r5   __static_attributes____classcell__)r8   s   @r9   r
   r
      s}     J#4"5 &/%.%.%."+ )"+ &(9:#%568IJ!"_$56 JK"s"s!!  HcDjJ#,S,#u#L%It#L#*# L#* +,L#S	/D(, %%48O^d*T18!%NC$J%%(us{($(KcT!(	( 	(r;   r
   N)
huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r3   r;   r9   <module>rS      sL   , / 3 1 # ABB(& B(  CB(J 
r;   