
    Z jF                         S r SSKJr  SSKJr  SSKJr  SSKJrJ	r	  \	R                  " \5      r\" SS9\ " S	 S
\5      5       5       rS
/rg)zMinistral model configuration    )strict   )PreTrainedConfig)RopeParameters)auto_docstringloggingz"mistralai/Ministral-3-8B-Base-2512)
checkpointc                     ^  \ rS rSr% SrSrS/rSSSSSSSS.rS/S	/4S
S/S
/4S
/S
/4S.rSS1r	Sr
\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   S r\\S!'   S"r\\S#'   S$r\\S%'   S&r\S'-  \S('   S)r\S'-  \S*'   S+r\\\   -  S'-  \S,'   S-r\\S.'   S'r \!\"-  S'-  \S/'   S'r#\S'-  \S0'   S1r$\\-  \S2'   U 4S3 jr%S4r&U =r'$ )5Ministral3Config   a  
Example:

```python
>>> from transformers import Ministral3Config, Ministral3ForCausalLM, Mistral3Config, Mistral3ForConditionalGeneration, PixtralVisionConfig

>>> # Initializing a Pixtral-vision config
>>> vision_config = PixtralVisionConfig()

>>> # Initializing a Ministral3 config
>>> text_config = Ministral3Config()

>>> # Initializing a Mistral3 configuration
>>> configuration = Mistral3Config(vision_config, text_config)

>>> # Initializing a model from the Ministral3 configuration
>>> text_model = Ministral3ForCausalLM(text_config)

>>> # Initializing a model from the Mistral3 configuration
>>> model = Mistral3ForConditionalGeneration(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```
ministral3past_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormllama_4_scaling_betamax_position_embeddingsi   
vocab_sizei   hidden_sizei 8  intermediate_size"   num_hidden_layers    num_attention_heads   num_key_value_heads   head_dimsilu
hidden_acti   g{Gz?initializer_rangegh㈵>rms_norm_epsT	use_cache   Npad_token_id   bos_token_id   eos_token_idFtie_word_embeddingsrope_parameterssliding_windowg        attention_dropoutc                 X  > U R                   c  SSSSU R                  SSSSSS.
U l         U R                  b  U R                  OU R                  U R                  -  U l        U R
                  c  U R                  U l        S	U;   a  [        R                  S
5        [        TU ]$  " S0 UD6  g )Nyarng    .Ag      0@i @  g      @@g      ?g?)
type
rope_thetafactor original_max_position_embeddingsr   	beta_fast	beta_slowmscale_all_dimmscaler   layer_typeszDetected Mistral model with layer_types. Consider using AutoModel or Ministral classes instead to enable alternating attention compatibility. )
r1   r   r$   r   r    r"   loggerwarning_oncesuper__post_init__)selfkwargs	__class__s     ڈ/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/ministral3/configuration_ministral3.pyrC   Ministral3Config.__post_init__]   s    ''49+/+G+G! "%(+$D  *.)BHXHX\`\t\tHt##+'+'?'?D$F" ` 	''    )r$   r"   r1   )(__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planignore_keys_at_rope_validationr   int__annotations__r   r   r   r    r"   r$   r&   strr   r'   floatr(   r)   boolr+   r-   r/   listr0   r1   r   dictr2   r3   rC   __static_attributes____classcell__)rF   s   @rG   r   r      sr   2 J#4"5 &/%.%.%."+ )"+ &(9:#%568IJ!"_$56
 '=>W%X"JK"s"s!!  HcJ#)S)#u#L%It!L#*! L#* +,L#S	/D(, %%48O^d*T18!%NC$J%%(us{(( (rI   r   N)rN   huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r   
get_loggerrJ   r@   r   __all__r?   rI   rG   <module>rc      sa    $ . 3 1 , 
		H	% ?@Z(' Z(  AZ(z 
rI   