
    Z jt                     p    S r SSKJr  SSKJr  SSKJr  SSKJr  \" SS9\ " S	 S
\5      5       5       r	S
/r
g)zGranite model configuration    )strict   )PreTrainedConfig)RopeParameters)auto_docstringzibm-granite/granite-3.0-8b-base)
checkpointc                     ^  \ rS rSr% SrSrS/rSSSSSSSS.rS/S	/4S
S/S
/4S
/S
/4S.rSr	\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
S-  \S'   Sr\\S'   Sr\
\S'   Sr\\S'   Sr\\S'   S r\\S!'   Sr\
S-  \S"'   S#r\
S-  \S$'   S%r\
\\
   -  S-  \S&'   S'r\\S('   Sr\\ -  S-  \S)'   S'r!\\S*'   S+r"\\
-  \S,'   S'r#\\S-'   S.r$\\
-  \S/'   S.r%\\
-  \S0'   S.r&\\
-  \S1'   S.r'\\
-  \S2'   U 4S3 jr(S4r)U =r*$ )5GraniteConfig   a_  
```python
>>> from transformers import GraniteModel, GraniteConfig

>>> # Initializing a Granite granite-3b style configuration
>>> configuration = GraniteConfig()

>>> # Initializing a model from the granite-7b style configuration
>>> model = GraniteModel(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```
granitepast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi }  
vocab_sizei   hidden_sizei +  intermediate_size    num_hidden_layersnum_attention_headsNnum_key_value_headssilu
hidden_acti   max_position_embeddingsg{Gz?initializer_rangegư>rms_norm_epsT	use_cachepad_token_id   bos_token_id   eos_token_idFtie_word_embeddingsrope_parametersattention_biasg        attention_dropoutmlp_biasg      ?embedding_multiplierlogits_scalingresidual_multiplierattention_multiplierc                 b   > U R                   c  U R                  U l         [        TU ]  " S0 UD6  g )N )r   r   super__post_init__)selfkwargs	__class__s     ڂ/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/granite/configuration_granite.pyr5   GraniteConfig.__post_init__X   s-    ##+'+'?'?D$''    )r   )+__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r   r   r   strr    r!   floatr"   r#   boolr$   r&   r(   listr)   r*   r   dictr+   r,   r-   r.   r/   r0   r1   r5   __static_attributes____classcell__)r8   s   @r9   r
   r
      s    J#4"5 &/%.%.%."+ )"+ &(9:#%568IJ!"_$56 JK"s"s!!&*t*J#'S'#u#L%It#L#*# L#* +,L#S	/D(, %%48O^d*T18 ND %(us{(Hd(+%#++"%NECK%'**(+%#++( (r;   r
   N)r@   huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r3   r;   r9   <module>rS      sK   & " . 3 1 # <=>($ >(  >>(B 
r;   