
    Z j,
                     l    S SK Jr  SSKJr  SSKJr  SSKJr  \" SS9\ " S S	\5      5       5       rS	/r	g
)    )strict   )PreTrainedConfig)RopeParameters)auto_docstringzkarpathy/nanochat-d32)
checkpointc                     ^  \ rS rSr% SrSrS/rSSSSSSS.rSr\	\
S	'   S
r\	\
S'   Sr\	\
S'   Sr\	\
S'   Sr\	\
S'   Sr\	S-  \
S'   Sr\	\
S'   Sr\\
S'   Sr\\	-  \
S'   Sr\\
S'   Sr\\
S'   Sr\\-  S-  \
S'   Sr\\
S '   S!r\S-  \
S"'   S#r\\
S$'   S%r\	S-  \
S&'   S'r\	\ \	   -  S-  \
S('   S'r!\	S-  \
S)'   S#r"\\
S*'   U 4S+ jr#S,r$U =r%$ )-NanoChatConfig   a`  
Example:

```python
>>> from transformers import NanoChatModel, NanoChatConfig

>>> # Initializing a NanoChat style configuration
>>> configuration = NanoChatConfig()

>>> # Initializing a model from the NanoChat style configuration
>>> model = NanoChatModel(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```nanochatpast_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.fc1zlayers.*.mlp.fc2i  
vocab_sizei   hidden_sizei    intermediate_size   num_hidden_layers   num_attention_headsNnum_key_value_headsi   max_position_embeddingsrelu2
hidden_actg        attention_dropoutgư>rms_norm_epsg{Gz?initializer_rangerope_parametersT	use_cacheg      .@final_logit_softcappingFattention_biasr   bos_token_id   eos_token_idpad_token_idtie_word_embeddingsc                 b   > U R                   c  U R                  U l         [        TU ]  " S0 UD6  g )N )r   r   super__post_init__)selfkwargs	__class__s     ڄ/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/nanochat/configuration_nanochat.pyr*   NanoChatConfig.__post_init__J   s-    ##+'+'?'?D$''    )r   )&__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planr   int__annotations__r   r   r   r   r   r   r   strr   floatr   r   r   r   dictr   boolr    r!   r"   r$   listr%   r&   r*   __static_attributes____classcell__)r-   s   @r.   r
   r
      s2     J#4"5 &/%.%.%.%% JK!s!s  &*t*#'S'J%(us{(L%#u#48O^d*T18It,0UT\0 ND  L#* +,L#S	/D(, L#*  %%( (r0   r
   N)
huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r(   r0   r.   <module>rG      sH     / 3 1 # 235(% 5(  45(p 
r0   