
    Z js                     t   S r SSKJr  SSKJrJr  SSKJr  SSKJ	r	  SSK
JrJrJrJr  SS	KJr  \R"                  " \5      r\" S
S9\ " S S\	5      5       5       r " S S\5      r\" S
S9 " S S\5      5       r\" S
S9 " S S\5      5       r\" S
S9 " S S\5      5       r\" S
S9 " S S\5      5       r/ SQrg)zPyTorch Arcee model.    )strict)auto_docstringlogging   )RopeParameters   )LlamaConfig)LlamaForCausalLMLlamaForQuestionAnsweringLlamaForSequenceClassificationLlamaForTokenClassification)NemotronMLPzarcee-ai/AFM-4.5B)
checkpointc                      \ rS rSr% SrSrSSSSSSS.rSr\\	S'   S	r
\\	S
'   Sr\\	S'   Sr\\	S'   Sr\\	S'   Sr\S-  \	S'   Sr\\	S'   Sr\\	S'   Sr\\	S'   Sr\\	S'   Sr\\	S'   Sr\S-  \	S'   Sr\S-  \	S'   Sr\\\   -  S-  \	S '   S!r\\	S"'   Sr\\-  S-  \	S#'   S!r\\	S$'   S%r \\-  \	S&'   S!r!\\	S''   Sr"\S-  \	S('   \#" 5       r$S)r%g)*ArceeConfig"   a[  
```python
>>> from transformers import ArceeModel, ArceeConfig

>>> # Initializing an Arcee AFM-4.5B-Base style configuration
>>> configuration = ArceeConfig()

>>> # Initializing a model from the AFM-4.5B-Base style configuration
>>> model = ArceeModel(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```arceecolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.up_projzlayers.*.mlp.down_proji }  
vocab_sizei 
  hidden_sizei H  intermediate_size    num_hidden_layersnum_attention_headsNnum_key_value_headsrelu2
hidden_acti   max_position_embeddingsg{Gz?initializer_rangegh㈵>rms_norm_epsT	use_cachepad_token_idi  bos_token_idi eos_token_idFtie_word_embeddingsrope_parametersattention_biasg        attention_dropoutmlp_biashead_dim )&__name__
__module____qualname____firstlineno____doc__
model_typebase_model_tp_planr   int__annotations__r   r   r   r   r   r   strr   r    floatr!   r"   boolr#   r$   r%   listr&   r'   r   dictr(   r)   r*   r+   AttributeErrorpretraining_tp__static_attributes__r,       x/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/arcee/modular_arcee.pyr   r   "   s-    J%.%.%.%. )"+ JK"s"s!!&*t*J#'S'#u#L%It#L#*#%L#*%+1L#S	/D(1 %%48O^d*T18 ND %(us{(HdHcDj#%Nr>   r   c                       \ rS rSrSrg)ArceeMLPU   r,   Nr-   r.   r/   r0   r=   r,   r>   r?   rA   rA   U   s    r>   rA   c                       \ rS rSrSrg)ArceeForCausalLMY   r,   NrC   r,   r>   r?   rE   rE   Y       r>   rE   c                       \ rS rSrSrg)ArceeForSequenceClassification^   r,   NrC   r,   r>   r?   rI   rI   ^   rG   r>   rI   c                       \ rS rSrSrg)ArceeForQuestionAnsweringc   r,   NrC   r,   r>   r?   rL   rL   c   rG   r>   rL   c                       \ rS rSrSrg)ArceeForTokenClassificationh   r,   NrC   r,   r>   r?   rO   rO   h   rG   r>   rO   )r   rE   rL   rI   rO   
ArceeModelArceePreTrainedModelN)r1   huggingface_hub.dataclassesr   transformers.utilsr   r   modeling_rope_utilsr   llama.configuration_llamar	   llama.modeling_llamar
   r   r   r   nemotron.modeling_nemotronr   
get_loggerr-   loggerr   rA   rE   rI   rL   rO   __all__r,   r>   r?   <module>r\      s     . 6 1 3  5 
		H	% ./.&+ .&  0.&b	{ 	 ./	' 	 0	 ./	%C 	 0	 ./	 9 	 0	 ./	"= 	 0	r>   