
    Z j                     p    S r SSKJr  SSKJr  SSKJr  SSKJr  \" SS9\ " S	 S
\5      5       5       r	S
/r
g)zStarcoder2 model configuration    )strict   )PreTrainedConfig)RopeParameters)auto_docstringzbigcode/starcoder2-7b)
checkpointc                      \ rS rSr% SrSrS/rSSSSSSS.rS/S	/4S
S/S
/4S
/S
/4S.rSr	\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\
\S'   Sr\\S'   Sr\
\S'   Sr\\S'   Sr\\S '   S!r\\S"'   S#r\
S$-  \S%'   S#r\
\\
   -  S$-  \S&'   S$r\
S$-  \S''   S$r\\-  S$-  \S('   S$r \
S$-  \S)'   S*r!\\
-  \S+'   S*r"\\
-  \S,'   S*r#\\
-  \S-'   S!r$\\S.'   S!r%\\S/'   S0r&g$)1Starcoder2Config   a  
use_bias (`bool`, *optional*, defaults to `True`):
    Whether to use bias term on linear layers of the model.

```python
>>> from transformers import Starcoder2Model, Starcoder2Config

>>> # Initializing a Starcoder2 7B style configuration
>>> configuration = Starcoder2Config()

>>> # Initializing a model from the Starcoder2 7B style configuration
>>> model = Starcoder2Model(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```

starcoder2past_key_valuescolwiserowwise)zlayers.*.self_attn.q_projzlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projzlayers.*.mlp.c_fczlayers.*.mlp.c_proj	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormi   
vocab_sizei   hidden_sizei 0  intermediate_size   num_hidden_layers   num_attention_heads   num_key_value_headsgelu_pytorch_tanh
hidden_acti   max_position_embeddingsgVy?initializer_rangegh㈵>norm_epsilonT	use_cacheiP  Nbos_token_ideos_token_idpad_token_idrope_parameterssliding_windowg        attention_dropoutresidual_dropoutembedding_dropoutuse_biastie_word_embeddings )'__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr   int__annotations__r   r   r   r   r   r!   strr"   r#   floatr$   r%   boolr&   r'   listr(   r)   r   dictr*   r+   r,   r-   r.   r/   __static_attributes__r0       ڈ/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/starcoder2/configuration_starcoder2.pyr
   r
      sv   $ J#4"5 &/%.%.%.&( &(9:#%568IJ!"_$56 JK"s"s!!  )J)#'S''u'L%It$L#*$+0L#S	/D(0#L#*#48O^d*T18!%NC$J%%(us{($'eck'%(us{(Hd $$rB   r
   N)r5   huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   r
   __all__r0   rB   rC   <module>rI      sK    % . 3 1 # 238%' 8%  48%v 
rB   