
    Z j                     d    S r SSKJr  SSKJr  SSKJr  \" SS9\ " S S	\5      5       5       rS	/rg
)zFSMT configuration    )strict   )PreTrainedConfig)auto_docstringzfacebook/wmt19-en-ru)
checkpointc                   \  ^  \ rS rSr% SrSrSSSSS.rS	r\\	   \
\	S
4   -  \S'   Sr\\S'   Sr\\S'   Sr\	\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\-  \S'   Sr\\S'   Sr\\S'   Sr\\S'   Sr\\-  \S'   Sr\\-  \S'   Sr\\-  \S '   Sr\\-  \S!'   S"r\\S#'   S$r \S%-  \S&'   S'r!\"\S('   S'r#\"\S)'   S*r$\"\S+'   S,r%\\S-'   S.r&\\S/'   S*r'\"\S0'   S'r(\"\S1'   S2r)\S%-  \S3'   S4r*\S%-  \S5'   S$r+\\\   -  S%-  \S6'   S$r,\\\   -  S%-  \S7'   U 4S8 jr-S9r.U =r/$ ):
FSMTConfig   a  
langs (`list[str]`):
    A list with source language and target_language (e.g., ['en', 'ru']).
src_vocab_size (`int`):
    Vocabulary size of the encoder. Defines the number of different tokens that can be represented by the
    `inputs_ids` passed to the forward method in the encoder.
tgt_vocab_size (`int`):
    Vocabulary size of the decoder. Defines the number of different tokens that can be represented by the
    `inputs_ids` passed to the forward method in the decoder.
max_length (`int`, *optional*, defaults to 200):
    Maximum length to generate.
num_beams (`int`, *optional*, defaults to 5):
    Number of beams for beam search that will be used by default in the `generate` method of the model. 1 means
    no beam search.
length_penalty (`float`, *optional*, defaults to 1):
    Exponential penalty to the length that is used with beam-based generation. It is applied as an exponent to
    the sequence length, which in turn is used to divide the score of the sequence. Since the score is the log
    likelihood of the sequence (i.e. negative), `length_penalty` > 0.0 promotes longer sequences, while
    `length_penalty` < 0.0 encourages shorter sequences.
early_stopping (`bool`, *optional*, defaults to `False`):
    Flag that will be used by default in the `generate` method of the model. Whether to stop the beam search
    when at least `num_beams` sentences are finished per batch or not.

Examples:

```python
>>> from transformers import FSMTConfig, FSMTModel

>>> # Initializing a FSMT facebook/wmt19-en-ru style configuration
>>> config = FSMTConfig()

>>> # Initializing a model (with random weights) from the configuration
>>> model = FSMTModel(config)

>>> # Accessing the model configuration
>>> configuration = model.config
```fsmtencoder_attention_headsd_modeltgt_vocab_sizeencoder_layers)num_attention_headshidden_size
vocab_sizenum_hidden_layers)ende.langsi(  src_vocab_sizereluactivation_functioni      
max_lengthmax_position_embeddingsi   encoder_ffn_dim      g        encoder_layerdropdecoder_ffn_dimdecoder_layersdecoder_attention_headsdecoder_layerdropattention_dropoutg?dropoutactivation_dropoutg{Gz?init_std   Ndecoder_start_token_idTis_encoder_decoderscale_embeddingFtie_word_embeddings   	num_beamsg      ?length_penaltyearly_stopping	use_cache   pad_token_idr   bos_token_ideos_token_idforced_eos_token_idc                 J   > UR                  SS 5        [        TU ]  " S0 UD6  g )Ndecoder )popsuper__post_init__)selfkwargs	__class__s     |/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/models/fsmt/configuration_fsmt.pyr=   FSMTConfig.__post_init__g   s!    

9d#''    r:   )0__name__
__module____qualname____firstlineno____doc__
model_typeattribute_mapr   liststrtuple__annotations__r   intr   r   r   r   r   r   r   r   r    floatr!   r"   r#   r$   r%   r&   r'   r(   r*   r+   boolr,   r-   r/   r0   r1   r2   r4   r5   r6   r7   r=   __static_attributes____classcell__)r@   s   @rA   r	   r	      s   $L J8 &-	M *6E49uS#X&5NCNC%%GSJ#'S'OSNC#%S%%(us{(OSNC#%S%%(us{(%(us{(GUS[&))He)*C$J*## OT  %%IsNE ND It L#*  L#* +,L#S	/D(,23tCy4/3( (rC   r	   N)	rH   huggingface_hub.dataclassesr   configuration_utilsr   utilsr   r	   __all__r:   rC   rA   <module>rX      sJ     . 3 # 12Q(! Q(  3Q(h .rC   