
    Z j>8                     &   S SK r SSKJr  SSKJr  SSKJrJrJrJ	r	J
r
JrJrJrJrJrJrJrJrJrJrJrJrJrJrJrJrJrJrJr  SSKJr  SSK J!r!  SS	K"J#r#  SS
K$J%r%  SSK&J'r'  SSK(J)r)  SSK*J+r+  SSK,J-r-  SSK.J/r/  SSK0J1r1  SSK2J3r3  SSK4J5r5  SSK6J7r7  SSK8J9r9  SSK:J;r;  SSK<J=r=  SSK>J?r?  SSK@JArA  SSKBJCrC  SSKDJErE  SSKFJGrG  SSKHJIrI  SSKJJKrK  SSKLJMrM  0 S\%_S \)_S!\+_S"\9_S#\!_S$\C_S%\E_S&\5_S'\7_S(\/_S)\;_S*\=_S+\-_S,\1_S-\K_S.\'_S/\M_\I\3\#\A\?\GS0.ErN0 S\_S \
_S!\
_S(\_S"\_S#\_S$\_S%\_S&\_S'\_S*\_S+\_S,\_S)\_S-\_S.\	_S/\_\\\\\\S0.ErO\\\\\\\\4rP\R                  " \R5      rS " S1 S25      rT " S3 S45      rUS5\V4S6 jrWS7\V4S8 jrXS9 rYg):    N   )
AutoConfig)logging)
AqlmConfigAutoRoundConfig	AwqConfigBitNetQuantConfigBitsAndBytesConfigCompressedTensorsConfig
EetqConfigFbgemmFp8ConfigFineGrainedFP8ConfigFourOverSixConfigFPQuantConfig
GPTQConfigHiggsConfig	HqqConfigMetalConfigMxfp4ConfigQuantizationConfigMixinQuantizationMethodQuantoConfigQuarkConfig
SinqConfig
SpQRConfigTorchAoConfig
VptqConfig   )HfQuantizer)AqlmHfQuantizer)AutoRoundQuantizer)AwqQuantizer)BitNetHfQuantizer)Bnb4BitHfQuantizer)Bnb8BitHfQuantizer)CompressedTensorsHfQuantizer)EetqHfQuantizer)FbgemmFp8HfQuantizer)FineGrainedFP8HfQuantizer)FourOverSixHfQuantizer)FPQuantHfQuantizer)GptqHfQuantizer)HiggsHfQuantizer)HqqHfQuantizer)MetalHfQuantizer)Mxfp4HfQuantizer)QuantoHfQuantizer)QuarkHfQuantizer)SinqHfQuantizer)SpQRHfQuantizer)TorchAoHfQuantizer)VptqHfQuantizerawqbitsandbytes_4bitbitsandbytes_8bitgptqaqlmquantoquarkfouroversixfp_quanteetqhiggshqqzcompressed-tensors
fbgemm_fp8torchaobitnetvptq)spqrfp8z
auto-roundmxfp4metalsinqc                   @    \ rS rSrSr\S\4S j5       r\S 5       rSr	g)AutoQuantizationConfig   z
The Auto-HF quantization config class that takes care of automatically dispatching to the correct
quantization config given a quantization config stored in a dictionary.
quantization_config_dictc           	         UR                  S5      nUR                  SS5      (       d  UR                  SS5      (       a/  UR                  SS5      (       a  SOSn[        R                  U-   nOUc  [        S5      eU[        ;  a,  [        SU S	[        [        R                  5       5       35      e[        U   nUR                  U5      $ )
Nquant_methodload_in_8bitFload_in_4bit_4bit_8bitThe model's quantization config from the arguments has no `quant_method` attribute. Make sure that the model has been correctly quantizedUnknown quantization type, got  - supported types are: )	getr   BITS_AND_BYTES
ValueError AUTO_QUANTIZATION_CONFIG_MAPPINGlistAUTO_QUANTIZER_MAPPINGkeys	from_dict)clsrO   rQ   suffix
target_clss        m/root/GenerationalWealth/GenerationalWealth/venv/lib/python3.13/site-packages/transformers/quantizers/auto.pyr`    AutoQuantizationConfig.from_dict   s    /33NC#''>>BZB^B^_motBuBu 8 < <^U S SWY`F-<<vEL! \  ??1, @/44678: 
 6lC
##$<==    c                     [         R                  " U40 UD6n[        USS 5      c  [        SU S35      eUR                  nU R                  U5      nUR                  " S0 UD6  U$ )Nquantization_configz)Did not found a `quantization_config` in z2. Make sure that the model is correctly quantized. )r   from_pretrainedgetattrr[   rh   r`   update)ra   pretrained_model_name_or_pathkwargsmodel_configrO   rh   s         rd   rj   &AutoQuantizationConfig.from_pretrained   s    !112OZSYZ<!6=E;<Y;Z  [M  N  $0#C#C !mm,DE"",V,""rf   ri   N)
__name__
__module____qualname____firstlineno____doc__classmethoddictr`   rj   __static_attributes__ri   rf   rd   rM   rM      s6    
 > > >( 
# 
#rf   rM   c                   ~    \ rS rSrSr\S\\-  4S j5       r\S 5       r	\S\\-  S\S-  4S j5       r
\S	 5       rS
rg)AutoHfQuantizer   z
 The Auto-HF quantizer class that takes care of automatically instantiating to the correct
`HfQuantizer` given the `QuantizationConfig`.
rh   c           	         [        U[        5      (       a  [        R                  U5      nUR                  nU[
        R                  :X  a<  [        U[        5      (       d  [        S5      eUR                  (       a  US-  nOUS-  nU[        ;  a,  [        SU S[        [        R                  5       5       35      e[        U   nU" U40 UD6$ )NzZFound `quant_method=bitsandbytes` but `quantization_config` is not a `BitsAndBytesConfig`.rU   rT   rW   rX   )
isinstancerw   rM   r`   rQ   r   rZ   r
   	TypeErrorrR   r^   r[   r]   r_   )ra   rh   rn   rQ   rc   s        rd   from_configAutoHfQuantizer.from_config   s     )400"8"B"BCV"W*77 -<<<13EFFp  #//''551, @/44678: 
 ,L9
-888rf   c                 R    [         R                  " U40 UD6nU R                  U5      $ )N)rM   rj   r   )ra   rm   rn   rh   s       rd   rj   AutoHfQuantizer.from_pretrained   s*    4DDEbmflm233rf   quantization_config_from_argsNc                 J   Ub  SnOSn[        U[        5      (       aA  [        U[        5      (       a  [        R                  " U5      nO[        R                  U5      nUbh  UR
                  R                  UR
                  R                  :w  a:  [        SUR
                  R                   SUR
                  R                   S35      e[        U[        5      (       aq  [        U[        5      (       a\  UR                  5       nUR                  5        H  u  pV[        XU5        M     U(       a   US[        UR                  5       5       S3-  nUS:w  a8  [        U[        [        [         45      (       d  ["        R$                  " U5        U$ [&        R)                  U5        U$ )zt
handles situations where both quantization_config from args and quantization_config from model config are present.
zYou passed `quantization_config` or equivalent parameters to `from_pretrained` but the model you're loading already has a `quantization_config` attribute. The `quantization_config` from the model will be used. zThe model is quantized with z but you are passing a z| config. Please make sure to pass the same quantization config class to `from_pretrained` with different loading attributes.z"However, loading attributes (e.g. z]) will be overwritten with the one you passed to `from_pretrained`. The rest will be ignored.)r}   rw   r   r`   rM   	__class__rq   r[   LOADING_ATTRIBUTES_CONFIG_TYPESget_loading_attributesitemssetattrr]   r_   r   r   r   warningswarnloggerinfo)ra   rh   r   warning_msgloading_attr_dictattrvals          rd   merge_quantization_configs*AutoHfQuantizer.merge_quantization_configs   s    )4y 
 K)4007II&5&?&?@S&T#&<&F&FGZ&[# *5#--66:W:a:a:j:jj./B/L/L/U/U.VVm  oL  oV  oV  o_  o_  n` `F F 
 )+JKKPZ)+JQ
 Q
 !> T T V.446	+37 7 !!CDIZI_I_IaDbCc  dA   B  B"Z0CkS^`tEu%v%vMM+& #" KK$""rf   c           	         U R                  SS 5      nU R                  SS5      (       d  U R                  SS5      (       a/  U R                  SS5      (       a  SOSn[        R                  U-   nOUc  [        S5      eU[        ;  a8  [
        R                  SU S	[        [        R                  5       5       S
35        gg)NrQ   rR   FrS   rT   rU   rV   rW   rX   z~. Hence, we will skip the quantization. To remove the warning, you can delete the quantization_config attribute in config.jsonT)
rY   r   rZ   r[   r\   r   warningr]   r^   r_   )rO   rQ   rb   s      rd   supports_quant_method%AutoHfQuantizer.supports_quant_method  s    /33NDI#''>>BZB^B^_motBuBu 8 < <^U S SWY`F-<<vEL! \  ??NN1, @/44678 9ii
 rf   ri   )rq   rr   rs   rt   ru   rv   r   rw   r   rj   r   staticmethodr   rx   ri   rf   rd   rz   rz      s    
 9.E.L 9 98 4 4 /#!$;;/# (?'E/# /#b  rf   rz   methodc                    ^  U 4S jnU$ )z-Register a custom quantization configuration.c                    > T[         ;   a  [        ST S35      e[        U [        5      (       d  [	        S5      eU [         T'   U $ )NzConfig '' already registeredz*Config must extend QuantizationConfigMixin)r\   r[   
issubclassr   r~   )ra   r   s    rd   register_config_fn8register_quantization_config.<locals>.register_config_fn$  sK    55xx/CDEE#677HII36(0
rf   ri   )r   r   s   ` rd   register_quantization_configr   !  s     rf   namec                    ^  U 4S jnU$ )zRegister a custom quantizer.c                    > T[         ;   a  [        ST S35      e[        U [        5      (       d  [	        S5      eU [         T'   U $ )NzQuantizer 'r   z!Quantizer must extend HfQuantizer)r^   r[   r   r   r~   )ra   r   s    rd   register_quantizer_fn1register_quantizer.<locals>.register_quantizer_fn4  sJ    )){4&0DEFF#{++?@@'*t$
rf   ri   )r   r   s   ` rd   register_quantizerr   1  s     ! rf   c                 H   [        U S5      nU(       a&  [        R                  U R                  5      (       d  SnU(       d  UbR  U(       a&  [        R	                  U R                  U5      U l        OXl        [        R                  U R                  US9nOS nUb  UR                  UUS9  UR                  U5      nUR                  U 5      n UR                  U 5      n [        UR                  SS5      (       d&  UR                  R                  n[        USU5      US'   X`U4$ )Nrh   F)pre_quantized)
device_mapweights_only
dequantizevaluequant)hasattrrz   r   rh   r   r   validate_environmentupdate_device_mapupdate_tp_planupdate_ep_planrk   rQ   )configrh   r   r   
user_agentr   hf_quantizerrQ   s           rd   get_hf_quantizerr   A  s   F$9:M_BB6C]C]^^+7)8)S)S**,?*F& *=&&22&&' 3 

 ))!% 	* 	
 "33J?
,,V4,,V4 |77uMM';;HHL"),"NJw++rf   )Zr   models.auto.configuration_autor   utilsr   utils.quantization_configr   r   r   r	   r
   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   baser   quantizer_aqlmr    quantizer_auto_roundr!   quantizer_awqr"   quantizer_bitnetr#   quantizer_bnb_4bitr$   quantizer_bnb_8bitr%   quantizer_compressed_tensorsr&   quantizer_eetqr'   quantizer_fbgemm_fp8r(   quantizer_finegrained_fp8r)   quantizer_fouroversixr*   quantizer_fp_quantr+   quantizer_gptqr,   quantizer_higgsr-   quantizer_hqqr.   quantizer_metalr/   quantizer_mxfp4r0   quantizer_quantor1   quantizer_quarkr2   quantizer_sinqr3   quantizer_spqrr4   quantizer_torchaor5   quantizer_vptqr6   r^   r\   r   
get_loggerrq   r   rM   rz   strr   r   r   ri   rf   rd   <module>r      s    7       4  + 4 ' / 2 2 F + 6 @ 9 2 + - ) - - / - + + 1 +	<+ + O	
 O   ) " O  
> 6 & !  !" O#$ $$/ 4$	9$+$ +$ J	$
 J$ J$ l$ [$ $$ $ 
9$ 1$ /$ [$ }$  !$" J#$$ !/$  6 	#  
		H	%&# &#Rl l^  !S ! !,rf   