from dataclasses import dataclass, field
from typing import Optional


@dataclass
class ModelConfig:
    """
    Configuration class for the models.

    Using [`~transformers.HfArgumentParser`] we can turn this class into
    [argparse](https://docs.python.org/3/library/argparse#module-argparse) arguments that can be specified on the
    command line.

    Parameters:
        model_name_or_path (`str` or `None`, *optional*, defaults to `None`):
            Model checkpoint for weights initialization.
        model_revision (`str`, *optional*, defaults to `"main"`):
            Specific model version to use. It can be a branch name, a tag name, or a commit id.
        torch_dtype (`Literal["auto", "bfloat16", "float16", "float32"]` or `None`, *optional*, defaults to `None`):
            Override the default `torch.dtype` and load the model under this dtype. Possible values are

                - `"bfloat16"`: `torch.bfloat16`
                - `"float16"`: `torch.float16`
                - `"float32"`: `torch.float32`
                - `"auto"`: Automatically derive the dtype from the model's weights.

        trust_remote_code (`bool`, *optional*, defaults to `False`):
            Whether to allow for custom models defined on the Hub in their own modeling files. This option should only
            be set to `True` for repositories you trust and in which you have read the code, as it will execute code
            present on the Hub on your local machine.
        attn_implementation (`str` or `None`, *optional*, defaults to `None`):
            Which attention implementation to use. You can run `--attn_implementation=flash_attention_2`, in which case
            you must install this manually by running `pip install flash-attn --no-build-isolation`.
        use_peft (`bool`, *optional*, defaults to `False`):
            Whether to use PEFT for training.
        lora_r (`int`, *optional*, defaults to `16`):
            LoRA R value.
        lora_alpha (`int`, *optional*, defaults to `32`):
            LoRA alpha.
        lora_dropout (`float`, *optional*, defaults to `0.05`):
            LoRA dropout.
        lora_target_modules (`Union[str, list[str]]` or `None`, *optional*, defaults to `None`):
            LoRA target modules.
        lora_modules_to_save (`list[str]` or `None`, *optional*, defaults to `None`):
            Model layers to unfreeze & train.
        lora_task_type (`str`, *optional*, defaults to `"CAUSAL_LM"`):
            Task type to pass for LoRA (use `"SEQ_CLS"` for reward modeling).
        use_rslora (`bool`, *optional*, defaults to `False`):
            Whether to use Rank-Stabilized LoRA, which sets the adapter scaling factor to `lora_alpha/√r`, instead of
            the original default value of `lora_alpha/r`.
        use_dora (`bool`, *optional*, defaults to `False`):
            Enable [Weight-Decomposed Low-Rank Adaptation (DoRA)](https://huggingface.co/papers/2402.09353). This
            technique decomposes the updates of the weights into two parts, magnitude and direction. Direction is
            handled by normal LoRA, whereas the magnitude is handled by a separate learnable parameter. This can
            improve the performance of LoRA, especially at low ranks. Right now, DoRA only supports linear and Conv2D
            layers. DoRA introduces a bigger overhead than pure LoRA, so it is recommended to merge weights for
            inference.
        load_in_8bit (`bool`, *optional*, defaults to `False`):
            Whether to use 8 bit precision for the base model. Works only with LoRA.
        load_in_4bit (`bool`, *optional*, defaults to `False`):
            Whether to use 4 bit precision for the base model. Works only with LoRA.
        bnb_4bit_quant_type (`str`, *optional*, defaults to `"nf4"`):
            Quantization type (`"fp4"` or `"nf4"`).
        use_bnb_nested_quant (`bool`, *optional*, defaults to `False`):
            Whether to use nested quantization.
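
    Example:

    A minimal sketch of how these fields can be filled in from the command line with
    [`~transformers.HfArgumentParser`] (the script name and flag values below are illustrative):

    ```python
    from transformers import HfArgumentParser

    from trl import ModelConfig

    # e.g. `python train.py --model_name_or_path my-org/my-model --use_peft --lora_r 8`
    parser = HfArgumentParser(ModelConfig)
    (model_config,) = parser.parse_args_into_dataclasses()
    ```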
    Nhelpz,Model checkpoint for weights initialization.)defaultmetadatamodel_name_or_pathmainzSSpecific model version to use. It can be a branch name, a tag name, or a commit id.model_revisionzGOverride the default `torch.dtype` and load the model under this dtype.)autobfloat16float16float32)r   choicestorch_dtypeFzWhether to allow for custom models defined on the Hub in their own modeling files. This option should only be set to `True` for repositories you trust and in which you have read the code, as it will execute code present on the Hub on your local machine.trust_remote_codezWhich attention implementation to use. You can run `--attn_implementation=flash_attention_2`, in which case you must install this manually by running `pip install flash-attn --no-build-isolation`.attn_implementationz!Whether to use PEFT for training.use_peft   zLoRA R value.lora_r    zLoRA alpha.
lora_alphag?zLoRA dropout.lora_dropoutzLoRA target modules.lora_target_modulesz!Model layers to unfreeze & train.lora_modules_to_save	CAUSAL_LMz?Task type to pass for LoRA (use 'SEQ_CLS' for reward modeling).lora_task_typeu   Whether to use Rank-Stabilized LoRA, which sets the adapter scaling factor to `lora_alpha/√r`, instead of the original default value of `lora_alpha/r`.
use_rsloraa  Enable Weight-Decomposed Low-Rank Adaptation (DoRA). This technique decomposes the updates of the weights into two parts, magnitude and direction. Direction is handled by normal LoRA, whereas the magnitude is handled by a separate learnable parameter. This can improve the performance of LoRA, especially at low ranks. Right now, DoRA only supports linear and Conv2D layers. DoRA introduces a bigger overhead than pure LoRA, so it is recommended to merge weights for inference.use_dorazHWhether to use 8 bit precision for the base model. Works only with LoRA.load_in_8bitzHWhether to use 4 bit precision for the base model. Works only with LoRA.load_in_4bitnf4zQuantization type.fp4bnb_4bit_quant_typez#Whether to use nested quantization.use_bnb_nested_quantc                     | j                   r| j                  rt        d      t        | j                  d      r.t        | j                        dk(  r| j                  d   | _        y y y )Nz8You can't use 8 bit and 4 bit precision at the same time__len__   r   )r"   r#   
ValueErrorhasattrr   len)selfs    S/home/cdr/jupyterlab/.venv/lib/python3.12/site-packages/trl/trainer/model_config.py__post_init__zModelConfig.__post_init__   s^    !2!2WXX4++Y7C@X@X<Y]^<^'+'?'?'BD$ =_7    )__name__
__module____qualname____doc__r   r   r   str__annotations__r   r   r   boolr   r   r   intr   r   floatr   listr   r   r    r!   r"   r#   r&   r'   r0    r1   r/   r   r      sw   ;z ).HI)   opNC  "']A
"K#  $ E
t  */ r
*#  =>Hd  /*FC  -(J   /*L%  05010$s),  16=>1(49-   [\NC   G
J   c
	Hd 	 deL$  deL$   %.E5>J   "'?@"$ 
Cr1   r   N)dataclassesr   r   typingr   r   r<   r1   r/   <module>r?      s,    )  _C _C _Cr1   