EvSys

LocalRLConfig

Attributes

attribute model_config = ConfigDict(extra='forbid')
attribute learning_rate: float = 5e-05
attribute num_epochs: int = 3
attribute per_device_train_batch_size: int = 4
attribute gradient_accumulation_steps: int = 8
attribute max_completion_length: int = 128
attribute num_generations: int = 4
attribute warmup_steps: int = 30
attribute logging_steps: int = 10
attribute save_steps: int = 50
attribute save_total_limit: int = 5
attribute bf16: bool = False

Enable only on CUDA GPUs that support bfloat16 (Ampere+). Crashes on CPU/MPS.

attribute fp16: bool = False

Enable only on CUDA GPUs. Crashes on CPU/MPS.

attribute beta: float = 0.04
attribute seed: int = 42
attribute lora_rank: int = 4
attribute lora_alpha: int = 8
attribute lora_target_modules: list[str] = Field(default_factory=(lambda: ['q_proj', 'v_proj']))
attribute verifier_kind: str = 'format_only'
attribute verifier_params: dict[str, Any] = Field(default_factory=dict)

On this page