1 file changed: +22 -0 lines changed
Original file line number | Diff line number | Diff line change
@@ -484,6 +484,18 @@ paths:
484484 type : boolean
485485 default : auto
486486 description : Whether to mask the user messages in conversational data or prompts in instruction data.
# Selects the fine-tuning algorithm; when omitted the schema default is sft.
training_method:
  type: string
  enum:
    - sft
    - dpo
  default: sft
  description: >-
    The training method to use. 'sft' for Supervised Fine-Tuning or
    'dpo' for Direct Preference Optimization.
# Beta value for DPO runs; per its description it only applies when
# training_method is 'dpo'.
dpo_beta:
  type: number
  format: float
  default: 0.1
  description: >-
    The beta parameter for DPO training. Only applicable when
    training_method is 'dpo'.
487499 training_type :
488500 type : object
489501 oneOf :
@@ -2337,6 +2349,16 @@ components:
23372349 enum :
23382350 - auto
23392351 default : auto
# Training algorithm selector for this component schema. The description
# is copied from the same-named property in the paths section, where it
# was already documented.
training_method:
  type: string
  enum:
    - sft
    - dpo
  default: sft
  description: The training method to use. 'sft' for Supervised Fine-Tuning or 'dpo' for Direct Preference Optimization.
# Beta value for DPO training in this component schema. The description
# is copied from the same-named property in the paths section, where it
# was already documented.
dpo_beta:
  type: number
  format: float
  default: 0.1
  description: The beta parameter for DPO training. Only applicable when training_method is 'dpo'.
23402362 training_type :
23412363 type : object
23422364 oneOf :
You can’t perform that action at this time.
0 commit comments