instruct fine tuning setup

This commit is contained in:
Your Name
2025-08-28 22:41:56 +00:00
parent d49b4ff2d5
commit 78d7063ce5
58 changed files with 2510234 additions and 98 deletions
@@ -139,7 +139,7 @@ class UnslothAlignPropConfig(AlignPropConfig):
def __init__(
self,
-exp_name = 'train',
+exp_name = 'inference',
run_name = '',
seed = 3407,
log_with = None,
+1 -1
View File
@@ -155,7 +155,7 @@ class UnslothDDPOConfig(DDPOConfig):
def __init__(
self,
-exp_name = 'train',
+exp_name = 'inference',
run_name = '',
seed = 3407,
log_with = None,