There was an error while loading. Please reload this page.
1 parent 13053a7 · commit d039ad2 · Copy full SHA for d039ad2
llm/alignment/dpo/run_dpo.py
@@ -127,6 +127,8 @@ def main():
127
128
if training_args.pipeline_parallel_degree > 1:
129
model_class = AutoModelForCausalLMPipe
130
+ if not dpo_config.reference_free and not dpo_config.lora:
131
+ ref_model_config.dpo_config = dpo_config
132
model_config.dpo_config = dpo_config
133
else:
134
model_class = AutoModelForCausalLM
0 commit comments