update lora.py

This commit is contained in:
Goekdeniz-Guelmez
2025-01-31 21:10:44 +01:00
parent a57d553fc1
commit 243c9621d9
2 changed files with 117 additions and 27 deletions

View File

@@ -22,13 +22,7 @@ generate()
class GRPOTrainingArgs(TrainingArgs):
group_size: int = field(
default=4,
metadata={"help": "Number of response sper prompt."},
)
is_reference_free: bool = field(
default=False,
metadata={
"help": "Whether to use reference-free DPO training."
}
metadata={"help": "Number of responses per prompt."},
)
beta: float = field(
default=0.1, metadata={"help": "KL penalty coefficient."}