Skip to content

Commit

Permalink
Improve stability: change default hyperparameters
Browse files Browse the repository at this point in the history
  • Loading branch information
vwxyzjn committed Jun 23, 2023
1 parent 0161a8e commit b56e8b3
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions examples/sentiment/scripts/gpt2-sentiment.py
Original file line number Diff line number Diff line change
Expand Up @@ -60,13 +60,13 @@ class ScriptArguments:
model_name: Optional[str] = field(default="lvwerra/gpt2-imdb", metadata={"help": "the model name"})
log_with: Optional[str] = field(default=None, metadata={"help": "use 'wandb' to log with wandb"})
learning_rate: Optional[float] = field(default=1.41e-5, metadata={"help": "the learning rate"})
- mini_batch_size: Optional[int] = field(default=16, metadata={"help": "the PPO minibatch size"})
- batch_size: Optional[int] = field(default=256, metadata={"help": "the batch size"})
+ mini_batch_size: Optional[int] = field(default=128, metadata={"help": "the PPO minibatch size"})
+ batch_size: Optional[int] = field(default=128, metadata={"help": "the batch size"})
gradient_accumulation_steps: Optional[int] = field(
default=1, metadata={"help": "the number of gradient accumulation steps"}
)
early_stopping: Optional[bool] = field(default=False, metadata={"help": "whether to early stop"})
- target_kl: Optional[float] = field(default=0.1, metadata={"help": "kl target for early stopping"})
+ target_kl: Optional[float] = field(default=6, metadata={"help": "kl target for early stopping"})


parser = HfArgumentParser(ScriptArguments)
Expand Down

0 comments on commit b56e8b3

Please sign in to comment.