Skip to content

Commit

Permalink
⚗️ Style Transfer: new hyperparams
Browse files — browse the repository at this point in the history
  • Loading branch information
simonmeoni committed Nov 4, 2024
1 parent c456dc0 commit 4d4cb2e
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 5 deletions.
3 changes: 2 additions & 1 deletion lib/style-transfer/configs/rb_gen/dpo/default.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ training_args:
save_steps: 50
gradient_accumulation_steps: 16
gradient_checkpointing: false
- learning_rate: 4e-6
+ learning_rate: 5e-6
weight_decay: 1e-7
eval_strategy: "no"
num_train_epochs: 5
Expand All @@ -19,6 +19,7 @@ training_args:
max_length: 1024
max_prompt_length: 512
report_to: "none"
+ beta: 0.1

beta: 0.1
checkpoint: null
Expand Down
8 changes: 4 additions & 4 deletions lib/style-transfer/configs/rb_gen/score/default.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -6,10 +6,10 @@ model:
model_name_or_path: "sentence-transformers/all-mpnet-base-v2"

train:
- warmup_steps: 10
+ warmup_steps: 50
use_ground_truth: true
- epochs: 5
- train_size: 0.3
+ epochs: 2
+ train_size: 0.6
loss:
- _target_: sentence_transformers.losses.ContrastiveTensionLoss
+ _target_: sentence_transformers.losses.ContrastiveLoss
_partial_: true

0 comments on commit 4d4cb2e

Please sign in to comment.