Skip to content

Commit

Permalink
⚗️ Style Transfer: add experiments
Browse files Browse the repository at this point in the history
  • Loading branch information
simonmeoni committed Nov 7, 2024
1 parent 83a4740 commit 8012adc
Show file tree
Hide file tree
Showing 2 changed files with 30 additions and 0 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
# Experiment launcher: runs style_transfer/run_rb_gen.py for
# meta-llama/Llama-3.2-3B-Instruct with dataset.sft_dataset=null and
# dpo.training_args.num_train_epochs=10.
#
# Usage: <this script> <gpu-ids>
#   $1 - value exported as CUDA_VISIBLE_DEVICES. When omitted, the variable
#        is still exported, as an empty string.
CUDA_VISIBLE_DEVICES=$1
export CUDA_VISIBLE_DEVICES

# $1 has been consumed above, so the positional parameters are reused to hold
# the key=value arguments, in the exact order they are handed to the script.
# The target_modules list stays single-quoted so it reaches Python as one
# argument with its brackets, spaces and double quotes intact.
set -- \
  model.name=meta-llama/Llama-3.2-3B-Instruct \
  model.peft_config.target_modules='["q_proj", "k_proj", "v_proj", "o_proj", "gate_proj", "up_proj", "down_proj"]' \
  dataset.name=bio-datasets/mimic-iii-gpt4o-tokens \
  max_steps=5 \
  dataset.num_generated_samples=3500 \
  score.model.model_name_or_path=sentence-transformers/all-mpnet-base-v2 \
  dataset.sft_ratio=0.06 \
  dataset.gen_ratio=0.7 \
  dataset.sft_dataset=null \
  sft.training_args.eval_steps=30 \
  score.train.train_size=0.6 \
  dpo.training_args.num_train_epochs=10 \
  dpo.percentile=70 \
  score.batch_size=8

python style_transfer/run_rb_gen.py "$@"
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
# Experiment launcher: runs style_transfer/run_rb_gen.py for
# meta-llama/Llama-3.2-3B-Instruct with dataset.sft_dataset.size=977 and
# dpo.training_args.num_train_epochs=20.
#
# Usage: <this script> <gpu-ids>
#   $1 - value exported as CUDA_VISIBLE_DEVICES. When omitted, the variable
#        is still exported, as an empty string.
CUDA_VISIBLE_DEVICES=$1
export CUDA_VISIBLE_DEVICES

# $1 has been consumed above, so the positional parameters are reused to hold
# the key=value arguments, in the exact order they are handed to the script.
# The target_modules list stays single-quoted so it reaches Python as one
# argument with its brackets, spaces and double quotes intact.
set -- \
  model.name=meta-llama/Llama-3.2-3B-Instruct \
  model.peft_config.target_modules='["q_proj", "k_proj", "v_proj", "o_proj", "gate_proj", "up_proj", "down_proj"]' \
  dataset.name=bio-datasets/mimic-iii-gpt4o-tokens \
  max_steps=5 \
  dataset.num_generated_samples=3500 \
  score.model.model_name_or_path=sentence-transformers/all-mpnet-base-v2 \
  dataset.sft_ratio=0.06 \
  dataset.gen_ratio=0.7 \
  sft.training_args.eval_steps=30 \
  score.train.train_size=0.6 \
  dataset.sft_dataset.size=977 \
  dpo.training_args.num_train_epochs=20 \
  dpo.percentile=70 \
  score.batch_size=8

python style_transfer/run_rb_gen.py "$@"

0 comments on commit 8012adc

Please sign in to comment.