Skip to content

Commit

Permalink
rename PairRM to PairRM 0.4B
Browse files Browse the repository at this point in the history
  • Loading branch information
jdf-prog committed Jan 17, 2024
1 parent 495b606 commit 3bfb48b
Show file tree
Hide file tree
Showing 3 changed files with 3 additions and 3 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -12,5 +12,5 @@ pairrm-tulu-2-13b:
do_sample: False
best_of: 16 # number of completions to generate, using PairRM to select the best one
batch_size: 800
- pretty_name: "PairRM+Tulu 2+DPO 13B (best-of-16)"
+ pretty_name: "PairRM 0.4B+Tulu 2+DPO 13B (best-of-16)"
link: "https://huggingface.co/llm-blender/PairRM"
Original file line number Diff line number Diff line change
Expand Up @@ -12,5 +12,5 @@ pairrm-tulu-2-70b:
do_sample: False
best_of: 16 # number of completions to generate, using PairRM to select the best one
batch_size: 800
- pretty_name: "PairRM+Tulu 2+DPO 70B (best-of-16)"
+ pretty_name: "PairRM 0.4B+Tulu 2+DPO 70B (best-of-16)"
link: "https://huggingface.co/llm-blender/PairRM"
Original file line number Diff line number Diff line change
Expand Up @@ -10,5 +10,5 @@ pairrm-zephyr-7b-beta:
top_p: 1.0
do_sample: True
best_of: 16 # number of completions to generate, using PairRM to select the best one
- pretty_name: "PairRM+Zephyr 7B Beta (best-of-16)"
+ pretty_name: "PairRM 0.4B+Zephyr 7B Beta (best-of-16)"
link: "https://huggingface.co/llm-blender/PairRM"

0 comments on commit 3bfb48b

Please sign in to comment.