From de20acb2a05e82da39b8ce63adb3d3f56a9b546e Mon Sep 17 00:00:00 2001 From: Dongfu Jiang Date: Mon, 1 Apr 2024 10:59:06 +0800 Subject: [PATCH] update --- .gitmodules | 5 ++++- train_ranker.sh | 2 +- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/.gitmodules b/.gitmodules index 9346233..ed0c7d0 100644 --- a/.gitmodules +++ b/.gitmodules @@ -1,3 +1,6 @@ [submodule "data/UnifiedFeedback"] path = data/UnifiedFeedback - url = https://github.com/jdf-prog/UnifiedFeedback.git + url = https://github.com/jdf-prog/UnifiedFeedback +[submodule "hf_space/LLM-Blender"] + path = hf_space/LLM-Blender + url = https://huggingface.co/spaces/llm-blender/LLM-Blender diff --git a/train_ranker.sh b/train_ranker.sh index 5d6af0a..eb1d56f 100755 --- a/train_ranker.sh +++ b/train_ranker.sh @@ -15,7 +15,7 @@ dataset="UnifiedFeedback" eval_dataset="reward_bench" backbone_type="phi" # "deberta" or "roberta" backbone_name="microsoft/phi-2" # "microsoft/deberta-v3-large" or "roberta-large" -n_gpu=4 +n_gpu=8 ranker="PairRanker" # "PairRanker" or "Summareranker" or "SimCLS" candidate_model="" # separted by comma. Empty string for all models candidate_decoding_method="" # separted by comma. Empty string for all methods