diff --git a/README.md b/README.md index 5528b25..b71d662 100644 --- a/README.md +++ b/README.md @@ -129,7 +129,7 @@ WANDB_ENTITY= WANDB_PROJECT= pytho [--model-list ] ``` -By default, the entity is configured to use your username, and the project name is set to `ja-vicuna-qa-benchmark`. +By default, the entity is configured to use your username, and the project name is set to `ja-vicuna-qa-benchmark-dev`. ## Sample Outputs diff --git a/llm_judge/upload_result.py b/llm_judge/upload_result.py index 95e7de3..bdbf096 100644 --- a/llm_judge/upload_result.py +++ b/llm_judge/upload_result.py @@ -59,7 +59,7 @@ def upload_results( results: A list of results. baseline_model: Baseline model name. Only used in `pairwise-baseline` mode. """ - project = os.getenv("WANDB_PROJECT", "ja-vicuna-qa-benchmark") + project = os.getenv("WANDB_PROJECT", "ja-vicuna-qa-benchmark-dev") if len(results) == 0: logger.warning(f"No results found for {result_id}") return