From 5dc268fe26d7c7c05b42189b967ac9e7b5bc3673 Mon Sep 17 00:00:00 2001 From: timovdk <5330531+timovdk@users.noreply.github.com> Date: Wed, 5 Feb 2025 16:57:05 +0100 Subject: [PATCH] setup mxbai study --- asreview2-optuna/main.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/asreview2-optuna/main.py b/asreview2-optuna/main.py index 1487297..889367f 100644 --- a/asreview2-optuna/main.py +++ b/asreview2-optuna/main.py @@ -21,7 +21,7 @@ # Study variables VERSION = 1 METRIC = "ndcg" # Options: "loss", "ndcg" -STUDY_SET = "full" +STUDY_SET = "demo" CLASSIFIER_TYPE = "xgboost" # Options: "nb", "log", "svm", "rf", "xgboost" FEATURE_EXTRACTOR_TYPE = "mxbai" # Options: "tfidf", "onehot", "labse", "bge-m3", "stella", "mxbai" PICKLE_FOLDER_PATH = Path("synergy-dataset", f"pickles_{FEATURE_EXTRACTOR_TYPE}") @@ -248,7 +248,7 @@ def download_pickles(report_order): if __name__ == "__main__": # list of studies - studies = pd.read_json(f"synergy_studies_{STUDY_SET}.jsonl", lines=True).head(1) + studies = pd.read_json(f"synergy_studies_{STUDY_SET}.jsonl", lines=True) report_order = sorted(set(studies["dataset_id"])) if PRE_PROCESSED_FMS: