Skip to content

Commit

Permalink
Remove train sets temporarily
Browse files: browse the repository at this point in the history
  • Loading branch information
liujch1998 committed Dec 19, 2024
1 parent ba30253 commit 0ae766e
Show file tree
Hide file tree
Showing 37 changed files with 0 additions and 94 deletions.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.

This file was deleted.

Binary file not shown.
76 changes: 0 additions & 76 deletions src/olmo_eval/tasks.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -1893,18 +1893,6 @@ def doc_to_label(self, doc) -> int:
# Train and test sets are added when applicable.
# No subsampling happens in these sets.
label_to_task_map_new = {
"arc_challenge_train_rc_5shot": (
OEEvalTask,
{
"dataset_path": "arc_challenge",
"dataset_name": "train_rc_5shot",
"metric_type": "len_norm",
},
),
"arc_challenge_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "arc_challenge", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"arc_challenge_val_rc_5shot": (
OEEvalTask,
{
Expand All @@ -1929,14 +1917,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "arc_challenge", "dataset_name": "test_mc_5shot", "metric_type": "acc"},
),
"arc_easy_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "arc_easy", "dataset_name": "train_rc_5shot", "metric_type": "len_norm"},
), # this used to be acc
"arc_easy_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "arc_easy", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"arc_easy_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "arc_easy", "dataset_name": "val_rc_5shot", "metric_type": "len_norm"},
Expand All @@ -1953,14 +1933,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "arc_easy", "dataset_name": "test_mc_5shot", "metric_type": "acc"},
),
"boolq_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "boolq", "dataset_name": "train_rc_5shot", "metric_type": "acc"},
), # kept acc here, since len_norm can bias towards "yes"
"boolq_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "boolq", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"boolq_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "boolq", "dataset_name": "val_rc_5shot", "metric_type": "acc"},
Expand All @@ -1969,14 +1941,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "boolq", "dataset_name": "val_mc_5shot", "metric_type": "acc"},
),
"csqa_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "csqa", "dataset_name": "train_rc_5shot", "metric_type": "len_norm"},
),
"csqa_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "csqa", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"csqa_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "csqa", "dataset_name": "val_rc_5shot", "metric_type": "len_norm"},
Expand All @@ -1985,14 +1949,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "csqa", "dataset_name": "val_mc_5shot", "metric_type": "acc"},
),
"hellaswag_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "hellaswag", "dataset_name": "train_rc_5shot", "metric_type": "len_norm"},
),
"hellaswag_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "hellaswag", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"hellaswag_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "hellaswag", "dataset_name": "val_rc_5shot", "metric_type": "len_norm"},
Expand All @@ -2001,14 +1957,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "hellaswag", "dataset_name": "val_mc_5shot", "metric_type": "acc"},
),
"openbookqa_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "openbookqa", "dataset_name": "train_rc_5shot", "metric_type": "len_norm"},
),
"openbookqa_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "openbookqa", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"openbookqa_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "openbookqa", "dataset_name": "val_rc_5shot", "metric_type": "len_norm"},
Expand All @@ -2025,14 +1973,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "openbookqa", "dataset_name": "test_mc_5shot", "metric_type": "acc"},
),
"piqa_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "piqa", "dataset_name": "train_rc_5shot", "metric_type": "len_norm"},
),
"piqa_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "piqa", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"piqa_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "piqa", "dataset_name": "val_rc_5shot", "metric_type": "len_norm"},
Expand All @@ -2041,14 +1981,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "piqa", "dataset_name": "val_mc_5shot", "metric_type": "acc"},
),
"socialiqa_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "socialiqa", "dataset_name": "train_rc_5shot", "metric_type": "len_norm"},
),
"socialiqa_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "socialiqa", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"socialiqa_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "socialiqa", "dataset_name": "val_rc_5shot", "metric_type": "len_norm"},
Expand All @@ -2057,14 +1989,6 @@ def doc_to_label(self, doc) -> int:
OEEvalTask,
{"dataset_path": "socialiqa", "dataset_name": "val_mc_5shot", "metric_type": "acc"},
),
"winogrande_train_rc_5shot": (
OEEvalTask,
{"dataset_path": "winogrande", "dataset_name": "train_rc_5shot", "metric_type": "len_norm"},
), # this used to be acc
"winogrande_train_mc_5shot": (
OEEvalTask,
{"dataset_path": "winogrande", "dataset_name": "train_mc_5shot", "metric_type": "acc"},
),
"winogrande_val_rc_5shot": (
OEEvalTask,
{"dataset_path": "winogrande", "dataset_name": "val_rc_5shot", "metric_type": "len_norm"},
Expand Down

0 comments on commit 0ae766e

Please sign in to comment.