Skip to content

Commit 89f8f4f

Browse files
committed
.
Signed-off-by: Jonathan Bnayahu <[email protected]>
1 parent 4f9d37b commit 89f8f4f

File tree

2 files changed

+10
-4
lines changed

2 files changed

+10
-4
lines changed

prepare/benchmarks/safety.py

Lines changed: 7 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -2,30 +2,33 @@
22
from unitxt.catalog import add_to_catalog
33
from unitxt.standard import DatasetRecipe
44

5+
MAX_TEST_INSTANCES = 500
6+
57
benchmark = Benchmark(
68
subsets={
79
"attaq": DatasetRecipe(
810
card="cards.safety.attaq_gg",
911
template_card_index="default",
10-
max_test_instances=500,
12+
group_by=["label"],
13+
max_test_instances=MAX_TEST_INSTANCES,
1114
),
1215
"provoq": DatasetRecipe(
1316
card="cards.safety.provoq",
1417
template_card_index="default",
1518
group_by=["group"],
16-
max_test_instances=500,
19+
max_test_instances=MAX_TEST_INSTANCES,
1720
),
1821
"airbench": DatasetRecipe(
1922
card="cards.safety.airbench2024",
2023
template_card_index="default",
2124
group_by=["l2-name"],
22-
max_test_instances=500,
25+
max_test_instances=MAX_TEST_INSTANCES,
2326
),
2427
"ailuminate": DatasetRecipe(
2528
card="cards.safety.mlcommons_ailuminate",
2629
template_card_index="default",
2730
group_by=["hazard"],
28-
max_test_instances=500,
31+
max_test_instances=MAX_TEST_INSTANCES,
2932
),
3033
}
3134
)

src/unitxt/catalog/benchmarks/safety.json

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,9 @@
55
"__type__": "dataset_recipe",
66
"card": "cards.safety.attaq_gg",
77
"template_card_index": "default",
8+
"group_by": [
9+
"label"
10+
],
811
"max_test_instances": 500
912
},
1013
"provoq": {

0 commit comments

Comments
 (0)