Skip to content

Commit d56baa8

Browse files
authored
change: change model and group tasks in LMEval HF tests (#394)
1 parent 288178a commit d56baa8

File tree

2 files changed

+4 -14 lines changed

tests/model_explainability/lm_eval/conftest.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ def lmevaljob_hf(
35 | 35 |   name=LMEVALJOB_NAME,
36 | 36 |   namespace=model_namespace.name,
37 | 37 |   model="hf",
38 |    | - model_args=[{"name": "pretrained", "value": "Qwen/Qwen2.5-0.5B-Instruct"}],
   | 38 | + model_args=[{"name": "pretrained", "value": "rgeada/tiny-untrained-granite"}],
39 | 39 |   task_list=request.param.get("task_list"),
40 | 40 |   log_samples=True,
41 | 41 |   allow_online=True,

tests/model_explainability/lm_eval/test_lm_eval.py

Lines changed: 3 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -10,19 +10,9 @@
10 | 10 |   "model_namespace, lmevaljob_hf",
11 | 11 |   [
12 | 12 |   pytest.param(
13 |    | - {"name": "test-lmeval-hf-arc"}, {"task_list": {"taskNames": ["arc_challenge"]}}, id="arc_challenge"
14 |    | - ),
15 |    | - pytest.param(
16 |    | - {"name": "test-lmeval-hf-mmlu"},
17 |    | - {"task_list": {"taskNames": ["mmlu_astronomy_generative"]}},
18 |    | - id="mmlu_astronomy_generative",
19 |    | - ),
20 |    | - pytest.param({"name": "test-lmeval-hf-hellaswag"}, {"task_list": {"taskNames": ["hellaswag"]}}, id="hellaswag"),
21 |    | - pytest.param(
22 |    | - {"name": "test-lmeval-hf-truthfulqa"}, {"task_list": {"taskNames": ["truthfulqa_gen"]}}, id="truthfulqa_gen"
23 |    | - ),
24 |    | - pytest.param(
25 |    | - {"name": "test-lmeval-hf-winogrande"}, {"task_list": {"taskNames": ["winogrande"]}}, id="winogrande"
   | 13 | + {"name": "test-lmeval-hf-tasks"},
   | 14 | + {"task_list": {"taskNames": ["arc_challenge", "mmlu_astronomy", "hellaswag", "truthfulqa", "winogrande"]}},
   | 15 | + id="popular_tasks",
26 | 16 |   ),
27 | 17 |   pytest.param(
28 | 18 |   {"name": "test-lmeval-hf-custom-task"},

0 commit comments

Comments
 (0)