Skip to content

Commit 6395477

Browse files
committed
Work on llama-stack eval tests
1 parent 7223766 commit 6395477

2 files changed

Lines changed: 5 additions & 4 deletions

File tree

tests/llama_stack/conftest.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -84,7 +84,7 @@ def llama_stack_server_config(
 84  84    "name": "llama-stack",
 85  85    "port": 8321,
 86  86    },
 87      - "distribution": {"image": "quay.io/ruimvieira/llama-stack-odh:latest"},
     87  + "distribution": {"image": "quay.io/ruimvieira/llama-stack-lmeval-fix:latest"},
 88  88    "storage": {
 89  89    "size": "20Gi",
 90  90    },

tests/llama_stack/eval/test_lmeval_provider.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,8 @@ def test_lmeval_register_benchmark(self, llama_stack_client):
 38  38    dataset_id=trustyai_lmeval_arc_easy,
 39  39    scoring_functions=["string"],
 40  40    provider_id=LlamaStackProviders.Eval.TRUSTYAI_LMEVAL,
 41      - metadata={"tokenized_request": False, "tokenizer": "google/flan-t5-small"},
     41  + provider_benchmark_id="string",
     42  + metadata={"tokenized_requests": False, "tokenizer": "google/flan-t5-small"},
 42  43    )
 43  44
 44  45    benchmarks = llama_stack_client.benchmarks.list()
@@ -52,12 +53,12 @@ def test_llamastack_run_eval(self, patched_trustyai_operator_configmap_allow_onl
 52  53    benchmark_id=f"{LlamaStackProviders.Eval.TRUSTYAI_LMEVAL}::arc_easy",
 53  54    benchmark_config={
 54  55    "eval_candidate": {
 55      - "type": "model",
 56  56    "model": "qwen",
     57  + "type": "model",
 57  58    "provider_id": LlamaStackProviders.Eval.TRUSTYAI_LMEVAL,
 58  59    "sampling_params": {"temperature": 0.7, "top_p": 0.9, "max_tokens": 256},
 59  60    },
 60      - "num_examples": 10,
     61  + "num_examples": 100,
 61  62    },
 62  63    )
 63  64

0 commit comments

Comments
 (0)