forked from EvolvingLMMs-Lab/lmms-eval
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathopenrouter_mme_stats.sh
More file actions
34 lines (28 loc) · 1.08 KB
/
Copy pathopenrouter_mme_stats.sh
File metadata and controls
34 lines (28 loc) · 1.08 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
#!/bin/bash
set -euo pipefail

# Quick OpenRouter + MME evaluation run (simple version).
#
# Every setting is read from the environment and falls back to a default
# when unset or empty:
#   HF_HOME          cache directory (default: $HOME/.cache/huggingface)
#   OPENAI_API_KEY   API key; taken from OPENROUTER_API_KEY when not provided
#   OPENAI_API_BASE  API endpoint (default: https://openrouter.ai/api/v1)
#   MODEL_VERSION    model identifier forwarded through --model_args
#   TASKS            value for --tasks (default: mme)
#   REPEATS          value for --repeats (default: 1); per the original header
#                    note, stability metrics appear when REPEATS > 1
#   LIMIT            value for --limit (default: -1); per the original header
#                    note, the default uses all samples
#   BATCH_SIZE       value for --batch_size (default: 1)
#   OUTPUT_PATH      value for --output_path
#   VERBOSITY        value for --verbosity (default: INFO)

# --- exported settings ------------------------------------------------------
: "${HF_HOME:=$HOME/.cache/huggingface}"
export HF_HOME

# An already-populated OPENAI_API_KEY is kept as-is; otherwise the key must
# come from OPENROUTER_API_KEY, and the script aborts with the message below
# when that one is missing too.
# NOTE(review): a pre-existing OPENAI_API_KEY wins over OPENROUTER_API_KEY
# while the endpoint defaults to OpenRouter — confirm that precedence is wanted.
if [[ -z "${OPENAI_API_KEY:-}" ]]; then
  OPENAI_API_KEY="${OPENROUTER_API_KEY:?Error: OPENROUTER_API_KEY not set in environment}"
fi
export OPENAI_API_KEY

: "${OPENAI_API_BASE:=https://openrouter.ai/api/v1}"
export OPENAI_API_BASE

# --- run parameters (script-local unless inherited from the environment) -----
: "${MODEL_VERSION:=mistralai/ministral-3b-2512}"
: "${TASKS:=mme}"
: "${REPEATS:=1}"
: "${LIMIT:=-1}"
: "${BATCH_SIZE:=1}"
: "${OUTPUT_PATH:=./logs/openrouter_mme_stats/}"
: "${VERBOSITY:=INFO}"

# --- banner -----------------------------------------------------------------
# One printf call; the format string is reused for each argument, so this
# emits three lines.
printf '%s\n' \
  "[INFO] OpenRouter MME test" \
  "[INFO] model=${MODEL_VERSION} tasks=${TASKS} repeats=${REPEATS} limit=${LIMIT}" \
  "[INFO] output_path=${OUTPUT_PATH}"

# --- evaluation ---------------------------------------------------------------
# Arguments are collected in an array so each value stays a single word
# regardless of its content.
eval_args=(
  --model openai
  --model_args "model_version=${MODEL_VERSION}"
  --tasks "${TASKS}"
  --batch_size "${BATCH_SIZE}"
  --repeats "${REPEATS}"
  --limit "${LIMIT}"
  --output_path "${OUTPUT_PATH}"
  --log_samples
  --verbosity "${VERBOSITY}"
)

# Last command of the script: its exit status becomes the script's status.
python3 -m lmms_eval "${eval_args[@]}"