Skip to content

Commit ba93c73

Browse files
committed
CALM -> CLAM
1 parent ba2d622 commit ba93c73

1 file changed

Lines changed: 20 additions & 20 deletions

File tree

llm/summarize_results.py

Lines changed: 20 additions & 20 deletions
Original file line number | Diff line number | Diff line change
@@ -113,7 +113,7 @@ def shorten_model_label(label: str) -> str:
113113
"flores_ca2en": 0.0, # BLEU/100 → 0..1
114114
}
115115

116-
CALM_TASKS = list(RANDOM_BASELINES.keys())
116+
CLAM_TASKS = list(RANDOM_BASELINES.keys())
117117

118118
COLUMN_LABELS = {
119119
"model": "Model",
@@ -126,7 +126,7 @@ def shorten_model_label(label: str) -> str:
126126
"casum_rougeL": "CaSum",
127127
"flores_en2ca": "EN→CA",
128128
"flores_ca2en": "CA→EN",
129-
"calm_pct": "CALM%",
129+
"clam_pct": "CLAM%",
130130
}
131131

132132

@@ -148,9 +148,9 @@ def normalize_score(key: str, raw) -> float | None:
148148
return max(0.0, min(1.0, normalized))
149149

150150

151-
def calm_score(metrics: dict) -> float | None:
152-
"""Compute CALM composite score (0–100) as mean of normalized task scores."""
153-
normalized = [normalize_score(k, metrics.get(k)) for k in CALM_TASKS]
151+
def clam_score(metrics: dict) -> float | None:
152+
"""Compute CLAM composite score (0–100) as mean of normalized task scores."""
153+
normalized = [normalize_score(k, metrics.get(k)) for k in CLAM_TASKS]
154154
valid = [v for v in normalized if v is not None]
155155
if not valid:
156156
return None
@@ -207,14 +207,14 @@ def fmt_pct(value) -> str:
207207
</tbody>
208208
</table>
209209
210-
<h2>Normalized scores (HF Open LLM v2) + CALM composite</h2>
210+
<h2>Normalized scores (HF Open LLM v2) + CLAM composite</h2>
211211
<table>
212212
<thead>
213213
<tr>
214214
<th>Model</th>
215215
<th>Params (mem)</th>
216216
{% for col in norm_cols %}<th>{{ col }}</th>{% endfor %}
217-
<th>CALM%</th>
217+
<th>CLAM%</th>
218218
</tr>
219219
</thead>
220220
<tbody>
@@ -223,7 +223,7 @@ def fmt_pct(value) -> str:
223223
<td>{% if cloud %}<b>{{ label }}</b>{% else %}{{ label }}{% endif %}</td>
224224
<td>{{ row | fmt_params }}</td>
225225
{% for col in norm_cols %}<td>{{ metrics.get(col) | norm(col) | fmt }}</td>{% endfor %}
226-
<td>{{ metrics | calm }}</td>
226+
<td>{{ metrics | clam }}</td>
227227
</tr>
228228
{% endfor %}
229229
</tbody>
@@ -238,7 +238,7 @@ def render_html(rows: list, all_metric_keys: list, norm_keys: list, fmt_params_f
238238
env = Environment()
239239
env.filters["fmt"] = fmt
240240
env.filters["norm"] = lambda value, key: normalize_score(key, value)
241-
env.filters["calm"] = lambda metrics: fmt_pct(calm_score(metrics))
241+
env.filters["clam"] = lambda metrics: fmt_pct(clam_score(metrics))
242242
env.filters["fmt_params"] = lambda row: fmt_params_fn(row[3], row[4])
243243
template = env.from_string(HTML_TEMPLATE_SRC)
244244
return template.render(rows=rows, raw_cols=all_metric_keys, norm_cols=norm_keys)
@@ -270,8 +270,8 @@ def main():
270270
print("No result files found.")
271271
return
272272

273-
# Sort rows by CALM score descending
274-
rows.sort(key=lambda r: calm_score(r[1]) or -1.0, reverse=True)
273+
# Sort rows by CLAM score descending
274+
rows.sort(key=lambda r: clam_score(r[1]) or -1.0, reverse=True)
275275

276276
def fmt_params(params_b, memory_gb) -> str:
277277
if params_b is None:
@@ -295,30 +295,30 @@ def fmt_params(params_b, memory_gb) -> str:
295295
print(f"{label:<{label_width}}{fmt_params(params_b, memory_gb):>{params_col_w}}{row}")
296296
print(separator)
297297

298-
# ── Normalized scores + CALM composite table ──────────────────────────────
299-
norm_keys = [k for k in CALM_TASKS if k in all_metric_keys]
298+
# ── Normalized scores + CLAM composite table ──────────────────────────────
299+
norm_keys = [k for k in CLAM_TASKS if k in all_metric_keys]
300300
norm_col_w = max(14, max(len(k) for k in norm_keys) + 2)
301-
calm_col_w = 10
301+
clam_col_w = 10
302302
norm_label_w = label_width
303303

304304
norm_header = (
305305
f"{'Model':<{norm_label_w}}"
306306
+ f"{'Params (mem)':>{params_col_w}}"
307307
+ "".join(f"{k:>{norm_col_w}}" for k in norm_keys)
308-
+ f"{'CALM%':>{calm_col_w}}"
308+
+ f"{'CLAM%':>{clam_col_w}}"
309309
)
310310
norm_sep = "-" * len(norm_header)
311311

312-
print("\nNormalized scores (HF Open LLM v2) + CALM composite")
312+
print("\nNormalized scores (HF Open LLM v2) + CLAM composite")
313313
print(norm_sep)
314314
print(norm_header)
315315
print(norm_sep)
316316
for label, metrics, _cloud, params_b, memory_gb in rows:
317317
norm_row = "".join(
318318
f"{fmt(normalize_score(k, metrics.get(k))):>{norm_col_w}}" for k in norm_keys
319319
)
320-
calm = fmt_pct(calm_score(metrics))
321-
print(f"{label:<{norm_label_w}}{fmt_params(params_b, memory_gb):>{params_col_w}}{norm_row}{calm:>{calm_col_w}}")
320+
clam = fmt_pct(clam_score(metrics))
321+
print(f"{label:<{norm_label_w}}{fmt_params(params_b, memory_gb):>{params_col_w}}{norm_row}{clam:>{clam_col_w}}")
322322
print(norm_sep)
323323

324324
# ── HTML export ───────────────────────────────────────────────────────────
@@ -333,7 +333,7 @@ def fmt_params(params_b, memory_gb) -> str:
333333
"params_b": COLUMN_LABELS["params_b"],
334334
"memory_gb": COLUMN_LABELS["memory_gb"],
335335
**{k: COLUMN_LABELS.get(k, k) for k in norm_keys},
336-
"calm_pct": COLUMN_LABELS["calm_pct"],
336+
"clam_pct": COLUMN_LABELS["clam_pct"],
337337
}
338338
json_rows = []
339339
for label, metrics, cloud, params_b, memory_gb in rows:
@@ -343,7 +343,7 @@ def fmt_params(params_b, memory_gb) -> str:
343343
"params_b": params_b,
344344
"memory_gb": memory_gb,
345345
**{k: round(normalize_score(k, metrics.get(k)), 4) if normalize_score(k, metrics.get(k)) is not None else None for k in norm_keys},
346-
"calm_pct": round(calm_score(metrics), 2) if calm_score(metrics) is not None else None,
346+
"clam_pct": round(clam_score(metrics), 2) if clam_score(metrics) is not None else None,
347347
}
348348
json_rows.append(entry)
349349
json_path = Path(args.json_norm)

0 commit comments

Comments
 (0)