Skip to content

Commit 88e8a02

Browse files
author
lalalune
committed
updates
1 parent ee06045 commit 88e8a02

13 files changed

Lines changed: 131 additions & 14 deletions

File tree

packages/agent/src/api/conversation-routes.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1340,7 +1340,7 @@ export async function handleConversationRoutes(
13401340
if (aborted) break;
13411341
streamedText += chunk;
13421342
writeChatTokenSse(res, chunk, streamedText);
1343-
await new Promise((resolve) => setTimeout(resolve, 15));
1343+
await new Promise((resolve) => setTimeout(resolve, 60));
13441344
}
13451345
}
13461346
// Emit `done` BEFORE persistence so user-perceived end-of-turn

packages/benchmarks/abliteration-robustness/cli.py

Lines changed: 47 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -192,14 +192,41 @@ def _make_harness_client(harness: str, args: argparse.Namespace):
192192
_ensure_adapter_path("hermes-adapter")
193193
from hermes_adapter.client import HermesClient # noqa: WPS433
194194

195-
client = HermesClient(provider=provider, model=model, base_url=args.base_url)
195+
client = HermesClient(
196+
provider=provider,
197+
model=model,
198+
base_url=args.base_url
199+
or os.environ.get("BENCHMARK_BASE_URL")
200+
or os.environ.get("OPENAI_BASE_URL")
201+
or os.environ.get("CEREBRAS_BASE_URL")
202+
or None,
203+
mode=(os.environ.get("HERMES_MODE") or "in_process").strip()
204+
or "in_process",
205+
timeout_s=float(os.environ.get("HERMES_TIMEOUT_S", "120")),
206+
reasoning_effort=os.environ.get("BENCHMARK_REASONING_EFFORT")
207+
or os.environ.get("CEREBRAS_REASONING_EFFORT")
208+
or None,
209+
)
196210
client.wait_until_ready(timeout=120)
197211
return client
198212
if harness == "openclaw":
199213
_ensure_adapter_path("openclaw-adapter")
200214
from openclaw_adapter.client import OpenClawClient # noqa: WPS433
201215

202-
client = OpenClawClient(provider=provider, model=model, base_url=args.base_url)
216+
client = OpenClawClient(
217+
provider=provider,
218+
model=model,
219+
base_url=args.base_url
220+
or os.environ.get("BENCHMARK_BASE_URL")
221+
or os.environ.get("OPENAI_BASE_URL")
222+
or os.environ.get("CEREBRAS_BASE_URL")
223+
or None,
224+
timeout_s=float(os.environ.get("OPENCLAW_TIMEOUT_S", "120")),
225+
reasoning_effort=os.environ.get("BENCHMARK_REASONING_EFFORT")
226+
or os.environ.get("CEREBRAS_REASONING_EFFORT")
227+
or None,
228+
direct_openai_compatible=True,
229+
)
203230
client.wait_until_ready(timeout=120)
204231
return client
205232
raise SystemExit(f"unknown harness {harness!r}")
@@ -244,11 +271,25 @@ def _generate(client, model: str, prompt: str, max_tokens: int, temperature: flo
244271
},
245272
)
246273
return str(getattr(response, "text", "") or "")
274+
kwargs: dict[str, object] = {
275+
"model": model,
276+
"messages": [{"role": "user", "content": prompt}],
277+
"max_tokens": max_tokens,
278+
"temperature": temperature,
279+
}
280+
reasoning_effort = (
281+
os.environ.get("BENCHMARK_REASONING_EFFORT")
282+
or os.environ.get("CEREBRAS_REASONING_EFFORT")
283+
or os.environ.get("OPENAI_REASONING_EFFORT")
284+
)
285+
if (
286+
isinstance(reasoning_effort, str)
287+
and reasoning_effort.strip()
288+
and model.rsplit("/", 1)[-1].startswith("gpt-oss")
289+
):
290+
kwargs["extra_body"] = {"reasoning_effort": reasoning_effort.strip()}
247291
resp = client.chat.completions.create(
248-
model=model,
249-
messages=[{"role": "user", "content": prompt}],
250-
max_tokens=max_tokens,
251-
temperature=temperature,
292+
**kwargs,
252293
)
253294
return resp.choices[0].message.content or ""
254295

packages/benchmarks/standard/_base.py

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -261,13 +261,32 @@ def __init__(self, *, harness: str, endpoint: str, api_key: str) -> None:
261261
self._client = HermesClient(
262262
provider=os.environ.get("BENCHMARK_MODEL_PROVIDER", "cerebras"),
263263
model=os.environ.get("BENCHMARK_MODEL_NAME", "gpt-oss-120b"),
264+
base_url=os.environ.get("BENCHMARK_BASE_URL")
265+
or os.environ.get("OPENAI_BASE_URL")
266+
or os.environ.get("CEREBRAS_BASE_URL")
267+
or None,
268+
mode=(os.environ.get("HERMES_MODE") or "in_process").strip()
269+
or "in_process",
270+
timeout_s=float(os.environ.get("HERMES_TIMEOUT_S", "120")),
271+
reasoning_effort=os.environ.get("BENCHMARK_REASONING_EFFORT")
272+
or os.environ.get("CEREBRAS_REASONING_EFFORT")
273+
or None,
264274
)
265275
elif harness == "openclaw":
266276
from openclaw_adapter.client import OpenClawClient # noqa: WPS433
267277

268278
self._client = OpenClawClient(
269279
provider=os.environ.get("BENCHMARK_MODEL_PROVIDER", "cerebras"),
270280
model=os.environ.get("BENCHMARK_MODEL_NAME", "gpt-oss-120b"),
281+
base_url=os.environ.get("BENCHMARK_BASE_URL")
282+
or os.environ.get("OPENAI_BASE_URL")
283+
or os.environ.get("CEREBRAS_BASE_URL")
284+
or None,
285+
timeout_s=float(os.environ.get("OPENCLAW_TIMEOUT_S", "120")),
286+
reasoning_effort=os.environ.get("BENCHMARK_REASONING_EFFORT")
287+
or os.environ.get("CEREBRAS_REASONING_EFFORT")
288+
or None,
289+
direct_openai_compatible=True,
271290
)
272291
else:
273292
from eliza_adapter.client import ElizaClient # noqa: WPS433

packages/benchmarks/standard/gsm8k.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,7 @@
1919

2020
import argparse
2121
import logging
22+
import os
2223
import re
2324
from collections.abc import Iterable, Sequence
2425
from decimal import Decimal, InvalidOperation
@@ -103,6 +104,12 @@ def _gold_from_answer(answer: str) -> int | None:
103104

104105

105106
def _load_dataset_examples(limit: int | None) -> list[dict[str, object]]:
107+
if (
108+
os.environ.get("BENCHMARK_STANDARD_FULL_DATA", "").strip() != "1"
109+
and limit is not None
110+
and limit <= len(SMOKE_FIXTURES)
111+
):
112+
return list(SMOKE_FIXTURES)[:limit]
106113
try:
107114
from datasets import load_dataset
108115
except ImportError:

packages/benchmarks/standard/humaneval.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,6 +32,7 @@
3232
import io
3333
import logging
3434
import multiprocessing as mp
35+
import os
3536
import re
3637
import signal
3738
import textwrap
@@ -254,6 +255,12 @@ def _execute_program(program: str, timeout_s: float) -> tuple[bool, str]:
254255

255256

256257
def _load_dataset_examples(limit: int | None) -> list[dict[str, object]]:
258+
if (
259+
os.environ.get("BENCHMARK_STANDARD_FULL_DATA", "").strip() != "1"
260+
and limit is not None
261+
and limit <= len(SMOKE_FIXTURES)
262+
):
263+
return list(SMOKE_FIXTURES)[:limit]
257264
try:
258265
from datasets import load_dataset
259266
except ImportError:

packages/benchmarks/standard/mmlu.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,7 @@
1919

2020
import argparse
2121
import logging
22+
import os
2223
import re
2324
from collections.abc import Sequence
2425
from pathlib import Path
@@ -101,6 +102,12 @@ def _load_dataset_examples(limit: int | None) -> list[dict[str, object]]:
101102
The fallback is deliberate — the smoke test must run with no
102103
internet and no datasets install.
103104
"""
105+
if (
106+
os.environ.get("BENCHMARK_STANDARD_FULL_DATA", "").strip() != "1"
107+
and limit is not None
108+
and limit <= len(SMOKE_FIXTURES)
109+
):
110+
return list(SMOKE_FIXTURES)[:limit]
104111

105112
try:
106113
from datasets import load_dataset

packages/benchmarks/standard/mt_bench.py

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,7 @@
2828

2929
import argparse
3030
import logging
31+
import os
3132
import re
3233
from collections.abc import Iterable, Sequence
3334
from pathlib import Path
@@ -144,6 +145,12 @@ def _load_dataset_questions(limit: int | None) -> list[dict[str, object]]:
144145
The community mirror at ``lmsys/mt_bench_human_judgments`` exposes
145146
each question with ``turns`` (list of turn-1 + turn-2 strings).
146147
"""
148+
if (
149+
os.environ.get("BENCHMARK_STANDARD_FULL_DATA", "").strip() != "1"
150+
and limit is not None
151+
and limit <= len(SMOKE_QUESTIONS)
152+
):
153+
return list(SMOKE_QUESTIONS)[:limit]
147154

148155
try:
149156
from datasets import load_dataset

plugins/plugin-app-manager/src/api/apps-routes.ts

Lines changed: 28 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,6 @@ import {
4242
parseAppIsolation,
4343
parseAppPermissions,
4444
} from "@elizaos/shared";
45-
import { isLegacyAppsWorkspaceDiscoveryEnabled } from "@elizaos/agent/config/feature-flags";
4645
import {
4746
importAppRouteModule,
4847
resolveWorkspacePackageDir,
@@ -69,6 +68,33 @@ const HERO_IMAGE_CONTENT_TYPES: Record<string, string> = {
6968
".svg": "image/svg+xml",
7069
};
7170

71+
/**
 * Read a boolean feature flag from the process environment.
 *
 * The value of `process.env[name]` is trimmed and lower-cased, then matched
 * against a fixed vocabulary: "1", "true", "yes", "on" yield `true`;
 * "0", "false", "no", "off" yield `false`.
 *
 * @param name - Name of the environment variable to read.
 * @param fallback - Value returned when the variable is unset, empty, or
 *   holds text outside the recognized vocabulary. Defaults to `false`.
 * @returns The parsed flag, or `fallback` when no recognized value is present.
 */
function readBoolFlag(name: string, fallback = false): boolean {
72+
const raw = process.env[name];
73+
// Unset or empty variables never override the caller's fallback.
if (raw === undefined || raw === null || raw === "") return fallback;
74+
// Normalize so that matching ignores surrounding whitespace and letter case.
const trimmed = String(raw).trim().toLowerCase();
75+
if (
76+
trimmed === "1" ||
77+
trimmed === "true" ||
78+
trimmed === "yes" ||
79+
trimmed === "on"
80+
) {
81+
return true;
82+
}
83+
if (
84+
trimmed === "0" ||
85+
trimmed === "false" ||
86+
trimmed === "no" ||
87+
trimmed === "off"
88+
) {
89+
return false;
90+
}
91+
// Unrecognized text (including whitespace-only values) falls back as well.
return fallback;
92+
}
93+
94+
/**
 * Report whether the `ELIZA_ENABLE_LEGACY_APPS_WORKSPACE_DISCOVERY`
 * environment flag is switched on.
 *
 * The flag is parsed by `readBoolFlag` with no explicit fallback, so an
 * unset, empty, or unrecognized value reads as `false`.
 *
 * @returns `true` only when the environment variable holds a truthy flag value.
 */
function isLegacyAppsWorkspaceDiscoveryEnabled(): boolean {
95+
return readBoolFlag("ELIZA_ENABLE_LEGACY_APPS_WORKSPACE_DISCOVERY");
96+
}
97+
7298
const DEFAULT_HERO_IMAGE_CANDIDATES = [
7399
"assets/hero.png",
74100
"assets/hero.webp",
@@ -1104,7 +1130,7 @@ export async function handleAppsRoutes(
11041130
// ~/.eliza/plugins/installed without depending on a plugin-manager
11051131
// service. The runtime plugin resolver already searches that dir.
11061132
const { installPlugin: installPluginDirect } = await import(
1107-
/* webpackIgnore: true */ "@elizaos/agent/services/plugin-installer"
1133+
"@elizaos/plugin-registry"
11081134
);
11091135
result = await installPluginDirect(name, recordProgress, version);
11101136
}
Submodule llama.cpp updated 88 files

plugins/plugin-local-inference/src/services/voice/kokoro/voice-presets.ts

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -124,3 +124,6 @@ export function findKokoroVoice(id: string): KokoroVoicePack | undefined {
124124

125125
/** The voice the runtime selects when nothing is configured. */
126126
export const KOKORO_DEFAULT_VOICE_ID = "af_bella";
127+
128+
/**
 * Conservative fallback voice when a configured/default preset is not staged.
 *
 * NOTE(review): this is currently the same id as `KOKORO_DEFAULT_VOICE_ID`
 * ("af_bella"), so falling back does not select a different voice when the
 * default itself is the preset that is missing — confirm this is intended.
 */
129+
export const KOKORO_FALLBACK_VOICE_ID = "af_bella";

0 commit comments

Comments
 (0)