Skip to content

Commit 3d3c229

Browse files
committed
Fix local inference PR checks
1 parent: 99dba3f · commit: 3d3c229

3 files changed

Lines changed: 15 additions & 15 deletions

File tree

packages/app-core/scripts/build-llama-cpp-dflash.mjs

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1418,7 +1418,7 @@ function cmakeFlagsForTarget(target, ctx) {
14181418
// `ggml_backend_cpu_init` (per-backend symbol name), so the loader
14191419
// fails and inference can't run. -DGGML_BACKEND_DL=OFF embeds the
14201420
// backend's init directly into the binary.
1421-
flags.push("-DGGML_BACKEND_DL=OFF", "-DBUILD_SHARED_LIBS=OFF");
1421+
flags.push("-DGGML_BACKEND_DL=OFF");
14221422
} else if (platform === "ios") {
14231423
// iOS cross-compile (host must be macOS with Xcode). The Capacitor
14241424
// plugin's xcframework patch consumes the resulting static archive +

scripts/local-inference-ablation.config.json

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -17,8 +17,8 @@
1717
},
1818
{
1919
"name": "qjl_tcq_forced",
20-
"label": "target only, forced QJL/TCQ turbo3_tcq",
21-
"args": ["--cache-type-k", "tbq3_tcq", "--cache-type-v", "tbq3_tcq"]
20+
"label": "target only, QJL K + TBQ3 V",
21+
"args": ["--cache-type-k", "qjl1_256", "--cache-type-v", "tbq3_0"]
2222
},
2323
{
2424
"name": "dflash_only",
@@ -45,19 +45,19 @@
4545
},
4646
{
4747
"name": "all_dflash_qjl_tcq",
48-
"label": "DFlash + forced QJL/TCQ turbo3_tcq",
48+
"label": "DFlash + QJL K + TBQ3 V",
4949
"needsDrafter": true,
5050
"args": [
5151
"--spec-type",
5252
"dflash",
5353
"--cache-type-k",
54-
"tbq3_tcq",
54+
"qjl1_256",
5555
"--cache-type-v",
56-
"tbq3_tcq",
56+
"tbq3_0",
5757
"--cache-type-k-draft",
58-
"tbq3_tcq",
58+
"qjl1_256",
5959
"--cache-type-v-draft",
60-
"tbq3_tcq"
60+
"tbq3_0"
6161
]
6262
}
6363
]

scripts/local-inference-ablation.mjs

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -37,8 +37,8 @@ const DEFAULT_VARIANTS = [
3737
},
3838
{
3939
name: "qjl_tcq_forced",
40-
label: "target only, forced QJL/TCQ turbo3_tcq",
41-
args: ["--cache-type-k", "tbq3_tcq", "--cache-type-v", "tbq3_tcq"],
40+
label: "target only, QJL K + TBQ3 V",
41+
args: ["--cache-type-k", "qjl1_256", "--cache-type-v", "tbq3_0"],
4242
},
4343
{
4444
name: "dflash_only",
@@ -65,19 +65,19 @@ const DEFAULT_VARIANTS = [
6565
},
6666
{
6767
name: "all_dflash_qjl_tcq",
68-
label: "DFlash + forced QJL/TCQ turbo3_tcq",
68+
label: "DFlash + QJL K + TBQ3 V",
6969
needsDrafter: true,
7070
args: [
7171
"--spec-type",
7272
"dflash",
7373
"--cache-type-k",
74-
"tbq3_tcq",
74+
"qjl1_256",
7575
"--cache-type-v",
76-
"tbq3_tcq",
76+
"tbq3_0",
7777
"--cache-type-k-draft",
78-
"tbq3_tcq",
78+
"qjl1_256",
7979
"--cache-type-v-draft",
80-
"tbq3_tcq",
80+
"tbq3_0",
8181
],
8282
},
8383
];

0 commit comments

Comments
 (0)