@@ -559,6 +559,8 @@ static const std::map<llm_tensor, const char *> LLM_TENSOR_NAMES = {
559559 { LLM_TENSOR_INDEXER_PROJ, " blk.%d.indexer.proj" },
560560 { LLM_TENSOR_INDEXER_ATTN_K, " blk.%d.indexer.attn_k" },
561561 { LLM_TENSOR_INDEXER_ATTN_Q_B, " blk.%d.indexer.attn_q_b" },
562+ { LLM_TENSOR_MASKED_EMBD_CENTROIDS, " masked_embd_centroids" },
563+ { LLM_TENSOR_MASKED_EMBD_ORDERING, " masked_embd_ordering" },
562564};
563565
564566// declare information about the model weight tensors:
@@ -783,6 +785,8 @@ static const std::map<llm_tensor, llm_tensor_info> LLM_TENSOR_INFOS = {
783785 // latent projections feed ggml_mul_mat, so the buft probe must use MUL_MAT to keep them on GPU
784786 {LLM_TENSOR_FFN_LATENT_DOWN, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
785787 {LLM_TENSOR_FFN_LATENT_UP, {LLM_TENSOR_LAYER_REPEATING, GGML_OP_MUL_MAT}},
788+ {LLM_TENSOR_MASKED_EMBD_CENTROIDS, {LLM_TENSOR_LAYER_INPUT, GGML_OP_NONE}},
789+ {LLM_TENSOR_MASKED_EMBD_ORDERING, {LLM_TENSOR_LAYER_INPUT, GGML_OP_NONE}},
786790};
787791
// Constructs an LLM_KV by initializing the `arch` and `suffix` members from the
// constructor arguments of the same names; the body performs no other work.
// NOTE(review): whether `suffix` is copied or only the pointer is retained depends
// on the member's declared type, which is not visible here — confirm in the header.
788792LLM_KV::LLM_KV (llm_arch arch, const char * suffix) : arch(arch), suffix(suffix) {}
0 commit comments