@@ -687,6 +687,8 @@ class MODEL_TENSOR(IntEnum):
687687 V_TOK_EOI = auto () # cogvlm
688688 # audio (mtmd)
689689 A_ENC_EMBD_POS = auto ()
690+ A_ENC_EMBD_NORM = auto ()
691+ A_ENC_EMBD_TO_LOGITS = auto ()
690692 A_ENC_CONV1D = auto ()
691693 A_PRE_NORM = auto ()
692694 A_POST_NORM = auto ()
@@ -697,8 +699,13 @@ class MODEL_TENSOR(IntEnum):
697699 A_ENC_OUTPUT = auto ()
698700 A_ENC_OUTPUT_NORM = auto ()
699701 A_ENC_FFN_UP = auto ()
702+ A_ENC_FFN_NORM = auto ()
700703 A_ENC_FFN_GATE = auto ()
701704 A_ENC_FFN_DOWN = auto ()
705+ A_ENC_FFN_UP_1 = auto ()
706+ A_ENC_FFN_NORM_1 = auto ()
707+ A_ENC_FFN_GATE_1 = auto ()
708+ A_ENC_FFN_DOWN_1 = auto ()
702709 A_MMPROJ = auto ()
703710 A_MMPROJ_FC = auto ()
704711 A_MM_NORM_PRE = auto ()
@@ -710,6 +717,12 @@ class MODEL_TENSOR(IntEnum):
710717 NEXTN_HNORM = auto ()
711718 NEXTN_SHARED_HEAD_HEAD = auto ()
712719 NEXTN_SHARED_HEAD_NORM = auto ()
720+ # lfm2 audio
721+ A_ENC_NORM_CONV = auto ()
722+ A_ENC_LINEAR_POS = auto ()
723+ A_ENC_POS_BIAS_U = auto ()
724+ A_ENC_POS_BIAS_V = auto ()
725+ A_ENC_OUT = auto ()
713726
714727
715728MODEL_ARCH_NAMES : dict [MODEL_ARCH , str ] = {
@@ -1059,6 +1072,8 @@ class MODEL_TENSOR(IntEnum):
10591072 MODEL_TENSOR .V_TOK_EOI : "v.eoi" ,
10601073 # audio (mtmd)
10611074 MODEL_TENSOR .A_ENC_EMBD_POS : "a.position_embd" ,
1075+ MODEL_TENSOR .A_ENC_EMBD_NORM : "a.position_embd_norm" ,
1076+ MODEL_TENSOR .A_ENC_EMBD_TO_LOGITS : "a.embd_to_logits" ,
10621077 MODEL_TENSOR .A_ENC_CONV1D : "a.conv1d.{bid}" ,
10631078 MODEL_TENSOR .A_PRE_NORM : "a.pre_ln" ,
10641079 MODEL_TENSOR .A_POST_NORM : "a.post_ln" ,
@@ -1068,9 +1083,14 @@ class MODEL_TENSOR(IntEnum):
10681083 MODEL_TENSOR .A_ENC_INPUT_NORM : "a.blk.{bid}.ln1" ,
10691084 MODEL_TENSOR .A_ENC_OUTPUT : "a.blk.{bid}.attn_out" ,
10701085 MODEL_TENSOR .A_ENC_OUTPUT_NORM : "a.blk.{bid}.ln2" ,
1086+ MODEL_TENSOR .A_ENC_FFN_NORM : "a.blk.{bid}.ffn_norm" ,
10711087 MODEL_TENSOR .A_ENC_FFN_UP : "a.blk.{bid}.ffn_up" ,
10721088 MODEL_TENSOR .A_ENC_FFN_GATE : "a.blk.{bid}.ffn_gate" ,
10731089 MODEL_TENSOR .A_ENC_FFN_DOWN : "a.blk.{bid}.ffn_down" ,
1090+ MODEL_TENSOR .A_ENC_FFN_NORM_1 : "a.blk.{bid}.ffn_norm_1" ,
1091+ MODEL_TENSOR .A_ENC_FFN_UP_1 : "a.blk.{bid}.ffn_up_1" ,
1092+ MODEL_TENSOR .A_ENC_FFN_GATE_1 : "a.blk.{bid}.ffn_gate_1" ,
1093+ MODEL_TENSOR .A_ENC_FFN_DOWN_1 : "a.blk.{bid}.ffn_down_1" ,
10741094 MODEL_TENSOR .A_MMPROJ : "mm.a.mlp.{bid}" ,
10751095 MODEL_TENSOR .A_MMPROJ_FC : "mm.a.fc" ,
10761096 MODEL_TENSOR .A_MM_NORM_PRE : "mm.a.norm_pre" ,
@@ -1082,6 +1102,12 @@ class MODEL_TENSOR(IntEnum):
10821102 MODEL_TENSOR .NEXTN_HNORM : "blk.{bid}.nextn.hnorm" ,
10831103 MODEL_TENSOR .NEXTN_SHARED_HEAD_HEAD : "blk.{bid}.nextn.shared_head_head" ,
10841104 MODEL_TENSOR .NEXTN_SHARED_HEAD_NORM : "blk.{bid}.nextn.shared_head_norm" ,
1105+ # lfm2 audio
1106+ MODEL_TENSOR .A_ENC_NORM_CONV : "a.blk.{bid}.norm_conv" ,
1107+ MODEL_TENSOR .A_ENC_LINEAR_POS : "a.blk.{bid}.linear_pos" ,
1108+ MODEL_TENSOR .A_ENC_POS_BIAS_U : "a.blk.{bid}.pos_bias_u" ,
1109+ MODEL_TENSOR .A_ENC_POS_BIAS_V : "a.blk.{bid}.pos_bias_v" ,
1110+ MODEL_TENSOR .A_ENC_OUT : "a.pre_encode.out" ,
10851111}
10861112
10871113MODEL_TENSORS : dict [MODEL_ARCH , list [MODEL_TENSOR ]] = {
@@ -1137,6 +1163,8 @@ class MODEL_TENSOR(IntEnum):
11371163 MODEL_TENSOR .V_TOK_EOI ,
11381164 # audio
11391165 MODEL_TENSOR .A_ENC_EMBD_POS ,
1166+ MODEL_TENSOR .A_ENC_EMBD_NORM ,
1167+ MODEL_TENSOR .A_ENC_EMBD_TO_LOGITS ,
11401168 MODEL_TENSOR .A_ENC_CONV1D ,
11411169 MODEL_TENSOR .A_PRE_NORM ,
11421170 MODEL_TENSOR .A_POST_NORM ,
@@ -1146,13 +1174,27 @@ class MODEL_TENSOR(IntEnum):
11461174 MODEL_TENSOR .A_ENC_INPUT_NORM ,
11471175 MODEL_TENSOR .A_ENC_OUTPUT ,
11481176 MODEL_TENSOR .A_ENC_OUTPUT_NORM ,
1177+ MODEL_TENSOR .A_ENC_FFN_NORM ,
11491178 MODEL_TENSOR .A_ENC_FFN_UP ,
11501179 MODEL_TENSOR .A_ENC_FFN_GATE ,
11511180 MODEL_TENSOR .A_ENC_FFN_DOWN ,
1181+ MODEL_TENSOR .A_ENC_FFN_NORM_1 ,
1182+ MODEL_TENSOR .A_ENC_FFN_UP_1 ,
1183+ MODEL_TENSOR .A_ENC_FFN_GATE_1 ,
1184+ MODEL_TENSOR .A_ENC_FFN_DOWN_1 ,
11521185 MODEL_TENSOR .A_MMPROJ ,
11531186 MODEL_TENSOR .A_MMPROJ_FC ,
11541187 MODEL_TENSOR .A_MM_NORM_PRE ,
11551188 MODEL_TENSOR .A_MM_NORM_MID ,
1189+ MODEL_TENSOR .CONVNEXT_DW ,
1190+ MODEL_TENSOR .CONVNEXT_NORM ,
1191+ MODEL_TENSOR .CONVNEXT_PW1 ,
1192+ MODEL_TENSOR .CONVNEXT_PW2 ,
1193+ MODEL_TENSOR .A_ENC_NORM_CONV ,
1194+ MODEL_TENSOR .A_ENC_LINEAR_POS ,
1195+ MODEL_TENSOR .A_ENC_POS_BIAS_U ,
1196+ MODEL_TENSOR .A_ENC_POS_BIAS_V ,
1197+ MODEL_TENSOR .A_ENC_OUT ,
11561198 ],
11571199 MODEL_ARCH .LLAMA : [
11581200 MODEL_TENSOR .TOKEN_EMBD ,
@@ -3328,6 +3370,7 @@ class VisionProjectorType:
33283370 LIGHTONOCR = "lightonocr"
33293371 COGVLM = "cogvlm"
33303372 JANUS_PRO = "janus_pro"
3373+ LFM2A = "lfm2a" # audio
33313374
33323375
33333376# Items here are (block size, type size)
0 commit comments