@@ -2359,12 +2359,12 @@ struct clip_model_loader {
23592359 hparams.n_layer = n_layer_orig;
23602360 model.layers .resize (hparams.n_layer );
23612361
2362- model.gs_inp_linear_w = get_tensor (string_format (TN_GS_INP_LINEAR, " weight" ));
2363- model.gs_inp_linear_b = get_tensor (string_format (TN_GS_INP_LINEAR, " bias" ));
2364- model.gs_ctc_out_w = get_tensor (string_format (TN_GS_CTC_OUT , " weight" ));
2365- model.gs_ctc_out_b = get_tensor (string_format (TN_GS_CTC_OUT , " bias" ));
2366- model.gs_ctc_out_mid_w = get_tensor (string_format (TN_GS_CTC_OUT_MID , " weight" ));
2367- model.gs_ctc_out_mid_b = get_tensor (string_format (TN_GS_CTC_OUT_MID , " bias" ));
2362+ model.inp_proj_w = get_tensor (string_format (TN_INP_PROJ, " weight" ));
2363+ model.inp_proj_b = get_tensor (string_format (TN_INP_PROJ, " bias" ));
2364+ model.ctc_out_w = get_tensor (string_format (TN_CTC_OUT , " weight" ));
2365+ model.ctc_out_b = get_tensor (string_format (TN_CTC_OUT , " bias" ));
2366+ model.ctc_out_mid_w = get_tensor (string_format (TN_CTC_OUT_MID , " weight" ));
2367+ model.ctc_out_mid_b = get_tensor (string_format (TN_CTC_OUT_MID , " bias" ));
23682368
23692369 for (int il = 0 ; il < hparams.n_layer ; ++il) {
23702370 auto & layer = model.layers [il];
@@ -2374,7 +2374,7 @@ struct clip_model_loader {
23742374 layer.v_w = get_tensor (string_format (TN_ATTN_V, prefix, il, " weight" ));
23752375 layer.o_w = get_tensor (string_format (TN_ATTN_OUTPUT, prefix, il, " weight" ));
23762376 layer.o_b = get_tensor (string_format (TN_ATTN_OUTPUT, prefix, il, " bias" ));
2377- layer.attn_rel_pos_emb = get_tensor (string_format (TN_GS_ATTN_REL_POS , prefix, il));
2377+ layer.attn_rel_pos_emb = get_tensor (string_format (TN_ATTN_REL_POS_EMB , prefix, il));
23782378
23792379 layer.ln_1_w = get_tensor (string_format (TN_LN_1, prefix, il, " weight" ));
23802380 layer.ln_1_b = get_tensor (string_format (TN_LN_1, prefix, il, " bias" ));
@@ -2407,45 +2407,45 @@ struct clip_model_loader {
24072407 layer.conv_pw2_b = get_tensor (string_format (TN_CONV_PW2, prefix, il, " bias" ));
24082408 }
24092409
2410- model.gs_proj_query = get_tensor (TN_GS_PROJ_QUERY );
2411- model.gs_proj_norm_w = get_tensor (string_format (TN_GS_PROJ_NORM , " weight" ));
2412- model.gs_proj_norm_b = get_tensor (string_format (TN_GS_PROJ_NORM , " bias" ));
2413- model.gs_proj_linear_w = get_tensor (string_format (TN_GS_PROJ_LINEAR , " weight" ));
2414- model.gs_proj_linear_b = get_tensor (string_format (TN_GS_PROJ_LINEAR , " bias" ));
2410+ model.qf_proj_query = get_tensor (TN_QF_PROJ_QUERY );
2411+ model.qf_proj_norm_w = get_tensor (string_format (TN_QF_PROJ_NORM , " weight" ));
2412+ model.qf_proj_norm_b = get_tensor (string_format (TN_QF_PROJ_NORM , " bias" ));
2413+ model.qf_proj_linear_w = get_tensor (string_format (TN_QF_PROJ_LINEAR , " weight" ));
2414+ model.qf_proj_linear_b = get_tensor (string_format (TN_QF_PROJ_LINEAR , " bias" ));
24152415
24162416 const int n_proj_layers = 2 ;
2417- model.gs_proj_layers .resize (n_proj_layers);
2417+ model.qf_proj_layers .resize (n_proj_layers);
24182418 for (int il = 0 ; il < n_proj_layers; ++il) {
2419- auto & pl = model.gs_proj_layers [il];
2420-
2421- pl.self_attn_q_w = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_Q , il, " weight" ));
2422- pl.self_attn_q_b = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_Q , il, " bias" ));
2423- pl.self_attn_k_w = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_K , il, " weight" ));
2424- pl.self_attn_k_b = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_K , il, " bias" ));
2425- pl.self_attn_v_w = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_V , il, " weight" ));
2426- pl.self_attn_v_b = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_V , il, " bias" ));
2427- pl.self_attn_o_w = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_O , il, " weight" ));
2428- pl.self_attn_o_b = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_O , il, " bias" ));
2429- pl.self_attn_norm_w = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_N , il, " weight" ));
2430- pl.self_attn_norm_b = get_tensor (string_format (TN_GS_PROJ_SELF_ATTN_N , il, " bias" ));
2431-
2432- pl.cross_attn_q_w = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_Q , il, " weight" ));
2433- pl.cross_attn_q_b = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_Q , il, " bias" ));
2434- pl.cross_attn_k_w = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_K , il, " weight" ));
2435- pl.cross_attn_k_b = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_K , il, " bias" ));
2436- pl.cross_attn_v_w = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_V , il, " weight" ));
2437- pl.cross_attn_v_b = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_V , il, " bias" ));
2438- pl.cross_attn_o_w = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_O , il, " weight" ));
2439- pl.cross_attn_o_b = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_O , il, " bias" ));
2440- pl.cross_attn_norm_w = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_N , il, " weight" ));
2441- pl.cross_attn_norm_b = get_tensor (string_format (TN_GS_PROJ_CROSS_ATTN_N , il, " bias" ));
2442-
2443- pl.ffn_up_w = get_tensor (string_format (TN_GS_PROJ_FFN_UP , il, " weight" ));
2444- pl.ffn_up_b = get_tensor (string_format (TN_GS_PROJ_FFN_UP , il, " bias" ));
2445- pl.ffn_down_w = get_tensor (string_format (TN_GS_PROJ_FFN_DOWN , il, " weight" ));
2446- pl.ffn_down_b = get_tensor (string_format (TN_GS_PROJ_FFN_DOWN , il, " bias" ));
2447- pl.ffn_norm_w = get_tensor (string_format (TN_GS_PROJ_FFN_NORM , il, " weight" ));
2448- pl.ffn_norm_b = get_tensor (string_format (TN_GS_PROJ_FFN_NORM , il, " bias" ));
2419+ auto & pl = model.qf_proj_layers [il];
2420+
2421+ pl.self_attn_q_w = get_tensor (string_format (TN_QF_SELF_ATTN_Q , il, " weight" ));
2422+ pl.self_attn_q_b = get_tensor (string_format (TN_QF_SELF_ATTN_Q , il, " bias" ));
2423+ pl.self_attn_k_w = get_tensor (string_format (TN_QF_SELF_ATTN_K , il, " weight" ));
2424+ pl.self_attn_k_b = get_tensor (string_format (TN_QF_SELF_ATTN_K , il, " bias" ));
2425+ pl.self_attn_v_w = get_tensor (string_format (TN_QF_SELF_ATTN_V , il, " weight" ));
2426+ pl.self_attn_v_b = get_tensor (string_format (TN_QF_SELF_ATTN_V , il, " bias" ));
2427+ pl.self_attn_o_w = get_tensor (string_format (TN_QF_SELF_ATTN_O , il, " weight" ));
2428+ pl.self_attn_o_b = get_tensor (string_format (TN_QF_SELF_ATTN_O , il, " bias" ));
2429+ pl.self_attn_norm_w = get_tensor (string_format (TN_QF_SELF_ATTN_N , il, " weight" ));
2430+ pl.self_attn_norm_b = get_tensor (string_format (TN_QF_SELF_ATTN_N , il, " bias" ));
2431+
2432+ pl.cross_attn_q_w = get_tensor (string_format (TN_QF_CROSS_ATTN_Q , il, " weight" ));
2433+ pl.cross_attn_q_b = get_tensor (string_format (TN_QF_CROSS_ATTN_Q , il, " bias" ));
2434+ pl.cross_attn_k_w = get_tensor (string_format (TN_QF_CROSS_ATTN_K , il, " weight" ));
2435+ pl.cross_attn_k_b = get_tensor (string_format (TN_QF_CROSS_ATTN_K , il, " bias" ));
2436+ pl.cross_attn_v_w = get_tensor (string_format (TN_QF_CROSS_ATTN_V , il, " weight" ));
2437+ pl.cross_attn_v_b = get_tensor (string_format (TN_QF_CROSS_ATTN_V , il, " bias" ));
2438+ pl.cross_attn_o_w = get_tensor (string_format (TN_QF_CROSS_ATTN_O , il, " weight" ));
2439+ pl.cross_attn_o_b = get_tensor (string_format (TN_QF_CROSS_ATTN_O , il, " bias" ));
2440+ pl.cross_attn_norm_w = get_tensor (string_format (TN_QF_CROSS_ATTN_N , il, " weight" ));
2441+ pl.cross_attn_norm_b = get_tensor (string_format (TN_QF_CROSS_ATTN_N , il, " bias" ));
2442+
2443+ pl.ffn_up_w = get_tensor (string_format (TN_QF_FFN_UP , il, " weight" ));
2444+ pl.ffn_up_b = get_tensor (string_format (TN_QF_FFN_UP , il, " bias" ));
2445+ pl.ffn_down_w = get_tensor (string_format (TN_QF_FFN_DOWN , il, " weight" ));
2446+ pl.ffn_down_b = get_tensor (string_format (TN_QF_FFN_DOWN , il, " bias" ));
2447+ pl.ffn_norm_w = get_tensor (string_format (TN_QF_FFN_NORM , il, " weight" ));
2448+ pl.ffn_norm_b = get_tensor (string_format (TN_QF_FFN_NORM , il, " bias" ));
24492449 }
24502450 } break ;
24512451 default :
@@ -3846,7 +3846,7 @@ int clip_n_mmproj_embd(const struct clip_ctx * ctx) {
38463846 case PROJECTOR_TYPE_GEMMA4A:
38473847 return ctx->model .hparams .projection_dim ;
38483848 case PROJECTOR_TYPE_GRANITE_SPEECH:
3849- return ctx->model .gs_proj_linear_w ->ne [1 ];
3849+ return ctx->model .qf_proj_linear_w ->ne [1 ];
38503850 case PROJECTOR_TYPE_GLM4V:
38513851 return ctx->model .mm_ffn_down_w ->ne [1 ];
38523852 default :
0 commit comments