@@ -1989,14 +1989,14 @@ static void ggml_vk_load_shaders(vk_device& device) {
19891989 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_Q4_K][i], " mul_mat_vec_q4_k_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_q4_k_f32_f32_len, mul_mat_vec_q4_k_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
19901990 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_Q5_K][i], " mul_mat_vec_q5_k_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_q5_k_f32_f32_len, mul_mat_vec_q5_k_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
19911991 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_Q6_K][i], " mul_mat_vec_q6_k_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_q6_k_f32_f32_len, mul_mat_vec_q6_k_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1992- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f32_f32_len, mul_mat_vec_iq1_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1993- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f32_f32_len, mul_mat_vec_iq1_m_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1994- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f32_f32_len, mul_mat_vec_iq2_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1995- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f32_f32_len, mul_mat_vec_iq2_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1996- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f32_f32_len, mul_mat_vec_iq2_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1997- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f32_f32_len, mul_mat_vec_iq3_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1998- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f32_f32_len, mul_mat_vec_iq3_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1999- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f32_f32_len, mul_mat_vec_iq4_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1992+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f32_f32_len, mul_mat_vec_iq1_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1993+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f32_f32_len, mul_mat_vec_iq1_m_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1994+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f32_f32_len, mul_mat_vec_iq2_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1995+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f32_f32_len, mul_mat_vec_iq2_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1996+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f32_f32_len, mul_mat_vec_iq2_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1997+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f32_f32_len, mul_mat_vec_iq3_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1998+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f32_f32_len, mul_mat_vec_iq3_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1999+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f32_f32_len, mul_mat_vec_iq4_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
20002000 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ4_NL][i], " mul_mat_vec_iq4_nl_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_nl_f32_f32_len, mul_mat_vec_iq4_nl_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 *rm_stdq, 1 , 1 }, {subgroup_size_16, 2 *rm_stdq, i+1 }, 1 , true );
20012001
20022002 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_F32 ][i], " mul_mat_vec_f32_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_f32_f16_f32_len, mul_mat_vec_f32_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 , 1 , 1 }, {device->subgroup_size , 2 , i+1 }, 1 );
@@ -2011,14 +2011,14 @@ static void ggml_vk_load_shaders(vk_device& device) {
20112011 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_Q4_K][i], " mul_mat_vec_q4_k_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_q4_k_f16_f32_len, mul_mat_vec_q4_k_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
20122012 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_Q5_K][i], " mul_mat_vec_q5_k_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_q5_k_f16_f32_len, mul_mat_vec_q5_k_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
20132013 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_Q6_K][i], " mul_mat_vec_q6_k_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_q6_k_f16_f32_len, mul_mat_vec_q6_k_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2014- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f16_f32_len, mul_mat_vec_iq1_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2015- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f16_f32_len, mul_mat_vec_iq1_m_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2016- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f16_f32_len, mul_mat_vec_iq2_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2017- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f16_f32_len, mul_mat_vec_iq2_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2018- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f16_f32_len, mul_mat_vec_iq2_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2019- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f16_f32_len, mul_mat_vec_iq3_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2020- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f16_f32_len, mul_mat_vec_iq3_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2021- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f16_f32_len, mul_mat_vec_iq4_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2014+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f16_f32_len, mul_mat_vec_iq1_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2015+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f16_f32_len, mul_mat_vec_iq1_m_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2016+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f16_f32_len, mul_mat_vec_iq2_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2017+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f16_f32_len, mul_mat_vec_iq2_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2018+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f16_f32_len, mul_mat_vec_iq2_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2019+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f16_f32_len, mul_mat_vec_iq3_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2020+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f16_f32_len, mul_mat_vec_iq3_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2021+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f16_f32_len, mul_mat_vec_iq4_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
20222022 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ4_NL][i], " mul_mat_vec_iq4_nl_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_nl_f16_f32_len, mul_mat_vec_iq4_nl_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 *rm_stdq, 1 , 1 }, {subgroup_size_16, 2 *rm_stdq, i+1 }, 1 , true );
20232023 }
20242024
@@ -2034,13 +2034,13 @@ static void ggml_vk_load_shaders(vk_device& device) {
20342034 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_Q4_K], " mul_mat_vec_id_q4_k_f32" , mul_mat_vec_id_q4_k_f32_len, mul_mat_vec_id_q4_k_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
20352035 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_Q5_K], " mul_mat_vec_id_q5_k_f32" , mul_mat_vec_id_q5_k_f32_len, mul_mat_vec_id_q5_k_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
20362036 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_Q6_K], " mul_mat_vec_id_q6_k_f32" , mul_mat_vec_id_q6_k_f32_len, mul_mat_vec_id_q6_k_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2037- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_S], " mul_mat_vec_id_iq1_s_f32" , mul_mat_vec_id_iq1_s_f32_len, mul_mat_vec_id_iq1_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2038- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_M], " mul_mat_vec_id_iq1_m_f32" , mul_mat_vec_id_iq1_m_f32_len, mul_mat_vec_id_iq1_m_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2039- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XXS], " mul_mat_vec_id_iq2_xxs_f32" , mul_mat_vec_id_iq2_xxs_f32_len, mul_mat_vec_id_iq2_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2040- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XS], " mul_mat_vec_id_iq2_xs_f32" , mul_mat_vec_id_iq2_xs_f32_len, mul_mat_vec_id_iq2_xs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2041- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_S], " mul_mat_vec_id_iq2_s_f32" , mul_mat_vec_id_iq2_s_f32_len, mul_mat_vec_id_iq2_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2042- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_XXS], " mul_mat_vec_id_iq3_xxs_f32" , mul_mat_vec_id_iq3_xxs_f32_len, mul_mat_vec_id_iq3_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2043- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_S], " mul_mat_vec_id_iq3_s_f32" , mul_mat_vec_id_iq3_s_f32_len, mul_mat_vec_id_iq3_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2037+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_S], " mul_mat_vec_id_iq1_s_f32" , mul_mat_vec_id_iq1_s_f32_len, mul_mat_vec_id_iq1_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2038+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_M], " mul_mat_vec_id_iq1_m_f32" , mul_mat_vec_id_iq1_m_f32_len, mul_mat_vec_id_iq1_m_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2039+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XXS], " mul_mat_vec_id_iq2_xxs_f32" , mul_mat_vec_id_iq2_xxs_f32_len, mul_mat_vec_id_iq2_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2040+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XS], " mul_mat_vec_id_iq2_xs_f32" , mul_mat_vec_id_iq2_xs_f32_len, mul_mat_vec_id_iq2_xs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2041+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_S], " mul_mat_vec_id_iq2_s_f32" , mul_mat_vec_id_iq2_s_f32_len, mul_mat_vec_id_iq2_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2042+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_XXS], " mul_mat_vec_id_iq3_xxs_f32" , mul_mat_vec_id_iq3_xxs_f32_len, mul_mat_vec_id_iq3_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2043+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_S], " mul_mat_vec_id_iq3_s_f32" , mul_mat_vec_id_iq3_s_f32_len, mul_mat_vec_id_iq3_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
20442044 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ4_XS], " mul_mat_vec_id_iq4_xs_f32" , mul_mat_vec_id_iq4_xs_f32_len, mul_mat_vec_id_iq4_xs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
20452045 ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ4_NL], " mul_mat_vec_id_iq4_nl_f32" , mul_mat_vec_id_iq4_nl_f32_len, mul_mat_vec_id_iq4_nl_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 *rm_stdq, 1 , 1 }, {subgroup_size_16, 2 *rm_stdq}, 1 , true );
20462046
0 commit comments