@@ -1989,14 +1989,14 @@ static void ggml_vk_load_shaders(vk_device& device) {
1989
1989
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_Q4_K][i], " mul_mat_vec_q4_k_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_q4_k_f32_f32_len, mul_mat_vec_q4_k_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1990
1990
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_Q5_K][i], " mul_mat_vec_q5_k_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_q5_k_f32_f32_len, mul_mat_vec_q5_k_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1991
1991
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_Q6_K][i], " mul_mat_vec_q6_k_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_q6_k_f32_f32_len, mul_mat_vec_q6_k_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1992
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f32_f32_len, mul_mat_vec_iq1_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1993
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f32_f32_len, mul_mat_vec_iq1_m_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1994
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f32_f32_len, mul_mat_vec_iq2_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1995
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f32_f32_len, mul_mat_vec_iq2_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1996
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f32_f32_len, mul_mat_vec_iq2_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1997
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f32_f32_len, mul_mat_vec_iq3_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1998
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f32_f32_len, mul_mat_vec_iq3_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1999
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f32_f32_len, mul_mat_vec_iq4_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
1992
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f32_f32_len, mul_mat_vec_iq1_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1993
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f32_f32_len, mul_mat_vec_iq1_m_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1994
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f32_f32_len, mul_mat_vec_iq2_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1995
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f32_f32_len, mul_mat_vec_iq2_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1996
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f32_f32_len, mul_mat_vec_iq2_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1997
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f32_f32_len, mul_mat_vec_iq3_xxs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1998
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f32_f32_len, mul_mat_vec_iq3_s_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
1999
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f32_f32_len, mul_mat_vec_iq4_xs_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2000
2000
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f32_f32 [GGML_TYPE_IQ4_NL][i], " mul_mat_vec_iq4_nl_f32_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_nl_f32_f32_len, mul_mat_vec_iq4_nl_f32_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 *rm_stdq, 1 , 1 }, {subgroup_size_16, 2 *rm_stdq, i+1 }, 1 , true );
2001
2001
2002
2002
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_F32 ][i], " mul_mat_vec_f32_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_f32_f16_f32_len, mul_mat_vec_f32_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 , 1 , 1 }, {device->subgroup_size , 2 , i+1 }, 1 );
@@ -2011,14 +2011,14 @@ static void ggml_vk_load_shaders(vk_device& device) {
2011
2011
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_Q4_K][i], " mul_mat_vec_q4_k_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_q4_k_f16_f32_len, mul_mat_vec_q4_k_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2012
2012
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_Q5_K][i], " mul_mat_vec_q5_k_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_q5_k_f16_f32_len, mul_mat_vec_q5_k_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2013
2013
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_Q6_K][i], " mul_mat_vec_q6_k_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_q6_k_f16_f32_len, mul_mat_vec_q6_k_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2014
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f16_f32_len, mul_mat_vec_iq1_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2015
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f16_f32_len, mul_mat_vec_iq1_m_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2016
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f16_f32_len, mul_mat_vec_iq2_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2017
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f16_f32_len, mul_mat_vec_iq2_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2018
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f16_f32_len, mul_mat_vec_iq2_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2019
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f16_f32_len, mul_mat_vec_iq3_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2020
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f16_f32_len, mul_mat_vec_iq3_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2021
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f16_f32_len, mul_mat_vec_iq4_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2014
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_S][i], " mul_mat_vec_iq1_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_s_f16_f32_len, mul_mat_vec_iq1_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2015
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ1_M][i], " mul_mat_vec_iq1_m_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq1_m_f16_f32_len, mul_mat_vec_iq1_m_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2016
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XXS][i], " mul_mat_vec_iq2_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xxs_f16_f32_len, mul_mat_vec_iq2_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2017
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_XS][i], " mul_mat_vec_iq2_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_xs_f16_f32_len, mul_mat_vec_iq2_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2018
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ2_S][i], " mul_mat_vec_iq2_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq2_s_f16_f32_len, mul_mat_vec_iq2_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2019
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_XXS][i], " mul_mat_vec_iq3_xxs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_xxs_f16_f32_len, mul_mat_vec_iq3_xxs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2020
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ3_S][i], " mul_mat_vec_iq3_s_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq3_s_f16_f32_len, mul_mat_vec_iq3_s_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq, i+1 }, 1 , true );
2021
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ4_XS][i], " mul_mat_vec_iq4_xs_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_xs_f16_f32_len, mul_mat_vec_iq4_xs_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq, i+1 }, 1 , true );
2022
2022
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_f16_f32 [GGML_TYPE_IQ4_NL][i], " mul_mat_vec_iq4_nl_f16_f32_" +std::to_string (i+1 ), mul_mat_vec_iq4_nl_f16_f32_len, mul_mat_vec_iq4_nl_f16_f32_data, " main" , 3 , sizeof (vk_mat_vec_push_constants), {2 *rm_stdq, 1 , 1 }, {subgroup_size_16, 2 *rm_stdq, i+1 }, 1 , true );
2023
2023
}
2024
2024
@@ -2034,13 +2034,13 @@ static void ggml_vk_load_shaders(vk_device& device) {
2034
2034
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_Q4_K], " mul_mat_vec_id_q4_k_f32" , mul_mat_vec_id_q4_k_f32_len, mul_mat_vec_id_q4_k_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2035
2035
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_Q5_K], " mul_mat_vec_id_q5_k_f32" , mul_mat_vec_id_q5_k_f32_len, mul_mat_vec_id_q5_k_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2036
2036
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_Q6_K], " mul_mat_vec_id_q6_k_f32" , mul_mat_vec_id_q6_k_f32_len, mul_mat_vec_id_q6_k_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2037
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_S], " mul_mat_vec_id_iq1_s_f32" , mul_mat_vec_id_iq1_s_f32_len, mul_mat_vec_id_iq1_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2038
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_M], " mul_mat_vec_id_iq1_m_f32" , mul_mat_vec_id_iq1_m_f32_len, mul_mat_vec_id_iq1_m_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2039
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XXS], " mul_mat_vec_id_iq2_xxs_f32" , mul_mat_vec_id_iq2_xxs_f32_len, mul_mat_vec_id_iq2_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2040
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XS], " mul_mat_vec_id_iq2_xs_f32" , mul_mat_vec_id_iq2_xs_f32_len, mul_mat_vec_id_iq2_xs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2041
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_S], " mul_mat_vec_id_iq2_s_f32" , mul_mat_vec_id_iq2_s_f32_len, mul_mat_vec_id_iq2_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2042
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_XXS], " mul_mat_vec_id_iq3_xxs_f32" , mul_mat_vec_id_iq3_xxs_f32_len, mul_mat_vec_id_iq3_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2043
- ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_S], " mul_mat_vec_id_iq3_s_f32" , mul_mat_vec_id_iq3_s_f32_len, mul_mat_vec_id_iq3_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2037
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_S], " mul_mat_vec_id_iq1_s_f32" , mul_mat_vec_id_iq1_s_f32_len, mul_mat_vec_id_iq1_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2038
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ1_M], " mul_mat_vec_id_iq1_m_f32" , mul_mat_vec_id_iq1_m_f32_len, mul_mat_vec_id_iq1_m_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2039
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XXS], " mul_mat_vec_id_iq2_xxs_f32" , mul_mat_vec_id_iq2_xxs_f32_len, mul_mat_vec_id_iq2_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2040
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_XS], " mul_mat_vec_id_iq2_xs_f32" , mul_mat_vec_id_iq2_xs_f32_len, mul_mat_vec_id_iq2_xs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2041
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ2_S], " mul_mat_vec_id_iq2_s_f32" , mul_mat_vec_id_iq2_s_f32_len, mul_mat_vec_id_iq2_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2042
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_XXS], " mul_mat_vec_id_iq3_xxs_f32" , mul_mat_vec_id_iq3_xxs_f32_len, mul_mat_vec_id_iq3_xxs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2043
+ ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ3_S], " mul_mat_vec_id_iq3_s_f32" , mul_mat_vec_id_iq3_s_f32_len, mul_mat_vec_id_iq3_s_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 * rm_kq, 1 , 1 }, {subgroup_size_16, 2 * rm_kq}, 1 , true );
2044
2044
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ4_XS], " mul_mat_vec_id_iq4_xs_f32" , mul_mat_vec_id_iq4_xs_f32_len, mul_mat_vec_id_iq4_xs_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {rm_kq, 1 , 1 }, {subgroup_size_16, rm_kq}, 1 , true );
2045
2045
ggml_vk_create_pipeline (device, device->pipeline_dequant_mul_mat_vec_id_f32 [GGML_TYPE_IQ4_NL], " mul_mat_vec_id_iq4_nl_f32" , mul_mat_vec_id_iq4_nl_f32_len, mul_mat_vec_id_iq4_nl_f32_data, " main" , 4 , sizeof (vk_mat_vec_id_push_constants), {2 *rm_stdq, 1 , 1 }, {subgroup_size_16, 2 *rm_stdq}, 1 , true );
2046
2046
0 commit comments