@@ -704,13 +704,15 @@ void process_shaders() {
704704 shader = (tname == " f32" || tname == " f16" || tname == " bf16" ) ? " get_rows.comp" : " get_rows_quant.comp" ;
705705
706706 if (tname == " f16" ) {
707- string_to_spv (" get_rows_" + tname, shader, merge_maps (base_dict, {{data_a_key, " 1" }, {" B_TYPE" , " int" }, {" D_TYPE" , " float16_t" }, {" OPTIMIZATION_ERROR_WORKAROUND" , " 1" }}));
707+ string_to_spv (" get_rows_" + tname, shader, merge_maps (base_dict, {{" TEMP_TYPE " , " FLOAT_TYPE " }, { data_a_key, " 1" }, {" B_TYPE" , " int" }, {" D_TYPE" , " float16_t" }, {" OPTIMIZATION_ERROR_WORKAROUND" , " 1" }}));
708708 } else {
709- string_to_spv (" get_rows_" + tname, shader, merge_maps (base_dict, {{data_a_key, " 1" }, {" B_TYPE" , " int" }, {" D_TYPE" , " float16_t" }}));
709+ string_to_spv (" get_rows_" + tname, shader, merge_maps (base_dict, {{" TEMP_TYPE " , " FLOAT_TYPE " }, { data_a_key, " 1" }, {" B_TYPE" , " int" }, {" D_TYPE" , " float16_t" }}));
710710 }
711- string_to_spv (" get_rows_" + tname + " _f32" , shader, merge_maps (base_dict, {{data_a_key, " 1" }, {" B_TYPE" , " int" }, {" D_TYPE" , " float" }}));
711+ string_to_spv (" get_rows_" + tname + " _f32" , shader, merge_maps (base_dict, {{" TEMP_TYPE " , " FLOAT_TYPE " }, { data_a_key, " 1" }, {" B_TYPE" , " int" }, {" D_TYPE" , " float" }}));
712712 }
713713
714+ string_to_spv (" get_rows_i32" , " get_rows.comp" , {{" TEMP_TYPE" , " uint" }, {" A_TYPE" , " uint" }, {" B_TYPE" , " int" }, {" D_TYPE" , " uint" }});
715+
714716 string_to_spv (" mul_mat_vec_p021_f16_f32_subgroup_add" , " mul_mat_vec_p021.comp" , {{" A_TYPE" , " float16_t" }, {" A_TYPE_VEC4" , " f16vec4" }, {" B_TYPE" , " float" }, {" B_TYPE_VEC4" , " vec4" }, {" D_TYPE" , " float" }, {" USE_SUBGROUP_ADD" , " 1" }});
715717 string_to_spv (" mul_mat_vec_p021_f16_f32" , " mul_mat_vec_p021.comp" , {{" A_TYPE" , " float16_t" }, {" A_TYPE_VEC4" , " f16vec4" }, {" B_TYPE" , " float" }, {" B_TYPE_VEC4" , " vec4" }, {" D_TYPE" , " float" }});
716718 string_to_spv (" mul_mat_vec_nc_f16_f32" , " mul_mat_vec_nc.comp" , {{" A_TYPE" , " float16_t" }, {" A_TYPE_VEC4" , " f16vec4" }, {" B_TYPE" , " float" }, {" B_TYPE_VEC4" , " vec4" }, {" D_TYPE" , " float" }});
0 commit comments