@@ -1090,7 +1090,6 @@ static inline void conv3x3s1_winograd23_transform_output_tile_bf16s(const Mat& t
10901090 tmp10 = activation_ss (tmp10, activation_type, activation_params);
10911091 tmp11 = activation_ss (tmp11, activation_type, activation_params);
10921092
1093-
10941093 // if (out_elempack == 1)
10951094 {
10961095 unsigned short * outptr1 = outptr0 + N;
@@ -1153,7 +1152,6 @@ static inline void conv3x3s1_winograd23_transform_output_tile_bf16s(const Mat& t
11531152 tmp0 = activation_ss (tmp0, activation_type, activation_params);
11541153 tmp1 = activation_ss (tmp1, activation_type, activation_params);
11551154
1156-
11571155 // if (out_elempack == 1)
11581156 {
11591157 outptr0[0 ] = float32_to_bfloat16 (tmp0);
@@ -2866,7 +2864,6 @@ static inline void conv3x3s1_winograd43_transform_output_tile_bf16s(const Mat& t
28662864 tmp30 = activation_ss (tmp30, activation_type, activation_params);
28672865 tmp31 = activation_ss (tmp31, activation_type, activation_params);
28682866
2869-
28702867 // if (out_elempack == 1)
28712868 {
28722869 unsigned short * outptr1 = outptr0 + N;
@@ -2961,7 +2958,6 @@ static inline void conv3x3s1_winograd43_transform_output_tile_bf16s(const Mat& t
29612958 tmp2 = activation_ss (tmp2, activation_type, activation_params);
29622959 tmp3 = activation_ss (tmp3, activation_type, activation_params);
29632960
2964-
29652961 // if (out_elempack == 1)
29662962 {
29672963 outptr0[0 ] = float32_to_bfloat16 (tmp0);
@@ -4132,7 +4128,6 @@ static inline void conv3x3s1_winograd63_transform_input_tile_bf16s(const Mat& bo
41324128 }
41334129}
41344130
4135-
41364131#if NCNN_RUNTIME_CPU && NCNN_AVX512BF16 && __AVX512F__ && !__AVX512BF16__
41374132void conv3x3s1_winograd63_transform_output_tile_bf16s_avx512bf16 (const Mat& top_tile, Mat& top_blob, const Mat& bias, int i, int max_ii, int j, int max_jj, int activation_type, const Mat& activation_params);
41384133#endif
@@ -5102,7 +5097,6 @@ static inline void conv3x3s1_winograd63_transform_output_tile_bf16s(const Mat& t
51025097 tmp50 = activation_ss (tmp50, activation_type, activation_params);
51035098 tmp51 = activation_ss (tmp51, activation_type, activation_params);
51045099
5105-
51065100 // if (out_elempack == 1)
51075101 {
51085102 unsigned short * outptr1 = outptr0 + N;
@@ -5223,7 +5217,6 @@ static inline void conv3x3s1_winograd63_transform_output_tile_bf16s(const Mat& t
52235217 tmp4 = activation_ss (tmp4, activation_type, activation_params);
52245218 tmp5 = activation_ss (tmp5, activation_type, activation_params);
52255219
5226-
52275220 // if (out_elempack == 1)
52285221 {
52295222 outptr0[0 ] = float32_to_bfloat16 (tmp0);
@@ -5240,7 +5233,6 @@ static inline void conv3x3s1_winograd63_transform_output_tile_bf16s(const Mat& t
52405233 }
52415234}
52425235
5243-
52445236#if NCNN_RUNTIME_CPU && NCNN_AVX512BF16 && __AVX512F__ && !__AVX512BF16__
52455237int conv3x3s1_winograd63_bf16s_avx512bf16 (const Mat& bottom_blob, Mat& top_blob, const Mat& AT, const Mat& bias, int nT, int activation_type, const Mat& activation_params, const Option& opt);
52465238#endif
@@ -5373,4 +5365,3 @@ static int conv3x3s1_winograd63_bf16s(const Mat& bottom_blob, Mat& top_blob, con
53735365
53745366 return 0 ;
53755367}
5376-
0 commit comments