@@ -33,6 +33,7 @@ void gemm_s8(bool is_transA,
3333 Dtype* C,
3434 const float * bias,
3535 bool is_bias,
36+ GemmBiasDirection bias_direction,
3637 const float * scale,
3738 const operators::ActivationParam act_param,
3839 ARMContext* ctx) {
@@ -83,8 +84,19 @@ void gemm_s8(bool is_transA,
8384 int lda = is_transA ? M : K;
8485 prepackA_int8 (packed_A, A, lda, 0 , M, 0 , K, is_transA, ctx);
8586
86- gemm_prepack_int8<Dtype>(
87- packed_A, B, bias, C, M, N, K, is_bias, is_transB, scale, act_param, ctx);
87+ gemm_prepack_int8<Dtype>(packed_A,
88+ B,
89+ bias,
90+ C,
91+ M,
92+ N,
93+ K,
94+ is_bias,
95+ bias_direction,
96+ is_transB,
97+ scale,
98+ act_param,
99+ ctx);
88100}
89101
90102template void gemm_s8<float >(bool is_transA,
@@ -97,6 +109,7 @@ template void gemm_s8<float>(bool is_transA,
97109 float * C,
98110 const float * bias,
99111 bool is_bias,
112+ GemmBiasDirection bias_direction,
100113 const float * scale,
101114 const operators::ActivationParam act_param,
102115 ARMContext* ctx);
@@ -111,6 +124,7 @@ template void gemm_s8<int8_t>(bool is_transA,
111124 int8_t * C,
112125 const float * bias,
113126 bool is_bias,
127+ GemmBiasDirection bias_direction,
114128 const float * scale,
115129 const operators::ActivationParam act_param,
116130 ARMContext* ctx);
@@ -127,6 +141,7 @@ void gemm_sve(bool is_transA,
127141 Dtype* C,
128142 const float * bias,
129143 bool is_bias,
144+ GemmBiasDirection bias_direction,
130145 const float * scale,
131146 const operators::ActivationParam act_param,
132147 ARMContext* ctx) {
@@ -203,6 +218,7 @@ template void gemm_sve<float>(bool is_transA,
203218 float * C,
204219 const float * bias,
205220 bool is_bias,
221+ GemmBiasDirection bias_direction,
206222 const float * scale,
207223 const operators::ActivationParam act_param,
208224 ARMContext* ctx);
@@ -217,6 +233,7 @@ template void gemm_sve<int8_t>(bool is_transA,
217233 int8_t * C,
218234 const float * bias,
219235 bool is_bias,
236+ GemmBiasDirection bias_direction,
220237 const float * scale,
221238 const operators::ActivationParam act_param,
222239 ARMContext* ctx);
0 commit comments