/AliOS-Things-master/components/ai_agent/src/engine/tflite-micro/third_party/cmsis/CMSIS/NN/Source/FullyConnectedFunctions/ |
A D | arm_fully_connected_q7_opt.c | 179 sum3 = __SMLAD(inM13, inV, sum3); in arm_fully_connected_q7_opt() 191 sum3 = __SMLAD(inM13, inV, sum3); in arm_fully_connected_q7_opt() 210 sum3 = __SMLAD(inM14, inV, sum3); in arm_fully_connected_q7_opt() 222 sum3 = __SMLAD(inM14, inV, sum3); in arm_fully_connected_q7_opt() 271 [ sum3 ] "+r"(sum3), in arm_fully_connected_q7_opt() 309 [ sum3 ] "+r"(sum3), in arm_fully_connected_q7_opt() 330 sum3 += inV * inM3; in arm_fully_connected_q7_opt() 422 sum3 += inA1 * inB1 + inA2 * inB2; in arm_fully_connected_q7_opt() 438 sum3 += inA3 * inB1 + inA4 * inB2; in arm_fully_connected_q7_opt() 452 sum3 += inA * inB; in arm_fully_connected_q7_opt() [all …]
|
A D | arm_fully_connected_mat_q7_vec_q15_opt.c | 142 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_mat_q7_vec_q15_opt() local 167 sum3 = __SMLAD(inM13, inV, sum3); in arm_fully_connected_mat_q7_vec_q15_opt() 188 sum3 = __SMLAD(inM14, inV, sum3); in arm_fully_connected_mat_q7_vec_q15_opt() 225 [ sum3 ] "+r"(sum3), in arm_fully_connected_mat_q7_vec_q15_opt() 250 [ sum3 ] "+r"(sum3), in arm_fully_connected_mat_q7_vec_q15_opt() 271 sum3 += inV * inM3; in arm_fully_connected_mat_q7_vec_q15_opt() 277 *pO++ = (q15_t)(__SSAT((sum3 >> out_shift), 16)); in arm_fully_connected_mat_q7_vec_q15_opt() 337 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_mat_q7_vec_q15_opt() local 361 sum3 += inA1 * inB1 + inA2 * inB2; in arm_fully_connected_mat_q7_vec_q15_opt() 376 sum3 += inA * inB; in arm_fully_connected_mat_q7_vec_q15_opt() [all …]
|
A D | arm_fully_connected_q15_opt.c | 121 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_q15_opt() local 141 sum3 = __SMLAD(inV, inM13, sum3); in arm_fully_connected_q15_opt() 172 [ sum3 ] "+r"(sum3), in arm_fully_connected_q15_opt() 193 sum3 += inV * inM3; in arm_fully_connected_q15_opt() 199 *pO++ = (q15_t)(__SSAT((sum3 >> out_shift), 16)); in arm_fully_connected_q15_opt() 259 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_q15_opt() local 280 sum3 += inA1 * inB1 + inA2 * inB2; in arm_fully_connected_q15_opt() 297 sum3 += inA * inB; in arm_fully_connected_q15_opt() 304 *pO++ = (q15_t)__SSAT((sum3 >> out_shift), 16); in arm_fully_connected_q15_opt()
|
/AliOS-Things-master/components/ai_agent/src/engine/tflite-micro/tensorflow/lite/micro/tools/make/downloads/cmsis/CMSIS/NN/Source/FullyConnectedFunctions/ |
A D | arm_fully_connected_q7_opt.c | 179 sum3 = __SMLAD(inM13, inV, sum3); in arm_fully_connected_q7_opt() 191 sum3 = __SMLAD(inM13, inV, sum3); in arm_fully_connected_q7_opt() 210 sum3 = __SMLAD(inM14, inV, sum3); in arm_fully_connected_q7_opt() 222 sum3 = __SMLAD(inM14, inV, sum3); in arm_fully_connected_q7_opt() 271 [ sum3 ] "+r"(sum3), in arm_fully_connected_q7_opt() 309 [ sum3 ] "+r"(sum3), in arm_fully_connected_q7_opt() 330 sum3 += inV * inM3; in arm_fully_connected_q7_opt() 422 sum3 += inA1 * inB1 + inA2 * inB2; in arm_fully_connected_q7_opt() 438 sum3 += inA3 * inB1 + inA4 * inB2; in arm_fully_connected_q7_opt() 452 sum3 += inA * inB; in arm_fully_connected_q7_opt() [all …]
|
A D | arm_fully_connected_mat_q7_vec_q15_opt.c | 142 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_mat_q7_vec_q15_opt() local 167 sum3 = __SMLAD(inM13, inV, sum3); in arm_fully_connected_mat_q7_vec_q15_opt() 188 sum3 = __SMLAD(inM14, inV, sum3); in arm_fully_connected_mat_q7_vec_q15_opt() 225 [ sum3 ] "+r"(sum3), in arm_fully_connected_mat_q7_vec_q15_opt() 250 [ sum3 ] "+r"(sum3), in arm_fully_connected_mat_q7_vec_q15_opt() 271 sum3 += inV * inM3; in arm_fully_connected_mat_q7_vec_q15_opt() 277 *pO++ = (q15_t)(__SSAT((sum3 >> out_shift), 16)); in arm_fully_connected_mat_q7_vec_q15_opt() 337 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_mat_q7_vec_q15_opt() local 361 sum3 += inA1 * inB1 + inA2 * inB2; in arm_fully_connected_mat_q7_vec_q15_opt() 376 sum3 += inA * inB; in arm_fully_connected_mat_q7_vec_q15_opt() [all …]
|
A D | arm_fully_connected_q15_opt.c | 121 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_q15_opt() local 141 sum3 = __SMLAD(inV, inM13, sum3); in arm_fully_connected_q15_opt() 172 [ sum3 ] "+r"(sum3), in arm_fully_connected_q15_opt() 193 sum3 += inV * inM3; in arm_fully_connected_q15_opt() 199 *pO++ = (q15_t)(__SSAT((sum3 >> out_shift), 16)); in arm_fully_connected_q15_opt() 259 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_fully_connected_q15_opt() local 280 sum3 += inA1 * inB1 + inA2 * inB2; in arm_fully_connected_q15_opt() 297 sum3 += inA * inB; in arm_fully_connected_q15_opt() 304 *pO++ = (q15_t)__SSAT((sum3 >> out_shift), 16); in arm_fully_connected_q15_opt()
|
/AliOS-Things-master/components/ai_agent/src/engine/tflite-micro/third_party/cmsis/CMSIS/NN/Source/ConvolutionFunctions/ |
A D | arm_nn_mat_mult_kernel_q7_q15_reordered.c | 68 q31_t sum3 = ((q31_t)(bias[i + 1]) << bias_shift) + NN_ROUND(out_shift); in arm_nn_mat_mult_kernel_q7_q15_reordered() local 85 sum3 = __SMLAD(inA21, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15_reordered() 93 sum3 = __SMLAD(inA22, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15_reordered() 108 sum3 += inA2 * inB1; in arm_nn_mat_mult_kernel_q7_q15_reordered() 113 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_nn_mat_mult_kernel_q7_q15_reordered()
|
A D | arm_depthwise_separable_conv_HWC_q7.c | 150 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_depthwise_separable_conv_HWC_q7() local 186 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7() 221 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7() 268 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7() 312 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7() 333 sum3 += inA.bytes[2] * inB.bytes[2]; in arm_depthwise_separable_conv_HWC_q7() 340 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_depthwise_separable_conv_HWC_q7()
|
A D | arm_depthwise_separable_conv_HWC_q7_nonsquare.c | 160 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_depthwise_separable_conv_HWC_q7_nonsquare() local 196 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 231 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 275 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7_nonsquare() 317 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7_nonsquare() 337 sum3 += inA.bytes[2] * inB.bytes[2]; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 344 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_depthwise_separable_conv_HWC_q7_nonsquare()
|
A D | arm_nn_mat_mult_kernel_q7_q15.c | 68 q31_t sum3 = ((q31_t)(*pBias) << bias_shift) + NN_ROUND(out_shift); in arm_nn_mat_mult_kernel_q7_q15() local 85 sum3 = __SMLAD(inA21, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15() 93 sum3 = __SMLAD(inA22, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15() 108 sum3 += inA2 * inB1; in arm_nn_mat_mult_kernel_q7_q15() 113 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_nn_mat_mult_kernel_q7_q15()
|
A D | arm_convolve_HWC_q15_fast.c | 159 q31_t sum3 = ((q31_t)bias[i + 1] << bias_shift) + NN_ROUND(out_shift); in arm_convolve_HWC_q15_fast() local 173 sum3 = __SMLAD(inA2, inB1, sum3); in arm_convolve_HWC_q15_fast() 188 sum3 += inA2 * inB1; in arm_convolve_HWC_q15_fast() 193 *pOut++ = (q15_t)__SSAT(sum3 >> out_shift, 16); in arm_convolve_HWC_q15_fast()
|
A D | arm_convolve_HWC_q15_fast_nonsquare.c | 171 q31_t sum3 = ((q31_t)bias[i + 1] << bias_shift) + NN_ROUND(out_shift); in arm_convolve_HWC_q15_fast_nonsquare() local 185 sum3 = __SMLAD(inA2, inB1, sum3); in arm_convolve_HWC_q15_fast_nonsquare() 200 sum3 += inA2 * inB1; in arm_convolve_HWC_q15_fast_nonsquare() 205 *pOut++ = (q15_t)__SSAT(sum3 >> out_shift, 16); in arm_convolve_HWC_q15_fast_nonsquare()
|
/AliOS-Things-master/components/ai_agent/src/engine/tflite-micro/tensorflow/lite/micro/tools/make/downloads/cmsis/CMSIS/NN/Source/ConvolutionFunctions/ |
A D | arm_nn_mat_mult_kernel_q7_q15_reordered.c | 68 q31_t sum3 = ((q31_t)(bias[i + 1]) << bias_shift) + NN_ROUND(out_shift); in arm_nn_mat_mult_kernel_q7_q15_reordered() local 85 sum3 = __SMLAD(inA21, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15_reordered() 93 sum3 = __SMLAD(inA22, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15_reordered() 108 sum3 += inA2 * inB1; in arm_nn_mat_mult_kernel_q7_q15_reordered() 113 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_nn_mat_mult_kernel_q7_q15_reordered()
|
A D | arm_depthwise_separable_conv_HWC_q7.c | 150 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_depthwise_separable_conv_HWC_q7() local 186 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7() 221 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7() 268 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7() 312 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7() 333 sum3 += inA.bytes[2] * inB.bytes[2]; in arm_depthwise_separable_conv_HWC_q7() 340 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_depthwise_separable_conv_HWC_q7()
|
A D | arm_depthwise_separable_conv_HWC_q7_nonsquare.c | 160 q31_t sum3 = ((q31_t)(*pBias++) << bias_shift) + NN_ROUND(out_shift); in arm_depthwise_separable_conv_HWC_q7_nonsquare() local 196 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 231 sum3 = __SMLAD(opA, opB, sum3); in arm_depthwise_separable_conv_HWC_q7_nonsquare() 275 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7_nonsquare() 317 [ sum3 ] "+r"(sum3), in arm_depthwise_separable_conv_HWC_q7_nonsquare() 337 sum3 += inA.bytes[2] * inB.bytes[2]; in arm_depthwise_separable_conv_HWC_q7_nonsquare() 344 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_depthwise_separable_conv_HWC_q7_nonsquare()
|
A D | arm_nn_mat_mult_kernel_q7_q15.c | 68 q31_t sum3 = ((q31_t)(*pBias) << bias_shift) + NN_ROUND(out_shift); in arm_nn_mat_mult_kernel_q7_q15() local 85 sum3 = __SMLAD(inA21, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15() 93 sum3 = __SMLAD(inA22, inB1, sum3); in arm_nn_mat_mult_kernel_q7_q15() 108 sum3 += inA2 * inB1; in arm_nn_mat_mult_kernel_q7_q15() 113 *pOut++ = (q7_t)__SSAT((sum3 >> out_shift), 8); in arm_nn_mat_mult_kernel_q7_q15()
|
A D | arm_convolve_HWC_q15_fast.c | 159 q31_t sum3 = ((q31_t)bias[i + 1] << bias_shift) + NN_ROUND(out_shift); in arm_convolve_HWC_q15_fast() local 173 sum3 = __SMLAD(inA2, inB1, sum3); in arm_convolve_HWC_q15_fast() 188 sum3 += inA2 * inB1; in arm_convolve_HWC_q15_fast() 193 *pOut++ = (q15_t)__SSAT(sum3 >> out_shift, 16); in arm_convolve_HWC_q15_fast()
|
A D | arm_convolve_HWC_q15_fast_nonsquare.c | 171 q31_t sum3 = ((q31_t)bias[i + 1] << bias_shift) + NN_ROUND(out_shift); in arm_convolve_HWC_q15_fast_nonsquare() local 185 sum3 = __SMLAD(inA2, inB1, sum3); in arm_convolve_HWC_q15_fast_nonsquare() 200 sum3 += inA2 * inB1; in arm_convolve_HWC_q15_fast_nonsquare() 205 *pOut++ = (q15_t)__SSAT(sum3 >> out_shift, 16); in arm_convolve_HWC_q15_fast_nonsquare()
|
/AliOS-Things-master/hardware/chip/rtl872xd/sdk/component/soc/realtek/amebad/cmsis-dsp/Source/MatrixFunctions/ |
A D | arm_mat_mult_fast_q15.c | 95 q31_t sum2, sum3, sum4; in arm_mat_mult_fast_q15() local 297 sum3 = 0; in arm_mat_mult_fast_q15() 322 sum3 = __SMLAD(inA2, inB1, sum3); in arm_mat_mult_fast_q15() 361 sum3 += inA2 * inB1; in arm_mat_mult_fast_q15() 381 *px2++ = (q15_t) (sum3 >> 15); in arm_mat_mult_fast_q15()
|
A D | arm_mat_mult_fast_q31.c | 89 q31_t sum2, sum3, sum4; in arm_mat_mult_fast_q31() local 147 sum3 = 0; in arm_mat_mult_fast_q31() 168 sum3 = __SMMLA(inA2, inB1, sum3); in arm_mat_mult_fast_q31() 217 *px2++ = sum3 << 1; in arm_mat_mult_fast_q31()
|
/AliOS-Things-master/components/SDL2/src/image/external/libwebp-1.0.2/src/dsp/ |
A D | enc_neon.c | 768 const uint64_t sum3 = vgetq_lane_u64(sum2, 0) + vgetq_lane_u64(sum2, 1); in SumToInt_NEON() local 769 return (int)sum3; in SumToInt_NEON()
|