Home
last modified time | relevance | path

Searched defs:vsum2xAB (Results 1 – 25 of 44) sorted by relevance

12

/aosp_15_r20/external/XNNPACK/src/qs8-gemm/gen/
H A D3x16c16-minmax-rndnu-neon-mlal.c299 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
390 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
H A D3x16c8-minmax-rndnu-neon-mull.c251 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
343 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
H A D4x16c8-minmax-rndnu-neon-mull.c306 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
410 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
H A D3x16c8-minmax-rndnu-neon-mlal.c440 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
532 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
H A D4x16c16-minmax-rndnu-neon-mlal.c370 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
473 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
H A D4x16c8-minmax-rndnu-neon-mlal.c545 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
649 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
H A D3x16c4s2-minmax-rndnu-neon-mull.c252 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local
H A D3x16c4-minmax-rndnu-neon-mull-ld2r.c326 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld2r() local
H A D3x16c4-minmax-rndnu-neon-mull-ld1r.c329 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld1r() local
H A D3x16c4-minmax-rndnu-neon-mull-dup.c326 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4__neon_mull_dup() local
H A D4x16c4s2-minmax-rndnu-neon-mull.c304 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c4s2__neon_mull() local
H A D3x16c4s2-minmax-rndnu-neon-mlal.c445 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c4s2__neon_mlal() local
/aosp_15_r20/external/XNNPACK/src/qs8-igemm/gen/
H A D3x16c8-minmax-rndnu-neon-mull.c269 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
361 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
H A D3x16c16-minmax-rndnu-neon-mlal.c317 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
408 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
H A D4x16c8-minmax-rndnu-neon-mull.c326 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
430 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
H A D4x16c16-minmax-rndnu-neon-mlal.c390 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
493 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
H A D3x16c8-minmax-rndnu-neon-mlal.c458 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
550 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
H A D4x16c8-minmax-rndnu-neon-mlal.c565 const int32x4_t vsum2xAB = vpaddq_s32(vacc2x10, vacc2x11); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
669 const int32x2_t vsum2xAB = vpadd_s32(vpsum2xA, vpsum2xB); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
H A D3x16c4s2-minmax-rndnu-neon-mull.c270 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4s2__neon_mull() local
H A D3x16c4-minmax-rndnu-neon-mull-ld2r.c343 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld2r() local
H A D3x16c4-minmax-rndnu-neon-mull-dup.c343 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4__neon_mull_dup() local
H A D3x16c4-minmax-rndnu-neon-mull-ld1r.c346 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4__neon_mull_ld1r() local
H A D4x16c4s2-minmax-rndnu-neon-mull.c324 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c4s2__neon_mull() local
H A D3x16c4s2-minmax-rndnu-neon-mlal.c463 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c4s2__neon_mlal() local
H A D4x16c4-minmax-rndnu-neon-mull-ld1r.c420 const int32x2_t vsum2xAB = vpadd_s32(vget_low_s32(vacc2xAB), vget_high_s32(vacc2xAB)); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c4__neon_mull_ld1r() local

12