/aosp_15_r20/external/XNNPACK/src/qs8-gemm/gen/ |
H A D | 2x16c16-minmax-rndnu-neon-mlal.c | 222 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c16__neon_mlal() local 286 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c16__neon_mlal() local
|
H A D | 2x16c8-minmax-rndnu-neon-mull.c | 190 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mull() local 255 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mull() local
|
H A D | 2x16c8-minmax-rndnu-neon-mlal.c | 329 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mlal() local 394 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c8__neon_mlal() local
|
H A D | 3x16c16-minmax-rndnu-neon-mlal.c | 293 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local 369 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
|
H A D | 3x16c8-minmax-rndnu-neon-mull.c | 245 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local 322 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
|
H A D | 4x16c8-minmax-rndnu-neon-mull.c | 300 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local 389 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
|
H A D | 3x16c8-minmax-rndnu-neon-mlal.c | 434 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local 511 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
|
H A D | 4x16c16-minmax-rndnu-neon-mlal.c | 364 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local 452 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
|
H A D | 2x16c4s2-minmax-rndnu-neon-mull.c | 191 const int32x2_t vsum1xEF = vpadd_s32(vget_low_s32(vacc1xEF), vget_high_s32(vacc1xEF)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4s2__neon_mull() local
|
H A D | 4x16c8-minmax-rndnu-neon-mlal.c | 539 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local 628 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
|
H A D | 2x16c4-minmax-rndnu-neon-mull-ld1r.c | 248 const int32x2_t vsum1xEF = vpadd_s32(vget_low_s32(vacc1xEF), vget_high_s32(vacc1xEF)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld1r() local
|
H A D | 2x16c4-minmax-rndnu-neon-mull-ld2r.c | 246 const int32x2_t vsum1xEF = vpadd_s32(vget_low_s32(vacc1xEF), vget_high_s32(vacc1xEF)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld2r() local
|
H A D | 2x16c4-minmax-rndnu-neon-mull-dup.c | 246 const int32x2_t vsum1xEF = vpadd_s32(vget_low_s32(vacc1xEF), vget_high_s32(vacc1xEF)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x16c4__neon_mull_dup() local
|
/aosp_15_r20/external/XNNPACK/src/qs8-igemm/gen/ |
H A D | 2x16c8-minmax-rndnu-neon-mull.c | 206 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mull() local 271 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mull() local
|
H A D | 2x16c16-minmax-rndnu-neon-mlal.c | 238 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c16__neon_mlal() local 302 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c16__neon_mlal() local
|
H A D | 2x16c8-minmax-rndnu-neon-mlal.c | 345 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mlal() local 410 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c8__neon_mlal() local
|
H A D | 3x16c8-minmax-rndnu-neon-mull.c | 263 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local 340 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mull() local
|
H A D | 3x16c16-minmax-rndnu-neon-mlal.c | 311 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local 387 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c16__neon_mlal() local
|
H A D | 4x16c8-minmax-rndnu-neon-mull.c | 320 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local 409 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mull() local
|
H A D | 4x16c16-minmax-rndnu-neon-mlal.c | 384 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local 472 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c16__neon_mlal() local
|
H A D | 3x16c8-minmax-rndnu-neon-mlal.c | 452 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local 529 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x16c8__neon_mlal() local
|
H A D | 4x16c8-minmax-rndnu-neon-mlal.c | 559 const int32x4_t vsum1xEF = vpaddq_s32(vacc1x14, vacc1x15); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local 648 const int32x2_t vsum1xEF = vpadd_s32(vpsum1xE, vpsum1xF); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x16c8__neon_mlal() local
|
H A D | 2x16c4s2-minmax-rndnu-neon-mull.c | 207 const int32x2_t vsum1xEF = vpadd_s32(vget_low_s32(vacc1xEF), vget_high_s32(vacc1xEF)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4s2__neon_mull() local
|
H A D | 2x16c4-minmax-rndnu-neon-mull-ld2r.c | 261 const int32x2_t vsum1xEF = vpadd_s32(vget_low_s32(vacc1xEF), vget_high_s32(vacc1xEF)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld2r() local
|
H A D | 2x16c4-minmax-rndnu-neon-mull-ld1r.c | 263 const int32x2_t vsum1xEF = vpadd_s32(vget_low_s32(vacc1xEF), vget_high_s32(vacc1xEF)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x16c4__neon_mull_ld1r() local
|