/aosp_15_r20/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8avgpool/ |
H A D | mp8x9p8q-neon.c | 83 const uint16x8_t vsum45 = vaddl_u8(vi4, vi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__neon() local 136 const uint16x8_t vsum45 = vaddl_u8(vi4, vi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__neon() local 189 const uint16x8_t vsum45 = vaddl_u8(vi4, vi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__neon() local 239 const uint16x8_t vsum45 = vaddl_u8(vi4, vi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__neon() local 313 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in pytorch_q8avgpool_ukernel_mp8x9p8q__neon() local 389 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in pytorch_q8avgpool_ukernel_mp8x9p8q__neon() local
|
H A D | mp8x9p8q-sse2.c | 82 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__sse2() local 144 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__sse2() local 205 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__sse2() local 263 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__sse2() local 344 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__sse2() local 422 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in pytorch_q8avgpool_ukernel_mp8x9p8q__sse2() local
|
/aosp_15_r20/external/XNNPACK/src/f32-gavgpool/ |
H A D | 7p7x-minmax-neon-c4.c | 49 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local 81 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local 135 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local 163 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__neon_c4() local
|
H A D | 7p7x-minmax-wasmsimd-x86-c4.c | 56 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local 96 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local 158 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local 187 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_x86_c4() local
|
H A D | 7p7x-minmax-wasmsimd-arm-c4.c | 56 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local 96 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local 158 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local 187 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasmsimd_arm_c4() local
|
H A D | 7p7x-minmax-sse-c4.c | 56 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local 95 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local 157 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local 186 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_gavgpool_minmax_ukernel_7p7x__sse_c4() local
|
H A D | 7p7x-minmax-wasm-c1.c | 47 const float vsum45 = vi4 + vi5; in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasm_c1() local 80 const float vsum45 = vi4 + vi5; in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasm_c1() local 134 const float vsum45 = vi4 + vi5; in xnn_f32_gavgpool_minmax_ukernel_7p7x__wasm_c1() local
|
H A D | 7p7x-minmax-scalar-c1.c | 47 const float vsum45 = vi4 + vi5; in xnn_f32_gavgpool_minmax_ukernel_7p7x__scalar_c1() local 80 const float vsum45 = vi4 + vi5; in xnn_f32_gavgpool_minmax_ukernel_7p7x__scalar_c1() local 134 const float vsum45 = vi4 + vi5; in xnn_f32_gavgpool_minmax_ukernel_7p7x__scalar_c1() local
|
/aosp_15_r20/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8gavgpool/ |
H A D | mp8x7p7q-neon.c | 60 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local 105 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local 186 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local 259 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in pytorch_q8gavgpool_ukernel_mp8x7p7q__neon() local
|
/aosp_15_r20/external/XNNPACK/src/f32-avgpool/ |
H A D | 9p8x-minmax-wasmsimd-arm-c4.c | 105 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 182 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 282 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 311 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local
|
H A D | 9p8x-minmax-wasmsimd-x86-c4.c | 105 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 182 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 282 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 311 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local
|
H A D | 9p8x-minmax-sse-c4.c | 105 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local 181 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local 280 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local 309 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__sse_c4() local
|
H A D | 9p8x-minmax-neon-c4.c | 96 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local 164 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local 255 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local 283 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_avgpool_minmax_ukernel_9p8x__neon_c4() local
|
/aosp_15_r20/external/XNNPACK/src/f16-avgpool/ |
H A D | 9p8x-minmax-neonfp16arith-c8.c | 96 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 164 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 255 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 283 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_avgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local
|
H A D | 9p8x-minmax-f16c-c8.c | 107 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local 184 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local 285 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local 314 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_avgpool_minmax_ukernel_9p8x__f16c_c8() local
|
/aosp_15_r20/external/XNNPACK/src/f32-pavgpool/ |
H A D | 9p8x-minmax-wasmsimd-x86-c4.c | 105 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 182 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 285 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local 314 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_x86_c4() local
|
H A D | 9p8x-minmax-wasmsimd-arm-c4.c | 105 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 182 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 285 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local 314 const v128_t vsum45 = wasm_f32x4_add(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasmsimd_arm_c4() local
|
H A D | 9p8x-minmax-sse-c4.c | 105 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local 181 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local 283 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local 312 const __m128 vsum45 = _mm_add_ps(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__sse_c4() local
|
H A D | 9p8x-minmax-neon-c4.c | 96 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local 164 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local 256 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local 284 const float32x4_t vsum45 = vaddq_f32(vi4, vi5); in xnn_f32_pavgpool_minmax_ukernel_9p8x__neon_c4() local
|
H A D | 9p8x-minmax-wasm-c1.c | 96 const float vsum45 = vi4 + vi5; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() local 165 const float vsum45 = vi4 + vi5; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() local 257 const float vsum45 = vi4 + vi5; in xnn_f32_pavgpool_minmax_ukernel_9p8x__wasm_c1() local
|
H A D | 9p8x-minmax-scalar-c1.c | 96 const float vsum45 = vi4 + vi5; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() local 165 const float vsum45 = vi4 + vi5; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() local 257 const float vsum45 = vi4 + vi5; in xnn_f32_pavgpool_minmax_ukernel_9p8x__scalar_c1() local
|
/aosp_15_r20/external/XNNPACK/src/f16-pavgpool/ |
H A D | 9p8x-minmax-neonfp16arith-c8.c | 96 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 164 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 256 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local 284 const float16x8_t vsum45 = vaddq_f16(vi4, vi5); in xnn_f16_pavgpool_minmax_ukernel_9p8x__neonfp16arith_c8() local
|
H A D | 9p8x-minmax-avx2-c8.c | 107 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local 184 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local 287 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local 316 …const __m256 vsum45 = _mm256_cvtph_ps(_mm256_cvtps_ph(_mm256_add_ps(vi4, vi5), _MM_FROUND_NO_EXC)); in xnn_f16_pavgpool_minmax_ukernel_9p8x__avx2_c8() local
|
/aosp_15_r20/external/XNNPACK/src/qu8-avgpool/ |
H A D | 9p8x-minmax-neon-c8.c | 107 const uint16x8_t vsum45 = vaddl_u8(vi4, vi5); in xnn_qu8_avgpool_minmax_ukernel_9p8x__neon_c8() local 180 const uint16x8_t vsum45 = vaddl_u8(vi4, vi5); in xnn_qu8_avgpool_minmax_ukernel_9p8x__neon_c8() local 275 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in xnn_qu8_avgpool_minmax_ukernel_9p8x__neon_c8() local 349 const int16x8_t vsum45 = vreinterpretq_s16_u16(vaddl_u8(vi4, vi5)); in xnn_qu8_avgpool_minmax_ukernel_9p8x__neon_c8() local
|
H A D | 9p8x-minmax-sse2-c8.c | 112 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in xnn_qu8_avgpool_minmax_ukernel_9p8x__sse2_c8() local 195 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in xnn_qu8_avgpool_minmax_ukernel_9p8x__sse2_c8() local 301 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in xnn_qu8_avgpool_minmax_ukernel_9p8x__sse2_c8() local 376 const __m128i vsum45 = _mm_add_epi16(vxi4, vxi5); in xnn_qu8_avgpool_minmax_ukernel_9p8x__sse2_c8() local
|