/aosp_15_r20/external/pytorch/aten/src/ATen/native/quantized/cpu/qnnpack/src/q8gemm/ |
H A D | 4x8c2-xzp-neon.c | 228 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a0, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 231 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a1, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 234 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a2, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 237 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a3, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 268 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a0, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 271 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a1, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 274 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a2, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 277 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a3, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 309 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a0, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() 312 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a1, 1))); in pytorch_q8gemm_xzp_ukernel_4x8c2__neon() [all …]
|
H A D | 4x-sumrows-neon.c | 113 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a0, 1))); in pytorch_q8sumrows_ukernel_4x__neon() 116 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a1, 1))); in pytorch_q8sumrows_ukernel_4x__neon() 119 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a2, 1))); in pytorch_q8sumrows_ukernel_4x__neon() 122 vld1_dup_u16(__builtin_assume_aligned((const uint16_t*)a3, 1))); in pytorch_q8sumrows_ukernel_4x__neon()
|
/aosp_15_r20/external/XNNPACK/src/f16-gavgpool-cw/ |
H A D | neonfp16arith-x4.c | 32 …const float16x4_t vmultiplier = vreinterpret_f16_u16(vld1_dup_u16(&params->neonfp16arith.multiplie… in xnn_f16_gavgpool_cw_ukernel__neonfp16arith_x4() 33 …const float16x4_t voutput_min = vreinterpret_f16_u16(vld1_dup_u16(&params->neonfp16arith.output_mi… in xnn_f16_gavgpool_cw_ukernel__neonfp16arith_x4() 34 …const float16x4_t voutput_max = vreinterpret_f16_u16(vld1_dup_u16(&params->neonfp16arith.output_ma… in xnn_f16_gavgpool_cw_ukernel__neonfp16arith_x4()
|
H A D | neonfp16arith-x8.c | 33 …const float16x4_t vmultiplier = vreinterpret_f16_u16(vld1_dup_u16(&params->neonfp16arith.multiplie… in xnn_f16_gavgpool_cw_ukernel__neonfp16arith_x8() 34 …const float16x4_t voutput_min = vreinterpret_f16_u16(vld1_dup_u16(&params->neonfp16arith.output_mi… in xnn_f16_gavgpool_cw_ukernel__neonfp16arith_x8() 35 …const float16x4_t voutput_max = vreinterpret_f16_u16(vld1_dup_u16(&params->neonfp16arith.output_ma… in xnn_f16_gavgpool_cw_ukernel__neonfp16arith_x8()
|
/aosp_15_r20/external/libaom/av1/common/arm/ |
H A D | blend_a64_hmask_neon.c | 84 const uint8x8_t m0 = vreinterpret_u8_u16(vld1_dup_u16((uint16_t *)mask)); in aom_blend_a64_hmask_neon()
|
/aosp_15_r20/external/XNNPACK/src/f16-conv-hwc2chw/ |
H A D | 3x3s2p1c3x4-neonfp16arith-2x2.c | 52 const float16x4_t vmax = vreinterpret_f16_u16(vld1_dup_u16(&params->neon.max)); in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2() 53 const float16x4_t vmin = vreinterpret_f16_u16(vld1_dup_u16(&params->neon.min)); in xnn_f16_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfp16arith_2x2()
|
/aosp_15_r20/external/libvpx/vpx_dsp/arm/ |
H A D | highbd_intrapred_neon.c | 791 l0az = vext_u16(vld1_dup_u16(left), az, 3); in vpx_highbd_d117_predictor_4x4_neon() 800 azl0 = vext_u16(vld1_dup_u16(above - 1), l0, 3); in vpx_highbd_d117_predictor_4x4_neon() 1191 l0az = vext_u16(vld1_dup_u16(left), az, 3); in vpx_highbd_d153_predictor_4x4_neon() 1200 azl0 = vext_u16(vld1_dup_u16(above - 1), l0, 3); in vpx_highbd_d153_predictor_4x4_neon() 1832 l3 = vld1_dup_u16(left + 3); in vpx_highbd_d207_predictor_4x4_neon()
|
/aosp_15_r20/external/clang/test/CodeGen/ |
H A D | aarch64-neon-ldst-one.c | 173 return vld1_dup_u16(a); in test_vld1_dup_u16()
|
H A D | arm_neon_intrinsics.c | 4455 return vld1_dup_u16(a); in test_vld1_dup_u16()
|
/aosp_15_r20/external/eigen/Eigen/src/Core/arch/NEON/ |
H A D | PacketMath.h | 1803 return vreinterpret_u16_u32(vzip_u32(vreinterpret_u32_u16(vld1_dup_u16(from)), 1804 vreinterpret_u32_u16(vld1_dup_u16(from+1))).val[0]); 1865 { return vcombine_u16(vld1_dup_u16(from), vld1_dup_u16(from+1)); } 2057 Packet4us res = vld1_dup_u16(from);
|
/aosp_15_r20/external/libgav1/src/dsp/arm/ |
H A D | intrapred_neon.cc | 1035 const uint16x4_t row = vld1_dup_u16(left + y); in Horizontal4xH_NEON()
|
/aosp_15_r20/external/neon_2_sse/ |
H A D | NEON_2_SSE.h | 1288 _NEON2SSESTORAGE uint16x4_t vld1_dup_u16(__transfersize(1) uint16_t const * ptr); // VLD1.16 {d0[]}… 9500 _NEON2SSESTORAGE uint16x4_t vld1_dup_u16(__transfersize(1) uint16_t const * ptr); // VLD1.16 {d0[]}… 9501 _NEON2SSE_INLINE _NEON2SSE_PERFORMANCE_WARNING(uint16x4_t vld1_dup_u16(__transfersize(1) uint16_t c… in _NEON2SSE_PERFORMANCE_WARNING() 9533 #define vld1_dup_s16(ptr) vld1_dup_u16((uint16_t*)ptr) 9560 #define vld1_dup_p16 vld1_dup_u16
|
/aosp_15_r20/prebuilts/rust/linux-x86/1.81.0.u1/lib/rustlib/src/rust/library/stdarch/crates/core_arch/src/arm_shared/neon/ |
H A D | mod.rs | 2179 pub unsafe fn vld1_dup_u16(ptr: *const u16) -> uint16x4_t { in vld1_dup_u16() function 10519 let r: u16x4 = transmute(vld1_dup_u16(&elem)); in test_vld1_dup_u16()
|
/aosp_15_r20/prebuilts/rust/linux-musl-x86/1.81.0/lib/rustlib/src/rust/library/stdarch/crates/core_arch/src/arm_shared/neon/ |
H A D | mod.rs | 2179 pub unsafe fn vld1_dup_u16(ptr: *const u16) -> uint16x4_t { in vld1_dup_u16() function 10519 let r: u16x4 = transmute(vld1_dup_u16(&elem)); in test_vld1_dup_u16()
|
/aosp_15_r20/prebuilts/rust/linux-musl-x86/1.80.1/lib/rustlib/src/rust/library/stdarch/crates/core_arch/src/arm_shared/neon/ |
H A D | mod.rs | 2179 pub unsafe fn vld1_dup_u16(ptr: *const u16) -> uint16x4_t { in vld1_dup_u16() function 10519 let r: u16x4 = transmute(vld1_dup_u16(&elem)); in test_vld1_dup_u16()
|
/aosp_15_r20/prebuilts/rust/linux-x86/1.81.0/lib/rustlib/src/rust/library/stdarch/crates/core_arch/src/arm_shared/neon/ |
H A D | mod.rs | 2179 pub unsafe fn vld1_dup_u16(ptr: *const u16) -> uint16x4_t { in vld1_dup_u16() function 10519 let r: u16x4 = transmute(vld1_dup_u16(&elem)); in test_vld1_dup_u16()
|
/aosp_15_r20/prebuilts/rust/linux-x86/1.80.1/lib/rustlib/src/rust/library/stdarch/crates/core_arch/src/arm_shared/neon/ |
H A D | mod.rs | 2179 pub unsafe fn vld1_dup_u16(ptr: *const u16) -> uint16x4_t { in vld1_dup_u16() function 10519 let r: u16x4 = transmute(vld1_dup_u16(&elem)); in test_vld1_dup_u16()
|
/aosp_15_r20/out/soong/.intermediates/external/clang/clang-gen-arm-neon/gen/clang/Basic/ |
D | arm_neon.h | 8058 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8064 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|
/aosp_15_r20/prebuilts/clang/host/linux-x86/clang-3289846/lib64/clang/3.8/include/ |
D | arm_neon.h | 8058 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8064 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|
/aosp_15_r20/prebuilts/sdk/renderscript/clang-include/ |
H A D | arm_neon.h | 8146 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8152 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|
/aosp_15_r20/prebuilts/clang/host/linux-x86/clang-r530567b/lib/clang/19/include/ |
D | arm_neon.h | 8892 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8898 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|
/aosp_15_r20/prebuilts/clang/host/linux-x86/clang-r522817/lib/clang/18/include/ |
D | arm_neon.h | 8892 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8898 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|
/aosp_15_r20/prebuilts/clang/host/linux-x86/clang-r536225/lib/clang/19/include/ |
D | arm_neon.h | 8970 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8976 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|
/aosp_15_r20/prebuilts/clang-tools/linux-x86/lib64/clang/19/include/ |
H A D | arm_neon.h | 8892 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8898 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|
/aosp_15_r20/prebuilts/clang/host/linux-x86/clang-r530567/lib/clang/19/include/ |
D | arm_neon.h | 8892 #define vld1_dup_u16(__p0) __extension__ ({ \ macro 8898 #define vld1_dup_u16(__p0) __extension__ ({ \ macro
|