Home
last modified time | relevance | path

Searched +full:k +full:- +full:block (Results 1 – 25 of 1329) sorted by relevance

12345678910>>...54

/aosp_15_r20/external/XNNPACK/test/
H A Dqs8-gemm-minmax-fp32.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qs8_gemm_minmax_fp32_ukernel_1x1c4__armsimd32
9 k-block: 4
10 - name: xnn_qs8_gemm_minmax_fp32_ukernel_1x2c4__armsimd32
12 k-block: 4
13 - name: xnn_qs8_gemm_minmax_fp32_ukernel_2x1c4__armsimd32
15 k-block: 4
16 - name: xnn_qs8_gemm_minmax_fp32_ukernel_2x2c4__armsimd32
18 k-block: 4
21 - name: xnn_qs8_gemm_minmax_fp32_ukernel_1x8c2__neon_mlal_dup
[all …]
H A Dqc8-gemm-minmax-fp32.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qc8_gemm_minmax_fp32_ukernel_1x8__aarch32_neon_mlal_lane_cortex_a7
9 k-block: 8
11 - name: xnn_qc8_gemm_minmax_fp32_ukernel_1x8__aarch32_neon_mlal_lane_prfm_cortex_a7
13 k-block: 8
15 - name: xnn_qc8_gemm_minmax_fp32_ukernel_1x8__aarch32_neonv8_mlal_lane_cortex_a35
17 k-block: 8
19 - name: xnn_qc8_gemm_minmax_fp32_ukernel_1x8__aarch32_neonv8_mlal_lane_prfm_cortex_a35
21 k-block: 8
23 - name: xnn_qc8_gemm_minmax_fp32_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a7
[all …]
H A Dqc8-igemm-minmax-fp32.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qc8_igemm_minmax_fp32_ukernel_1x8__aarch32_neon_mlal_lane_cortex_a7
9 k-block: 8
11 - name: xnn_qc8_igemm_minmax_fp32_ukernel_1x8__aarch32_neon_mlal_lane_prfm_cortex_a7
13 k-block: 8
15 - name: xnn_qc8_igemm_minmax_fp32_ukernel_1x8__aarch32_neonv8_mlal_lane_cortex_a35
17 k-block: 8
19 - name: xnn_qc8_igemm_minmax_fp32_ukernel_1x8__aarch32_neonv8_mlal_lane_prfm_cortex_a35
21 k-block: 8
23 - name: xnn_qc8_igemm_minmax_fp32_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a53
[all …]
H A Dqs8-gemm-minmax-rndnu.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qs8_gemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_cortex_a7
9 k-block: 8
11 - name: xnn_qs8_gemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_prfm_cortex_a7
13 k-block: 8
15 - name: xnn_qs8_gemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a7
17 k-block: 8
19 - name: xnn_qs8_gemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a53
21 k-block: 8
23 - name: xnn_qs8_gemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_ld64
[all …]
H A Dqs8-igemm-minmax-rndnu.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qs8_igemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_cortex_a7
9 k-block: 8
11 - name: xnn_qs8_igemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_prfm_cortex_a7
13 k-block: 8
15 - name: xnn_qs8_igemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a53
17 k-block: 8
19 - name: xnn_qs8_igemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_ld64
21 k-block: 8
23 - name: xnn_qs8_igemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_prfm_cortex_a53
[all …]
H A Dqs8-igemm-minmax-fp32.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x1c4__armsimd32
9 k-block: 4
10 - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x2c4__armsimd32
12 k-block: 4
13 - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x1c4__armsimd32
15 k-block: 4
16 - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x2c4__armsimd32
18 k-block: 4
21 - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2__neon_mlal_dup
[all …]
H A Df32-gemm-minmax.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_f32_gemm_minmax_ukernel_4x4__aarch32_vfp_ld64
9 k-block: 2
11 - name: xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a7
13 k-block: 2
15 - name: xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a53
17 k-block: 4
20 - name: xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a55
22 k-block: 4
25 - name: xnn_f32_gemm_minmax_ukernel_4x8__aarch32_neon_cortex_a75
[all …]
H A Df32-igemm-minmax.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_f32_igemm_minmax_ukernel_4x8__aarch32_neon_cortex_a7
9 k-block: 2
11 - name: xnn_f32_igemm_minmax_ukernel_4x8__aarch32_neon_cortex_a53
13 k-block: 4
16 - name: xnn_f32_igemm_minmax_ukernel_4x8__aarch32_neon_cortex_a55
18 k-block: 4
21 - name: xnn_f32_igemm_minmax_ukernel_4x8__aarch32_neon_cortex_a75
23 k-block: 4
26 - name: xnn_f32_igemm_minmax_ukernel_4x8__aarch32_neon_ld64
[all …]
H A Dqu8-gemm-minmax-fp32.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qu8_gemm_minmax_fp32_ukernel_4x16c4__aarch64_neondot_cortex_a55
9 k-block: 16
11 - name: xnn_qu8_gemm_minmax_fp32_ukernel_4x16c4__aarch64_neondot_ld128
13 k-block: 16
17 - name: xnn_qu8_gemm_minmax_fp32_ukernel_1x1c4__armsimd32
19 k-block: 4
20 - name: xnn_qu8_gemm_minmax_fp32_ukernel_1x2c4__armsimd32
22 k-block: 4
23 - name: xnn_qu8_gemm_minmax_fp32_ukernel_2x1c4__armsimd32
[all …]
H A Dqu8-igemm-minmax-fp32.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qu8_igemm_minmax_fp32_ukernel_4x16c4__aarch64_neondot_cortex_a55
9 k-block: 16
11 - name: xnn_qu8_igemm_minmax_fp32_ukernel_4x16c4__aarch64_neondot_ld128
13 k-block: 16
17 - name: xnn_qu8_igemm_minmax_fp32_ukernel_1x1c4__armsimd32
19 k-block: 4
20 - name: xnn_qu8_igemm_minmax_fp32_ukernel_1x2c4__armsimd32
22 k-block: 4
23 - name: xnn_qu8_igemm_minmax_fp32_ukernel_2x1c4__armsimd32
[all …]
H A Df32-gemminc-minmax.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_f32_gemminc_minmax_ukernel_1x8__aarch64_neonfma_cortex_a53
9 k-block: 8
12 - name: xnn_f32_gemminc_minmax_ukernel_1x8__aarch64_neonfma_cortex_a75
14 k-block: 8
17 - name: xnn_f32_gemminc_minmax_ukernel_1x8__aarch64_neonfma_ld64
19 k-block: 2
21 - name: xnn_f32_gemminc_minmax_ukernel_1x8__aarch64_neonfma_prfm_cortex_a75
23 k-block: 8
26 - name: xnn_f32_gemminc_minmax_ukernel_1x12__aarch64_neonfma_cortex_a53
[all …]
H A Df32-spmm-minmax.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_f32_spmm_minmax_ukernel_4x1__neon
9 k-block: 1
10 - name: xnn_f32_spmm_minmax_ukernel_4x1__neon_pipelined
12 k-block: 1
13 - name: xnn_f32_spmm_minmax_ukernel_4x1__neon_x2
15 k-block: 2
16 - name: xnn_f32_spmm_minmax_ukernel_4x1__neonfma
18 k-block: 1
19 - name: xnn_f32_spmm_minmax_ukernel_4x1__neonfma_pipelined
[all …]
H A Dqu8-gemm-minmax-rndnu.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qu8_gemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_cortex_a7
9 k-block: 8
11 - name: xnn_qu8_gemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_prfm_cortex_a7
13 k-block: 8
15 - name: xnn_qu8_gemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a7
17 k-block: 8
19 - name: xnn_qu8_gemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a53
21 k-block: 8
23 - name: xnn_qu8_gemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_ld64
[all …]
H A Dqu8-igemm-minmax-rndnu.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_qu8_igemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_cortex_a7
9 k-block: 8
11 - name: xnn_qu8_igemm_minmax_rndnu_ukernel_1x8__aarch32_neon_mlal_lane_prfm_cortex_a7
13 k-block: 8
15 - name: xnn_qu8_igemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_cortex_a53
17 k-block: 8
19 - name: xnn_qu8_igemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_ld64
21 k-block: 8
23 - name: xnn_qu8_igemm_minmax_rndnu_ukernel_4x8__aarch32_neon_mlal_lane_prfm_cortex_a53
[all …]
H A Df32-igemm-relu.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_loadsplat
8 k-block: 1
9 - name: xnn_f32_igemm_relu_ukernel_1x8__wasmsimd_splat
10 k-block: 4
11 - name: xnn_f32_igemm_relu_ukernel_1x8s4__wasmsimd
12 k-block: 4
13 - name: xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_loadsplat
14 k-block: 1
15 - name: xnn_f32_igemm_relu_ukernel_3x8__wasmsimd_splat
[all …]
H A Df32-gemm-relu.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_loadsplat
8 k-block: 1
9 - name: xnn_f32_gemm_relu_ukernel_1x8__wasmsimd_splat
10 k-block: 4
11 - name: xnn_f32_gemm_relu_ukernel_1x8s4__wasmsimd
12 k-block: 4
13 - name: xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_loadsplat
14 k-block: 1
15 - name: xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat
[all …]
H A Df32-gemm.yaml3 # This source code is licensed under the BSD-style license found in the
7 - name: xnn_f32_gemm_ukernel_4x4__aarch32_vfp_ld64
8 k-block: 2
11 - name: xnn_f32_gemm_ukernel_1x8__wasmsimd_loadsplat
12 k-block: 1
13 - name: xnn_f32_gemm_ukernel_1x8__wasmsimd_splat
14 k-block: 4
15 - name: xnn_f32_gemm_ukernel_1x8s4__wasmsimd
16 k-block: 4
17 - name: xnn_f32_gemm_ukernel_3x8__wasmsimd_loadsplat
[all …]
/aosp_15_r20/external/boringssl/src/gen/bcm/
H A Daesv8-gcm-armv8-linux.S1 // This file is generated from a similarly-named Perl script in the BoringSSL
10 .arch armv8-a+crypto
18 stp x29, x30, [sp, #-128]!
32 ldr q31, [x19, #-16] // load round N-1 keys
37 … // special case vector load initial counter so we can start first AES block as quickly as poss…
38 sub x5, x5, #1 // byte_len - 1
44 fmov d2, x10 // CTR block 2
47 fmov d1, x10 // CTR block 1
49 aesmc v0.16b, v0.16b // AES block 0 - round 0
51 rev w9, w12 // CTR block 1
[all …]
H A Daesv8-gcm-armv8-win.S1 // This file is generated from a similarly-named Perl script in the BoringSSL
10 .arch armv8-a+crypto
20 stp x29, x30, [sp, #-128]!
34 ldr q31, [x19, #-16] // load round N-1 keys
39 … // special case vector load initial counter so we can start first AES block as quickly as poss…
40 sub x5, x5, #1 // byte_len - 1
46 fmov d2, x10 // CTR block 2
49 fmov d1, x10 // CTR block 1
51 aesmc v0.16b, v0.16b // AES block 0 - round 0
53 rev w9, w12 // CTR block 1
[all …]
H A Daesv8-gcm-armv8-apple.S1 // This file is generated from a similarly-named Perl script in the BoringSSL
18 stp x29, x30, [sp, #-128]!
32 ldr q31, [x19, #-16] // load round N-1 keys
37 … // special case vector load initial counter so we can start first AES block as quickly as poss…
38 sub x5, x5, #1 // byte_len - 1
44 fmov d2, x10 // CTR block 2
47 fmov d1, x10 // CTR block 1
49 aesmc v0.16b, v0.16b // AES block 0 - round 0
51 rev w9, w12 // CTR block 1
52 fmov d3, x10 // CTR block 3
[all …]
/aosp_15_r20/external/cronet/third_party/boringssl/src/gen/bcm/
H A Daesv8-gcm-armv8-linux.S1 // This file is generated from a similarly-named Perl script in the BoringSSL
10 .arch armv8-a+crypto
18 stp x29, x30, [sp, #-128]!
32 ldr q31, [x19, #-16] // load round N-1 keys
37 … // special case vector load initial counter so we can start first AES block as quickly as poss…
38 sub x5, x5, #1 // byte_len - 1
44 fmov d2, x10 // CTR block 2
47 fmov d1, x10 // CTR block 1
49 aesmc v0.16b, v0.16b // AES block 0 - round 0
51 rev w9, w12 // CTR block 1
[all …]
H A Daesv8-gcm-armv8-win.S1 // This file is generated from a similarly-named Perl script in the BoringSSL
10 .arch armv8-a+crypto
20 stp x29, x30, [sp, #-128]!
34 ldr q31, [x19, #-16] // load round N-1 keys
39 … // special case vector load initial counter so we can start first AES block as quickly as poss…
40 sub x5, x5, #1 // byte_len - 1
46 fmov d2, x10 // CTR block 2
49 fmov d1, x10 // CTR block 1
51 aesmc v0.16b, v0.16b // AES block 0 - round 0
53 rev w9, w12 // CTR block 1
[all …]
H A Daesv8-gcm-armv8-apple.S1 // This file is generated from a similarly-named Perl script in the BoringSSL
18 stp x29, x30, [sp, #-128]!
32 ldr q31, [x19, #-16] // load round N-1 keys
37 … // special case vector load initial counter so we can start first AES block as quickly as poss…
38 sub x5, x5, #1 // byte_len - 1
44 fmov d2, x10 // CTR block 2
47 fmov d1, x10 // CTR block 1
49 aesmc v0.16b, v0.16b // AES block 0 - round 0
51 rev w9, w12 // CTR block 1
52 fmov d3, x10 // CTR block 3
[all …]
/aosp_15_r20/external/cronet/third_party/boringssl/src/crypto/fipsmodule/modes/asm/
H A Daesv8-gcm-armv8.pl19 # derived from https://github.com/ARM-software/AArch64cryptolib, original
23 # Approach - assume we don't want to reload constants, so reserve ~half of
34 # | CTR block 4k+8 | AES block 4k+4 | GHASH block 4k+0 |
37 # | CTR block 4k+9 | AES block 4k+5 | GHASH block 4k+1 |
40 # | CTR block 4k+10| AES block 4k+6 | GHASH block 4k+2 |
43 # | CTR block 4k+11| AES block 4k+7 | GHASH block 4k+3 |
50 # result for GHASH 4k+0
53 # EOR res_curr (4k+0), res_curr (4k+0), low_acc
55 # CTR block: Increment and byte reverse counter in scalar registers and transfer
65 # AES block:
[all …]
/aosp_15_r20/external/boringssl/src/crypto/fipsmodule/modes/asm/
H A Daesv8-gcm-armv8.pl19 # derived from https://github.com/ARM-software/AArch64cryptolib, original
23 # Approach - assume we don't want to reload constants, so reserve ~half of
34 # | CTR block 4k+8 | AES block 4k+4 | GHASH block 4k+0 |
37 # | CTR block 4k+9 | AES block 4k+5 | GHASH block 4k+1 |
40 # | CTR block 4k+10| AES block 4k+6 | GHASH block 4k+2 |
43 # | CTR block 4k+11| AES block 4k+7 | GHASH block 4k+3 |
50 # result for GHASH 4k+0
53 # EOR res_curr (4k+0), res_curr (4k+0), low_acc
55 # CTR block: Increment and byte reverse counter in scalar registers and transfer
65 # AES block:
[all …]

12345678910>>...54