// xref: /aosp_15_r20/external/vixl/examples/aarch64/add2-vectors.cc (revision f5c631da2f1efdd72b5fd1e20510e4042af13d77)
// Copyright 2015, VIXL authors
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
//   * Redistributions of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//   * Redistributions in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//   * Neither the name of ARM Limited nor the names of its contributors may be
//     used to endorse or promote products derived from this software without
//     specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS CONTRIBUTORS "AS IS" AND
// ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
// WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

27*f5c631daSSadaf Ebrahimi #include "examples.h"
28*f5c631daSSadaf Ebrahimi 
29*f5c631daSSadaf Ebrahimi using namespace vixl;
30*f5c631daSSadaf Ebrahimi using namespace vixl::aarch64;
31*f5c631daSSadaf Ebrahimi 
32*f5c631daSSadaf Ebrahimi // Macro to compute the number of elements in a vector.
33*f5c631daSSadaf Ebrahimi #define ARRAY_SIZE(Array) (sizeof(Array) / sizeof((Array)[0]))
34*f5c631daSSadaf Ebrahimi #define __ masm->
35*f5c631daSSadaf Ebrahimi 
36*f5c631daSSadaf Ebrahimi /*
37*f5c631daSSadaf Ebrahimi  * This example adds two vectors with 1-byte elements using NEON instructions,
38*f5c631daSSadaf Ebrahimi  * and returns the results in the first vector.
39*f5c631daSSadaf Ebrahimi  */
GenerateAdd2Vectors(MacroAssembler * masm)40*f5c631daSSadaf Ebrahimi void GenerateAdd2Vectors(MacroAssembler* masm) {
41*f5c631daSSadaf Ebrahimi   // void add2_vectors(uint8_t *vec_a, const uint8_t *vec_b, unsigned size)
42*f5c631daSSadaf Ebrahimi   // Argument locations:
43*f5c631daSSadaf Ebrahimi   //    vec_a (pointer) -> x0
44*f5c631daSSadaf Ebrahimi   //    vec_b (pointer) -> x1
45*f5c631daSSadaf Ebrahimi   //    size (integer) -> w2
46*f5c631daSSadaf Ebrahimi   // Result returned in vec_a.
47*f5c631daSSadaf Ebrahimi 
48*f5c631daSSadaf Ebrahimi   Label loop16, loopr, end;
49*f5c631daSSadaf Ebrahimi 
50*f5c631daSSadaf Ebrahimi   // Loop to add vector elements in 16-byte chunks.
51*f5c631daSSadaf Ebrahimi   __ Bind(&loop16);
52*f5c631daSSadaf Ebrahimi 
53*f5c631daSSadaf Ebrahimi   // Handle vectors smaller than 16-bytes in the remainder loop.
54*f5c631daSSadaf Ebrahimi   __ Cmp(w2, 16);
55*f5c631daSSadaf Ebrahimi   __ B(lo, &loopr);
56*f5c631daSSadaf Ebrahimi   __ Sub(w2, w2, 16);
57*f5c631daSSadaf Ebrahimi 
58*f5c631daSSadaf Ebrahimi   // Add vectors in 16-byte chunks.
59*f5c631daSSadaf Ebrahimi   __ Ld1(v0.V16B(), MemOperand(x0));
60*f5c631daSSadaf Ebrahimi   __ Ld1(v1.V16B(), MemOperand(x1, 16, PostIndex));
61*f5c631daSSadaf Ebrahimi   __ Add(v0.V16B(), v0.V16B(), v1.V16B());
62*f5c631daSSadaf Ebrahimi   __ St1(v0.V16B(), MemOperand(x0, 16, PostIndex));
63*f5c631daSSadaf Ebrahimi 
64*f5c631daSSadaf Ebrahimi   __ B(&loop16);
65*f5c631daSSadaf Ebrahimi 
66*f5c631daSSadaf Ebrahimi   // Loop to add the remaining vector elements.
67*f5c631daSSadaf Ebrahimi   __ Bind(&loopr);
68*f5c631daSSadaf Ebrahimi 
69*f5c631daSSadaf Ebrahimi   // If there are no more vector elements to process, then exit.
70*f5c631daSSadaf Ebrahimi   __ Cbz(w2, &end);
71*f5c631daSSadaf Ebrahimi   __ Sub(w2, w2, 1);
72*f5c631daSSadaf Ebrahimi 
73*f5c631daSSadaf Ebrahimi   // Add remaining vector elements in 1-byte chunks.
74*f5c631daSSadaf Ebrahimi   __ Ldrb(w5, MemOperand(x0));
75*f5c631daSSadaf Ebrahimi   __ Ldrb(w6, MemOperand(x1, 1, PostIndex));
76*f5c631daSSadaf Ebrahimi   __ Add(w5, w5, w6);
77*f5c631daSSadaf Ebrahimi   __ Strb(w5, MemOperand(x0, 1, PostIndex));
78*f5c631daSSadaf Ebrahimi 
79*f5c631daSSadaf Ebrahimi   __ B(&loopr);
80*f5c631daSSadaf Ebrahimi 
81*f5c631daSSadaf Ebrahimi   __ Bind(&end);
82*f5c631daSSadaf Ebrahimi 
83*f5c631daSSadaf Ebrahimi   __ Ret();
84*f5c631daSSadaf Ebrahimi }
85*f5c631daSSadaf Ebrahimi 
86*f5c631daSSadaf Ebrahimi 
// Print the first `num` elements of `vec` to stdout as decimal numbers, in the
// form "( a, b, c )" followed by a newline. An empty vector prints "(  )".
//
//   vec: elements to print; not dereferenced when `num` is 0.
//   num: number of elements to print.
void PrintVector(const uint8_t* vec, unsigned num) {
  printf("( ");
  for (unsigned i = 0; i < num; ++i) {
    // Emit the separator before every element except the first, so that no
    // special case is needed for the last element or for an empty vector.
    if (i > 0) {
      printf(", ");
    }
    printf("%d", vec[i]);
  }
  printf(" )\n");
}


100*f5c631daSSadaf Ebrahimi #ifndef TEST_EXAMPLES
main(void)101*f5c631daSSadaf Ebrahimi int main(void) {
102*f5c631daSSadaf Ebrahimi   MacroAssembler masm;
103*f5c631daSSadaf Ebrahimi 
104*f5c631daSSadaf Ebrahimi   // Generate native code for the example function.
105*f5c631daSSadaf Ebrahimi   Label add2_vectors;
106*f5c631daSSadaf Ebrahimi   masm.Bind(&add2_vectors);
107*f5c631daSSadaf Ebrahimi   GenerateAdd2Vectors(&masm);
108*f5c631daSSadaf Ebrahimi   masm.FinalizeCode();
109*f5c631daSSadaf Ebrahimi 
110*f5c631daSSadaf Ebrahimi   // Initialize input data for the example function.
111*f5c631daSSadaf Ebrahimi   // clang-format: off
112*f5c631daSSadaf Ebrahimi   uint8_t vec_a[] = {0,  1,  2,  3,  4,  5,  6,  7,  8,  9,  10, 11, 12,
113*f5c631daSSadaf Ebrahimi                      13, 14, 15, 0,  1,  2,  3,  4,  5,  6,  7,  8,  9,
114*f5c631daSSadaf Ebrahimi                      10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20};
115*f5c631daSSadaf Ebrahimi   uint8_t vec_b[] = {16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28,
116*f5c631daSSadaf Ebrahimi                      29, 30, 31, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25,
117*f5c631daSSadaf Ebrahimi                      26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36};
118*f5c631daSSadaf Ebrahimi   // clang-format on
119*f5c631daSSadaf Ebrahimi   uint8_t vec_c[ARRAY_SIZE(vec_a)];
120*f5c631daSSadaf Ebrahimi 
121*f5c631daSSadaf Ebrahimi   // Check whether the number of elements in both vectors match.
122*f5c631daSSadaf Ebrahimi   VIXL_CHECK(ARRAY_SIZE(vec_a) == ARRAY_SIZE(vec_b));
123*f5c631daSSadaf Ebrahimi 
124*f5c631daSSadaf Ebrahimi   // Compute the result in C.
125*f5c631daSSadaf Ebrahimi   for (unsigned i = 0; i < ARRAY_SIZE(vec_a); i++) {
126*f5c631daSSadaf Ebrahimi     vec_c[i] = vec_a[i] + vec_b[i];
127*f5c631daSSadaf Ebrahimi   }
128*f5c631daSSadaf Ebrahimi 
129*f5c631daSSadaf Ebrahimi #ifdef VIXL_INCLUDE_SIMULATOR_AARCH64
130*f5c631daSSadaf Ebrahimi   uintptr_t vec_a_addr = reinterpret_cast<uintptr_t>(vec_a);
131*f5c631daSSadaf Ebrahimi   uintptr_t vec_b_addr = reinterpret_cast<uintptr_t>(vec_b);
132*f5c631daSSadaf Ebrahimi 
133*f5c631daSSadaf Ebrahimi   // Configure register environment in the simulator.
134*f5c631daSSadaf Ebrahimi   Decoder decoder;
135*f5c631daSSadaf Ebrahimi   Simulator simulator(&decoder);
136*f5c631daSSadaf Ebrahimi   simulator.WriteXRegister(0, vec_a_addr);
137*f5c631daSSadaf Ebrahimi   simulator.WriteXRegister(1, vec_b_addr);
138*f5c631daSSadaf Ebrahimi   simulator.WriteXRegister(2, ARRAY_SIZE(vec_a));
139*f5c631daSSadaf Ebrahimi   PrintVector(vec_a, ARRAY_SIZE(vec_a));
140*f5c631daSSadaf Ebrahimi   printf(" +\n");
141*f5c631daSSadaf Ebrahimi   PrintVector(vec_b, ARRAY_SIZE(vec_b));
142*f5c631daSSadaf Ebrahimi 
143*f5c631daSSadaf Ebrahimi   // Run the example function in the simulator.
144*f5c631daSSadaf Ebrahimi   simulator.RunFrom(masm.GetLabelAddress<Instruction*>(&add2_vectors));
145*f5c631daSSadaf Ebrahimi   printf(" =\n");
146*f5c631daSSadaf Ebrahimi   PrintVector(vec_a, ARRAY_SIZE(vec_a));
147*f5c631daSSadaf Ebrahimi 
148*f5c631daSSadaf Ebrahimi   // Check that the computed value in NEON matches the C version.
149*f5c631daSSadaf Ebrahimi   for (unsigned i = 0; i < ARRAY_SIZE(vec_a); i++) {
150*f5c631daSSadaf Ebrahimi     VIXL_CHECK(vec_c[i] == vec_a[i]);
151*f5c631daSSadaf Ebrahimi   }
152*f5c631daSSadaf Ebrahimi #else
153*f5c631daSSadaf Ebrahimi   USE(vec_c);
154*f5c631daSSadaf Ebrahimi 
155*f5c631daSSadaf Ebrahimi   // Placeholder to run test natively.
156*f5c631daSSadaf Ebrahimi   printf("Running tests natively is not supported yet.\n");
157*f5c631daSSadaf Ebrahimi #endif  // VIXL_INCLUDE_SIMULATOR_AARCH64
158*f5c631daSSadaf Ebrahimi 
159*f5c631daSSadaf Ebrahimi   return 0;
160*f5c631daSSadaf Ebrahimi }
161*f5c631daSSadaf Ebrahimi #endif  // TEST_EXAMPLES
162