xref: /aosp_15_r20/external/XNNPACK/test/raddexpminusmax-microkernel-tester.h (revision 4bdc94577ba0e567308109d787f7fec7b531ce36)
1*4bdc9457SAndroid Build Coastguard Worker // Copyright 2019 Google LLC
2*4bdc9457SAndroid Build Coastguard Worker //
3*4bdc9457SAndroid Build Coastguard Worker // This source code is licensed under the BSD-style license found in the
4*4bdc9457SAndroid Build Coastguard Worker // LICENSE file in the root directory of this source tree.
5*4bdc9457SAndroid Build Coastguard Worker 
6*4bdc9457SAndroid Build Coastguard Worker #pragma once
7*4bdc9457SAndroid Build Coastguard Worker 
#include <gtest/gtest.h>

#include <algorithm>
#include <cassert>
#include <cmath>
#include <cstddef>
#include <cstdlib>
#include <functional>
#include <random>
#include <vector>

#include <xnnpack.h>
#include <xnnpack/microfnptr.h>
20*4bdc9457SAndroid Build Coastguard Worker 
21*4bdc9457SAndroid Build Coastguard Worker 
22*4bdc9457SAndroid Build Coastguard Worker class RAddExpMinusMaxMicrokernelTester {
23*4bdc9457SAndroid Build Coastguard Worker  public:
elements(size_t elements)24*4bdc9457SAndroid Build Coastguard Worker   inline RAddExpMinusMaxMicrokernelTester& elements(size_t elements) {
25*4bdc9457SAndroid Build Coastguard Worker     assert(elements != 0);
26*4bdc9457SAndroid Build Coastguard Worker     this->elements_ = elements;
27*4bdc9457SAndroid Build Coastguard Worker     return *this;
28*4bdc9457SAndroid Build Coastguard Worker   }
29*4bdc9457SAndroid Build Coastguard Worker 
elements()30*4bdc9457SAndroid Build Coastguard Worker   inline size_t elements() const {
31*4bdc9457SAndroid Build Coastguard Worker     return this->elements_;
32*4bdc9457SAndroid Build Coastguard Worker   }
33*4bdc9457SAndroid Build Coastguard Worker 
iterations(size_t iterations)34*4bdc9457SAndroid Build Coastguard Worker   inline RAddExpMinusMaxMicrokernelTester& iterations(size_t iterations) {
35*4bdc9457SAndroid Build Coastguard Worker     this->iterations_ = iterations;
36*4bdc9457SAndroid Build Coastguard Worker     return *this;
37*4bdc9457SAndroid Build Coastguard Worker   }
38*4bdc9457SAndroid Build Coastguard Worker 
iterations()39*4bdc9457SAndroid Build Coastguard Worker   inline size_t iterations() const {
40*4bdc9457SAndroid Build Coastguard Worker     return this->iterations_;
41*4bdc9457SAndroid Build Coastguard Worker   }
42*4bdc9457SAndroid Build Coastguard Worker 
Test(xnn_f32_raddexpminusmax_ukernel_function raddexpminusmax)43*4bdc9457SAndroid Build Coastguard Worker   void Test(xnn_f32_raddexpminusmax_ukernel_function raddexpminusmax) const {
44*4bdc9457SAndroid Build Coastguard Worker     std::random_device random_device;
45*4bdc9457SAndroid Build Coastguard Worker     auto rng = std::mt19937(random_device());
46*4bdc9457SAndroid Build Coastguard Worker     // Choose such range that expf(x[i]) overflows, but expf(x[i] - x_max) doesn't.
47*4bdc9457SAndroid Build Coastguard Worker     // However, the range is still narrow enough that single-precision exp doesn't overflow.
48*4bdc9457SAndroid Build Coastguard Worker     auto f32rng = std::bind(std::uniform_real_distribution<float>(90.0f, 100.0f), rng);
49*4bdc9457SAndroid Build Coastguard Worker 
50*4bdc9457SAndroid Build Coastguard Worker     std::vector<float> x(elements() + XNN_EXTRA_BYTES / sizeof(float));
51*4bdc9457SAndroid Build Coastguard Worker     for (size_t iteration = 0; iteration < iterations(); iteration++) {
52*4bdc9457SAndroid Build Coastguard Worker       std::generate(x.begin(), x.end(), std::ref(f32rng));
53*4bdc9457SAndroid Build Coastguard Worker 
54*4bdc9457SAndroid Build Coastguard Worker       // Compute reference results.
55*4bdc9457SAndroid Build Coastguard Worker       double sum_ref = 0.0f;
56*4bdc9457SAndroid Build Coastguard Worker       const float x_max = *std::max_element(x.begin(), x.begin() + elements());
57*4bdc9457SAndroid Build Coastguard Worker       for (size_t i = 0; i < elements(); i++) {
58*4bdc9457SAndroid Build Coastguard Worker         sum_ref += exp(x[i] - x_max);
59*4bdc9457SAndroid Build Coastguard Worker       }
60*4bdc9457SAndroid Build Coastguard Worker 
61*4bdc9457SAndroid Build Coastguard Worker       // Call optimized micro-kernel.
62*4bdc9457SAndroid Build Coastguard Worker       float sum = std::nanf("");
63*4bdc9457SAndroid Build Coastguard Worker       raddexpminusmax(elements() * sizeof(float), x.data(), &sum, x_max);
64*4bdc9457SAndroid Build Coastguard Worker 
65*4bdc9457SAndroid Build Coastguard Worker       // Verify results.
66*4bdc9457SAndroid Build Coastguard Worker       ASSERT_NEAR(sum_ref, double(sum), std::abs(sum_ref) * 1.0e-6)
67*4bdc9457SAndroid Build Coastguard Worker         << "elements = " << elements() << ", x_max = " << x_max;
68*4bdc9457SAndroid Build Coastguard Worker     }
69*4bdc9457SAndroid Build Coastguard Worker   }
70*4bdc9457SAndroid Build Coastguard Worker 
71*4bdc9457SAndroid Build Coastguard Worker  private:
72*4bdc9457SAndroid Build Coastguard Worker   size_t elements_{1};
73*4bdc9457SAndroid Build Coastguard Worker   size_t iterations_{15};
74*4bdc9457SAndroid Build Coastguard Worker };
75