1*9356374aSAndroid Build Coastguard Worker // Copyright 2017 The Abseil Authors.
2*9356374aSAndroid Build Coastguard Worker //
3*9356374aSAndroid Build Coastguard Worker // Licensed under the Apache License, Version 2.0 (the "License");
4*9356374aSAndroid Build Coastguard Worker // you may not use this file except in compliance with the License.
5*9356374aSAndroid Build Coastguard Worker // You may obtain a copy of the License at
6*9356374aSAndroid Build Coastguard Worker //
7*9356374aSAndroid Build Coastguard Worker // https://www.apache.org/licenses/LICENSE-2.0
8*9356374aSAndroid Build Coastguard Worker //
9*9356374aSAndroid Build Coastguard Worker // Unless required by applicable law or agreed to in writing, software
10*9356374aSAndroid Build Coastguard Worker // distributed under the License is distributed on an "AS IS" BASIS,
11*9356374aSAndroid Build Coastguard Worker // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12*9356374aSAndroid Build Coastguard Worker // See the License for the specific language governing permissions and
13*9356374aSAndroid Build Coastguard Worker // limitations under the License.
14*9356374aSAndroid Build Coastguard Worker
15*9356374aSAndroid Build Coastguard Worker #ifndef ABSL_RANDOM_INTERNAL_CHI_SQUARE_H_
16*9356374aSAndroid Build Coastguard Worker #define ABSL_RANDOM_INTERNAL_CHI_SQUARE_H_
17*9356374aSAndroid Build Coastguard Worker
18*9356374aSAndroid Build Coastguard Worker // The chi-square statistic.
19*9356374aSAndroid Build Coastguard Worker //
20*9356374aSAndroid Build Coastguard Worker // Useful for evaluating if `D` independent random variables are behaving as
21*9356374aSAndroid Build Coastguard Worker // expected, or if two distributions are similar. (`D` is the degrees of
22*9356374aSAndroid Build Coastguard Worker // freedom).
23*9356374aSAndroid Build Coastguard Worker //
24*9356374aSAndroid Build Coastguard Worker // Each bucket should have an expected count of 10 or more for the chi square to
25*9356374aSAndroid Build Coastguard Worker // be meaningful.
26*9356374aSAndroid Build Coastguard Worker
27*9356374aSAndroid Build Coastguard Worker #include <cassert>
28*9356374aSAndroid Build Coastguard Worker
29*9356374aSAndroid Build Coastguard Worker #include "absl/base/config.h"
30*9356374aSAndroid Build Coastguard Worker
31*9356374aSAndroid Build Coastguard Worker namespace absl {
32*9356374aSAndroid Build Coastguard Worker ABSL_NAMESPACE_BEGIN
33*9356374aSAndroid Build Coastguard Worker namespace random_internal {
34*9356374aSAndroid Build Coastguard Worker
// Human-readable name of the chi-squared statistic.
constexpr char kChiSquared[] = "chi-squared";
36*9356374aSAndroid Build Coastguard Worker
// Returns the measured chi-square value of the buckets in [begin, end) against
// a single expected value shared by every bucket, i.e. the buckets are assumed
// to be uniformly distributed:
//
//   sum((observed - expected)^2) / expected
//
// Each dereferenced element must be convertible to `double` via `static_cast`.
// In debug builds, `expected` is asserted to be at least 10, since the
// statistic is not meaningful for sparsely populated buckets. An empty range
// yields 0.
template <typename Iterator>
double ChiSquareWithExpected(Iterator begin, Iterator end, double expected) {
  assert(expected >= 10);  // require at least 10 samples per bucket.

  // Accumulate the squared deviations first; because `expected` is the same
  // for every bucket, a single division at the end suffices.
  double sum_sq_dev = 0;
  for (Iterator it = begin; it != end; ++it) {
    const double deviation = static_cast<double>(*it) - expected;
    sum_sq_dev += deviation * deviation;
  }
  return sum_sq_dev / expected;
}
51*9356374aSAndroid Build Coastguard Worker
// Returns the measured chi-square value, taking the actual (observed) value of
// each bucket from [it, end) and the expected value of the corresponding
// bucket from [eit, eend):
//
//   sum((observed_i - expected_i)^2 / expected_i)
//
// Buckets whose observed and expected values are equal contribute nothing, so
// a bucket with both values zero is permitted. In debug builds it is asserted
// that any bucket with a non-zero deviation has a positive expected value, and
// that both ranges have the same length.
template <typename Iterator, typename Expected>
double ChiSquare(Iterator it, Iterator end, Expected eit, Expected eend) {
  double chi_square = 0;
  for (; it != end && eit != eend; ++it, ++eit) {
    if (*it > 0) {
      assert(*eit > 0);
    }
    const double e = static_cast<double>(*eit);
    // Convert to double *before* subtracting. Subtracting in the element type
    // wraps around for unsigned counts whenever observed < expected (and can
    // overflow for signed ones), which would corrupt the statistic.
    const double d = static_cast<double>(*it) - e;
    if (d != 0) {
      assert(e > 0);
      chi_square += (d * d) / e;
    }
  }
  // Both ranges must be exhausted together; otherwise the bucket counts differ.
  assert(it == end && eit == eend);
  return chi_square;
}
72*9356374aSAndroid Build Coastguard Worker
73*9356374aSAndroid Build Coastguard Worker // ======================================================================
74*9356374aSAndroid Build Coastguard Worker // The following methods can be used for an arbitrary significance level.
75*9356374aSAndroid Build Coastguard Worker //
76*9356374aSAndroid Build Coastguard Worker
// Calculates critical chi-square values to produce the given p-value using a
// bisection search for a value within epsilon, relying on the monotonicity of
// ChiSquarePValue().
//
// NOTE(review): `dof` is presumably the degrees of freedom and `p` the target
// p-value; the definition is not in this header, so confirm the accepted
// ranges against the implementation.
double ChiSquareValue(int dof, double p);
81*9356374aSAndroid Build Coastguard Worker
// Calculates the p-value (probability) of a given chi-square value.
//
// NOTE(review): `dof` is presumably the degrees of freedom of the
// distribution; the definition is not in this header, so confirm against the
// implementation. Note that the argument order (statistic first, then `dof`)
// is the reverse of ChiSquareValue(dof, p).
double ChiSquarePValue(double chi_square, int dof);
84*9356374aSAndroid Build Coastguard Worker
85*9356374aSAndroid Build Coastguard Worker } // namespace random_internal
86*9356374aSAndroid Build Coastguard Worker ABSL_NAMESPACE_END
87*9356374aSAndroid Build Coastguard Worker } // namespace absl
88*9356374aSAndroid Build Coastguard Worker
89*9356374aSAndroid Build Coastguard Worker #endif // ABSL_RANDOM_INTERNAL_CHI_SQUARE_H_
90