//===- subzero/src/IceSwitchLowering.cpp - Switch lowering ----------------===//
//
//                        The Subzero Code Generator
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
///
/// \file
/// \brief Implements platform independent analysis of switch cases to improve
/// the generated code.
///
//===----------------------------------------------------------------------===//
15*03ce13f7SAndroid Build Coastguard Worker #include "IceSwitchLowering.h"
16*03ce13f7SAndroid Build Coastguard Worker
17*03ce13f7SAndroid Build Coastguard Worker #include "IceCfgNode.h"
18*03ce13f7SAndroid Build Coastguard Worker #include "IceTargetLowering.h"
19*03ce13f7SAndroid Build Coastguard Worker
20*03ce13f7SAndroid Build Coastguard Worker #include <algorithm>
21*03ce13f7SAndroid Build Coastguard Worker
22*03ce13f7SAndroid Build Coastguard Worker namespace Ice {
23*03ce13f7SAndroid Build Coastguard Worker
clusterizeSwitch(Cfg * Func,const InstSwitch * Instr)24*03ce13f7SAndroid Build Coastguard Worker CaseClusterArray CaseCluster::clusterizeSwitch(Cfg *Func,
25*03ce13f7SAndroid Build Coastguard Worker const InstSwitch *Instr) {
26*03ce13f7SAndroid Build Coastguard Worker const SizeT NumCases = Instr->getNumCases();
27*03ce13f7SAndroid Build Coastguard Worker CaseClusterArray CaseClusters;
28*03ce13f7SAndroid Build Coastguard Worker CaseClusters.reserve(NumCases);
29*03ce13f7SAndroid Build Coastguard Worker
30*03ce13f7SAndroid Build Coastguard Worker // Load the cases
31*03ce13f7SAndroid Build Coastguard Worker CaseClusters.reserve(NumCases);
32*03ce13f7SAndroid Build Coastguard Worker for (SizeT I = 0; I < NumCases; ++I)
33*03ce13f7SAndroid Build Coastguard Worker CaseClusters.emplace_back(Instr->getValue(I), Instr->getLabel(I));
34*03ce13f7SAndroid Build Coastguard Worker
35*03ce13f7SAndroid Build Coastguard Worker // Sort the cases
36*03ce13f7SAndroid Build Coastguard Worker std::sort(CaseClusters.begin(), CaseClusters.end(),
37*03ce13f7SAndroid Build Coastguard Worker [](const CaseCluster &x, const CaseCluster &y) {
38*03ce13f7SAndroid Build Coastguard Worker return x.High < y.Low;
39*03ce13f7SAndroid Build Coastguard Worker });
40*03ce13f7SAndroid Build Coastguard Worker
41*03ce13f7SAndroid Build Coastguard Worker // Merge adjacent case ranges
42*03ce13f7SAndroid Build Coastguard Worker auto Active = CaseClusters.begin();
43*03ce13f7SAndroid Build Coastguard Worker std::for_each(Active + 1, CaseClusters.end(),
44*03ce13f7SAndroid Build Coastguard Worker [&Active](const CaseCluster &x) {
45*03ce13f7SAndroid Build Coastguard Worker if (!Active->tryAppend(x))
46*03ce13f7SAndroid Build Coastguard Worker *(++Active) = x;
47*03ce13f7SAndroid Build Coastguard Worker });
48*03ce13f7SAndroid Build Coastguard Worker CaseClusters.erase(Active + 1, CaseClusters.end());
49*03ce13f7SAndroid Build Coastguard Worker
50*03ce13f7SAndroid Build Coastguard Worker // TODO(ascull): Merge in a cycle i.e. -1(=UINTXX_MAX) to 0. This depends on
51*03ce13f7SAndroid Build Coastguard Worker // the types for correct wrap around behavior.
52*03ce13f7SAndroid Build Coastguard Worker
53*03ce13f7SAndroid Build Coastguard Worker // A small number of cases is more efficient without a jump table
54*03ce13f7SAndroid Build Coastguard Worker if (CaseClusters.size() < Func->getTarget()->getMinJumpTableSize())
55*03ce13f7SAndroid Build Coastguard Worker return CaseClusters;
56*03ce13f7SAndroid Build Coastguard Worker
57*03ce13f7SAndroid Build Coastguard Worker // Test for a single jump table. This can be done in constant time whereas
58*03ce13f7SAndroid Build Coastguard Worker // finding the best set of jump table would be quadratic, too slow(?). If
59*03ce13f7SAndroid Build Coastguard Worker // jump tables were included in the search tree we'd first have to traverse
60*03ce13f7SAndroid Build Coastguard Worker // to them. Ideally we would have an unbalanced tree which is biased towards
61*03ce13f7SAndroid Build Coastguard Worker // frequently executed code but we can't do this well without profiling data.
62*03ce13f7SAndroid Build Coastguard Worker // So, this single jump table is a good starting point where you can get to
63*03ce13f7SAndroid Build Coastguard Worker // the jump table quickly without figuring out how to unbalance the tree.
64*03ce13f7SAndroid Build Coastguard Worker const uint64_t MaxValue = CaseClusters.back().High;
65*03ce13f7SAndroid Build Coastguard Worker const uint64_t MinValue = CaseClusters.front().Low;
66*03ce13f7SAndroid Build Coastguard Worker // Don't +1 yet to avoid (INT64_MAX-0)+1 overflow
67*03ce13f7SAndroid Build Coastguard Worker const uint64_t Range = MaxValue - MinValue;
68*03ce13f7SAndroid Build Coastguard Worker
69*03ce13f7SAndroid Build Coastguard Worker // Might be too sparse for the jump table
70*03ce13f7SAndroid Build Coastguard Worker if (NumCases * 2 <= Range)
71*03ce13f7SAndroid Build Coastguard Worker return CaseClusters;
72*03ce13f7SAndroid Build Coastguard Worker // Unlikely. Would mean can't store size of jump table.
73*03ce13f7SAndroid Build Coastguard Worker if (Range == UINT64_MAX)
74*03ce13f7SAndroid Build Coastguard Worker return CaseClusters;
75*03ce13f7SAndroid Build Coastguard Worker const uint64_t TotalRange = Range + 1;
76*03ce13f7SAndroid Build Coastguard Worker
77*03ce13f7SAndroid Build Coastguard Worker // Replace everything with a jump table
78*03ce13f7SAndroid Build Coastguard Worker auto *JumpTable =
79*03ce13f7SAndroid Build Coastguard Worker InstJumpTable::create(Func, TotalRange, Instr->getLabelDefault());
80*03ce13f7SAndroid Build Coastguard Worker for (const CaseCluster &Case : CaseClusters) {
81*03ce13f7SAndroid Build Coastguard Worker // Case.High could be UINT64_MAX which makes the loop awkward. Unwrap the
82*03ce13f7SAndroid Build Coastguard Worker // last iteration to avoid wrap around problems.
83*03ce13f7SAndroid Build Coastguard Worker for (uint64_t I = Case.Low; I < Case.High; ++I)
84*03ce13f7SAndroid Build Coastguard Worker JumpTable->addTarget(I - MinValue, Case.Target);
85*03ce13f7SAndroid Build Coastguard Worker JumpTable->addTarget(Case.High - MinValue, Case.Target);
86*03ce13f7SAndroid Build Coastguard Worker Case.Target->setNeedsAlignment();
87*03ce13f7SAndroid Build Coastguard Worker }
88*03ce13f7SAndroid Build Coastguard Worker Func->addJumpTable(JumpTable);
89*03ce13f7SAndroid Build Coastguard Worker
90*03ce13f7SAndroid Build Coastguard Worker CaseClusters.clear();
91*03ce13f7SAndroid Build Coastguard Worker CaseClusters.emplace_back(MinValue, MaxValue, JumpTable);
92*03ce13f7SAndroid Build Coastguard Worker
93*03ce13f7SAndroid Build Coastguard Worker return CaseClusters;
94*03ce13f7SAndroid Build Coastguard Worker }
95*03ce13f7SAndroid Build Coastguard Worker
tryAppend(const CaseCluster & New)96*03ce13f7SAndroid Build Coastguard Worker bool CaseCluster::tryAppend(const CaseCluster &New) {
97*03ce13f7SAndroid Build Coastguard Worker // Can only append ranges with the same target and are adjacent
98*03ce13f7SAndroid Build Coastguard Worker const bool CanAppend =
99*03ce13f7SAndroid Build Coastguard Worker this->Target == New.Target && this->High + 1 == New.Low;
100*03ce13f7SAndroid Build Coastguard Worker if (CanAppend)
101*03ce13f7SAndroid Build Coastguard Worker this->High = New.High;
102*03ce13f7SAndroid Build Coastguard Worker return CanAppend;
103*03ce13f7SAndroid Build Coastguard Worker }
104*03ce13f7SAndroid Build Coastguard Worker
105*03ce13f7SAndroid Build Coastguard Worker } // end of namespace Ice
106