/*
 * Copyright (C) 2017 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/**
 * Tests for halving-add idiomatic vectorization.
 *
 * Alternative version expressed with logical shift right
 * in the higher precision (has no impact on idiom).
 */
public class HaddAltChar {

  // Array length used by main(): N plus 31 extra elements so that, per the
  // comment in main(), the cleanup loop is exercised as well.
  private static final int N = 64 * 1024;
  private static final int M = N + 31;

  // Shared inputs (sB1, sB2) and output (sBo) for all idioms below.
  static char[] sB1 = new char[M];
  static char[] sB2 = new char[M];
  static char[] sBo = new char[M];

  // Unrounded halving add: bo[i] = (char) ((b1[i] + b2[i]) >>> 1) for every index below
  // the shortest of the three array lengths. The expectations below require the scalar
  // Add/UShr/TypeConversion chain to become an unrounded Uint16 VecHalvingAdd on ARM, and
  // on ARM64 unless SVE is present and ART_FORCE_TRY_PREDICATED_SIMD is 'true'.
  //
  /// CHECK-START: void HaddAltChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static void halving_add_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + b2[i]) >>> 1);
    }
  }

  // Same computation as halving_add_unsigned, but with an explicit "& 0xffff" on each
  // char operand. The expectations below show the And nodes present before
  // instruction_simplifier and absent before loop_optimization, after which the same
  // unrounded Uint16 VecHalvingAdd is required.
  //
  /// CHECK-START: void HaddAltChar.halving_add_also_unsigned(char[], char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<IMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<IMAX>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<Get2>>,<<IMAX>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<And1>>,<<And2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>     outer_loop:none
  //
  /// CHECK-START: void HaddAltChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<IMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Note: HAnd has no impact (already a zero extension).
  //
  private static void halving_add_also_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + (b2[i] & 0xffff)) >>> 1);
    }
  }

  // Rounding halving add: bo[i] = (char) ((b1[i] + b2[i] + 1) >>> 1) for every index below
  // the shortest of the three array lengths. The expectations below require a Uint16
  // VecHalvingAdd with rounded:true on ARM, and on ARM64 unless SVE is present and
  // ART_FORCE_TRY_PREDICATED_SIMD is 'true'.
  //
  /// CHECK-START: void HaddAltChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add2>>,<<I1>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static void rounding_halving_add_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + b2[i] + 1) >>> 1);
    }
  }

  // Same computation as rounding_halving_add_unsigned, but with an explicit "& 0xffff" on
  // each char operand. The expectations below show the And nodes present before
  // instruction_simplifier and absent before loop_optimization, after which the same
  // rounded Uint16 VecHalvingAdd is required.
  //
  /// CHECK-START: void HaddAltChar.rounding_halving_add_also_unsigned(char[], char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<IMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<IMAX>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<Get2>>,<<IMAX>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<And1>>,<<And2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add2>>,<<I1>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>     outer_loop:none
  //
  /// CHECK-START: void HaddAltChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>]             loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add2>>,<<I1>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  //
  /// CHECK-START-ARM64: void HaddAltChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad                               loop:<<Loop>>      outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Note: HAnd has no impact (already a zero extension).
  //
  private static void rounding_halving_add_also_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + (b2[i] & 0xffff) + 1) >>> 1);
    }
  }

  // Unrounded halving add against the constant 0xffff:
  // bo[i] = (char) ((b1[i] + 0xffff) >>> 1) for every index below the shorter of the two
  // array lengths. The expectations below require the constant 65535 to be fed through a
  // VecReplicateScalar outside the loop into an unrounded Uint16 VecHalvingAdd.
  //
  /// CHECK-START: void HaddAltChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  /// CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  ///     CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  private static void halving_add_unsigned_constant(char[] b1, char[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + 0xffff) >>> 1);
    }
  }

  // Same computation as halving_add_unsigned_constant, but with an explicit "& 0xffff" on
  // the char operand. The expectations below show the And node present before
  // instruction_simplifier and absent before loop_optimization, after which the same
  // VecReplicateScalar + unrounded Uint16 VecHalvingAdd shape is required.
  //
  /// CHECK-START: void HaddAltChar.halving_add_also_unsigned_constant(char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<And:i\d+>>  And [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<And>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>>     outer_loop:none
  //
  /// CHECK-START: void HaddAltChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>>   IntConstant 1                       loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                   loop:none
  /// CHECK-DAG: <<Phi:i\d+>>  Phi                                 loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>>  ArrayGet                            loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>>  Add [<<Get>>,<<UMAX>>]              loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>]               loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>>  TypeConversion [<<UShr>>]           loop:<<Loop>>      outer_loop:none
  /// CHECK-DAG:               ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  /// CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-IF:     hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535                     loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>]         loop:none
  ///     CHECK-DAG: <<Get:d\d+>>  VecLoad                               loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG:               VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>>      outer_loop:none
  //
  /// CHECK-FI:
  //
  // Note: HAnd has no impact (already a zero extension).
  //
  private static void halving_add_also_unsigned_constant(char[] b1, char[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + 0xffff) >>> 1);
    }
  }

  // Runs every idiom over the shared arrays and compares each output element against a
  // scalar reference; throws Error (via expectEquals) on the first mismatch and prints
  // "HaddAltChar passed" otherwise. The entry point deliberately takes no arguments;
  // presumably it is invoked by a separate driver class that is not visible in this file.
  public static void main() {
    // Some interesting values.
    char[] interesting = {
      (char) 0x0000,
      (char) 0x0001,
      (char) 0x0002,
      (char) 0x1234,
      (char) 0x8000,
      (char) 0x8001,
      (char) 0x7fff,
      (char) 0xffff
    };
    // Initialize cross-values to test all cases, and also
    // set up some extra values to exercise the cleanup loop.
    for (int i = 0; i < M; i++) {
      sB1[i] = (char) i;
      sB2[i] = interesting[i & 7];
    }

    // Test halving add idioms. Note that the expected result is computed
    // with the arithmetic >> to demonstrate the computed narrower result
    // does not depend on the wider >> or >>>.
    halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i]) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_also_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i]) >> 1);
      expectEquals(e, sBo[i]);
    }
    rounding_halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i] + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    rounding_halving_add_also_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i] + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_unsigned_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + 0xffff) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_also_unsigned_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + 0xffff) >> 1);
      expectEquals(e, sBo[i]);
    }

    System.out.println("HaddAltChar passed");
  }

  // Throws an Error naming both values when expected and result differ.
  private static void expectEquals(int expected, int result) {
    if (expected != result) {
      throw new Error("Expected: " + expected + ", found: " + result);
    }
  }
}