/*
 * Copyright (C) 2017 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/**
 * Tests for halving-add idiomatic vectorization.
 *
 * Every kernel below is preceded by Checker assertions ("/// CHECK" lines) that describe
 * the scalar loop before loop optimization and the VecHalvingAdd form expected afterwards.
 * {@link #main()} then runs each kernel and compares its output, element by element,
 * against the same expression evaluated in a plain scalar loop.
 */
public class HaddChar {

  // Base element count; M appends 31 extra elements so that, per the note in main(),
  // the cleanup loop is exercised as well.
  private static final int N = 64 * 1024;
  private static final int M = N + 31;

  // Shared test buffers: two inputs and one output, filled and checked by main().
  static char[] sB1 = new char[M];
  static char[] sB2 = new char[M];
  static char[] sBo = new char[M];

  /// CHECK-START: void HaddChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  //
  // Truncating halving add: bo[i] = (char) ((b1[i] + b2[i]) >> 1) for every index below
  // the shortest of the three array lengths.
  //
  private static void halving_add_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + b2[i]) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<IMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<IMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<IMAX>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<And1>>,<<And2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  //
  // Note: HAnd has no impact (already a zero extension).
  //
  // Same truncating halving add as halving_add_unsigned, but with each operand explicitly
  // masked with 0xffff before the addition.
  //
  private static void halving_add_also_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + (b2[i] & 0xffff)) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add2>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.rounding_halving_add_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  //
  // Rounding halving add: bo[i] = (char) ((b1[i] + b2[i] + 1) >> 1) for every index below
  // the shortest of the three array lengths.
  //
  private static void rounding_halving_add_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + b2[i] + 1) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<IMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<IMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<IMAX>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<And1>>,<<And2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add2>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add2>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.rounding_halving_add_also_unsigned(char[], char[], char[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  //
  // Note: HAnd has no impact (already a zero extension).
  //
  // Same rounding halving add as rounding_halving_add_unsigned, but with each operand
  // explicitly masked with 0xffff before the addition.
  //
  private static void rounding_halving_add_also_unsigned(char[] b1, char[] b2, char[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + (b2[i] & 0xffff) + 1) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>] loop:none
  /// CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>] loop:none
  ///     CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  //
  // Truncating halving add against the constant 0xffff:
  // bo[i] = (char) ((b1[i] + 0xffff) >> 1) for every index below the shorter array length.
  //
  private static void halving_add_unsigned_constant(char[] b1, char[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) ((b1[i] + 0xffff) >> 1);
    }
  }

  /// CHECK-START: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And:i\d+>> And [<<Get>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<And>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Shr:i\d+>> Shr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:c\d+>> TypeConversion [<<Shr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>] loop:none
  /// CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddChar.halving_add_also_unsigned_constant(char[], char[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>] loop:none
  ///     CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  //
  // Note: HAnd has no impact (already a zero extension).
  //
  // Same constant halving add as halving_add_unsigned_constant, but with the array operand
  // explicitly masked with 0xffff before the addition.
  //
  private static void halving_add_also_unsigned_constant(char[] b1, char[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (char) (((b1[i] & 0xffff) + 0xffff) >> 1);
    }
  }

  // Test entry point. Fills the shared input buffers, runs every kernel and compares each
  // output element against the scalar reference expression. Prints "HaddChar passed" on
  // success; any mismatch surfaces as the Error thrown by expectEquals. Note that this
  // method takes no arguments (presumably it is invoked by a separate driver; the caller
  // is not part of this file).
  public static void main() {
    // Some interesting values.
    char[] interesting = {
      (char) 0x0000,
      (char) 0x0001,
      (char) 0x0002,
      (char) 0x1234,
      (char) 0x8000,
      (char) 0x8001,
      (char) 0x7fff,
      (char) 0xffff
    };
    // Initialize cross-values to test all cases, and also
    // set up some extra values to exercise the cleanup loop.
    for (int i = 0; i < M; i++) {
      sB1[i] = (char) i;
      sB2[i] = interesting[i & 7];
    }

    // Test halving add idioms.
    halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i]) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_also_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i]) >> 1);
      expectEquals(e, sBo[i]);
    }
    rounding_halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i] + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    rounding_halving_add_also_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + sB2[i] + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_unsigned_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + 0xffff) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_also_unsigned_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      char e = (char) ((sB1[i] + 0xffff) >> 1);
      expectEquals(e, sBo[i]);
    }

    System.out.println("HaddChar passed");
  }

  // Throws an Error naming both values when expected and result differ; otherwise returns
  // normally. main() passes char values here, which widen to int at the call.
  private static void expectEquals(int expected, int result) {
    if (expected != result) {
      throw new Error("Expected: " + expected + ", found: " + result);
    }
  }
}