/*
 * Copyright (C) 2017 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/**
 * Tests for halving-add idiomatic vectorization.
 *
 * Alternative version expressed with logical shift right
 * in the higher precision (has no impact on idiom).
 *
 * <p>Each kernel below is preceded by {@code /// CHECK} directives. Those lines are test
 * expectations, not ordinary comments: keep their tokens intact when editing this file.
 */
public class HaddAltShort {

  /** Base element count of the test arrays. */
  private static final int N = 64 * 1024;

  /**
   * Actual array length; the 31 extra elements exist to exercise the cleanup loop
   * (see the initialization comment in {@link #main()}).
   */
  private static final int M = N + 31;

  // First input, second input and output arrays shared by all kernels.
  static short[] sB1 = new short[M];
  static short[] sB2 = new short[M];
  static short[] sBo = new short[M];

  /**
   * Stores {@code (short) ((b1[i] + b2[i]) >>> 1)} into {@code bo[i]} for every index below the
   * shortest of the three array lengths. Operands are used as signed 16-bit values.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @param bo output array
   */
  /// CHECK-START: void HaddAltShort.halving_add_signed(short[], short[], short[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltShort.halving_add_signed(short[], short[], short[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltShort.halving_add_signed(short[], short[], short[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  private static void halving_add_signed(short[] b1, short[] b2, short[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (short) ((b1[i] + b2[i]) >>> 1);
    }
  }

  /**
   * Stores the halved sum of {@code b1[i]} and {@code b2[i]}, each first masked with
   * {@code 0xffff} (i.e. treated as unsigned 16-bit), into {@code bo[i]} for every index below
   * the shortest of the three array lengths.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @param bo output array
   */
  /// CHECK-START: void HaddAltShort.halving_add_unsigned(short[], short[], short[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<Get2>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<And1>>,<<And2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START: void HaddAltShort.halving_add_unsigned(short[], short[], short[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltShort.halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltShort.halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  private static void halving_add_unsigned(short[] b1, short[] b2, short[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      int v1 = b1[i] & 0xffff;
      int v2 = b2[i] & 0xffff;
      bo[i] = (short) ((v1 + v2) >>> 1);
    }
  }

  /**
   * Stores {@code (short) ((b1[i] + b2[i] + 1) >>> 1)} into {@code bo[i]} for every index below
   * the shortest of the three array lengths. Operands are used as signed 16-bit values; the
   * added 1 makes the halving round up.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @param bo output array
   */
  /// CHECK-START: void HaddAltShort.rounding_halving_add_signed(short[], short[], short[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add2>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltShort.rounding_halving_add_signed(short[], short[], short[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltShort.rounding_halving_add_signed(short[], short[], short[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Int16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  private static void rounding_halving_add_signed(short[] b1, short[] b2, short[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      bo[i] = (short) ((b1[i] + b2[i] + 1) >>> 1);
    }
  }

  /**
   * Rounding variant of {@link #halving_add_unsigned}: both operands are masked with
   * {@code 0xffff}, summed together with 1, shifted right by one and narrowed to {@code short}.
   *
   * @param b1 first input array
   * @param b2 second input array
   * @param bo output array
   */
  /// CHECK-START: void HaddAltShort.rounding_halving_add_unsigned(short[], short[], short[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And1:i\d+>> And [<<Get1>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And2:i\d+>> And [<<Get2>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<And1>>,<<And2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add2>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START: void HaddAltShort.rounding_halving_add_unsigned(short[], short[], short[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get1:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Get2:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add1:i\d+>> Add [<<Get1>>,<<Get2>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add2:i\d+>> Add [<<Add1>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add2>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltShort.rounding_halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
  /// CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltShort.rounding_halving_add_unsigned(short[], short[], short[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<Get1:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<Get2:d\d+>> VecLoad loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get1>>,<<Get2>>] packed_type:Uint16 rounded:true loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  private static void rounding_halving_add_unsigned(short[] b1, short[] b2, short[] bo) {
    int min_length = Math.min(bo.length, Math.min(b1.length, b2.length));
    for (int i = 0; i < min_length; i++) {
      int v1 = b1[i] & 0xffff;
      int v2 = b2[i] & 0xffff;
      bo[i] = (short) ((v1 + v2 + 1) >>> 1);
    }
  }

  /**
   * Stores {@code (short) ((b1[i] + 0x7fff) >>> 1)} into {@code bo[i]} for every index below the
   * shorter of the two array lengths: a signed halving add against the constant 32767.
   *
   * @param b1 input array
   * @param bo output array
   */
  /// CHECK-START: void HaddAltShort.halving_add_signed_constant(short[], short[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<SMAX:i\d+>> IntConstant 32767 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get>>,<<SMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltShort.halving_add_signed_constant(short[], short[]) loop_optimization (after)
  /// CHECK-DAG: <<SMAX:i\d+>> IntConstant 32767 loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<SMAX>>] loop:none
  /// CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltShort.halving_add_signed_constant(short[], short[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<SMAX:i\d+>> IntConstant 32767 loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<SMAX>>] loop:none
  ///     CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Int16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  private static void halving_add_signed_constant(short[] b1, short[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (short) ((b1[i] + 0x7fff) >>> 1);
    }
  }

  /**
   * Stores {@code (short) (((b1[i] & 0xffff) + 0xffff) >>> 1)} into {@code bo[i]} for every index
   * below the shorter of the two array lengths: an unsigned halving add against the constant
   * 65535.
   *
   * @param b1 input array
   * @param bo output array
   */
  /// CHECK-START: void HaddAltShort.halving_add_unsigned_constant(short[], short[]) instruction_simplifier (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:s\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<And:i\d+>> And [<<Get>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<And>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},{{i\d+}},<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START: void HaddAltShort.halving_add_unsigned_constant(short[], short[]) loop_optimization (before)
  /// CHECK-DAG: <<I1:i\d+>> IntConstant 1 loop:none
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Phi:i\d+>> Phi loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<Get:c\d+>> ArrayGet loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Add:i\d+>> Add [<<Get>>,<<UMAX>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<UShr:i\d+>> UShr [<<Add>>,<<I1>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: <<Cnv:s\d+>> TypeConversion [<<UShr>>] loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: ArraySet [{{l\d+}},<<Phi>>,<<Cnv>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM: void HaddAltShort.halving_add_unsigned_constant(short[], short[]) loop_optimization (after)
  /// CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  /// CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>] loop:none
  /// CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  /// CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  /// CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-START-ARM64: void HaddAltShort.halving_add_unsigned_constant(short[], short[]) loop_optimization (after)
  /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true'
  //
  //      HalvingAdd idiom is not supported for SVE.
  ///     CHECK-NOT: VecHalvingAdd
  //
  /// CHECK-ELSE:
  //
  ///     CHECK-DAG: <<UMAX:i\d+>> IntConstant 65535 loop:none
  ///     CHECK-DAG: <<Repl:d\d+>> VecReplicateScalar [<<UMAX>>] loop:none
  ///     CHECK-DAG: <<Get:d\d+>> VecLoad loop:<<Loop:B\d+>> outer_loop:none
  ///     CHECK-DAG: <<HAdd:d\d+>> VecHalvingAdd [<<Get>>,<<Repl>>] packed_type:Uint16 rounded:false loop:<<Loop>> outer_loop:none
  ///     CHECK-DAG: VecStore [{{l\d+}},{{i\d+}},<<HAdd>>] loop:<<Loop>> outer_loop:none
  //
  /// CHECK-FI:
  private static void halving_add_unsigned_constant(short[] b1, short[] bo) {
    int min_length = Math.min(bo.length, b1.length);
    for (int i = 0; i < min_length; i++) {
      bo[i] = (short) (((b1[i] & 0xffff) + 0xffff) >>> 1);
    }
  }

  /**
   * Fills the input arrays, runs every kernel and compares each output element against a scalar
   * reference; prints {@code "HaddAltShort passed"} when all comparisons succeed.
   *
   * <p>NOTE(review): this method takes no {@code String[]} parameter, so it is not a JVM entry
   * point; presumably an external driver calls it directly - confirm against the caller.
   *
   * @throws Error if any computed element differs from its reference value
   */
  public static void main() {
    // Some interesting values.
    short[] interesting = {
      (short) 0x0000,
      (short) 0x0001,
      (short) 0x0002,
      (short) 0x1234,
      (short) 0x8000,
      (short) 0x8001,
      (short) 0x7fff,
      (short) 0xffff
    };
    // Initialize cross-values to test all cases, and also
    // set up some extra values to exercise the cleanup loop.
    for (int i = 0; i < M; i++) {
      sB1[i] = (short) i;
      sB2[i] = interesting[i & 7];
    }

    // Test halving add idioms. Note that the expected result is computed
    // with the arithmetic >> to demonstrate the computed narrower result
    // does not depend on the wider >> or >>>.
    halving_add_signed(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      short e = (short) ((sB1[i] + sB2[i]) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      short e = (short) (((sB1[i] & 0xffff) + (sB2[i] & 0xffff)) >> 1);
      expectEquals(e, sBo[i]);
    }
    rounding_halving_add_signed(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      short e = (short) ((sB1[i] + sB2[i] + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    rounding_halving_add_unsigned(sB1, sB2, sBo);
    for (int i = 0; i < M; i++) {
      short e = (short) (((sB1[i] & 0xffff) + (sB2[i] & 0xffff) + 1) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_signed_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      short e = (short) ((sB1[i] + 0x7fff) >> 1);
      expectEquals(e, sBo[i]);
    }
    halving_add_unsigned_constant(sB1, sBo);
    for (int i = 0; i < M; i++) {
      short e = (short) (((sB1[i] & 0xffff) + 0xffff) >> 1);
      expectEquals(e, sBo[i]);
    }

    System.out.println("HaddAltShort passed");
  }

  /**
   * Fails the test when the two values differ.
   *
   * @param expected reference value
   * @param result value produced by the kernel under test
   * @throws Error carrying both values if {@code expected != result}
   */
  private static void expectEquals(int expected, int result) {
    if (expected != result) {
      throw new Error("Expected: " + expected + ", found: " + result);
    }
  }
}