1*795d594fSAndroid Build Coastguard Worker /* 2*795d594fSAndroid Build Coastguard Worker * Copyright (C) 2020 The Android Open Source Project 3*795d594fSAndroid Build Coastguard Worker * 4*795d594fSAndroid Build Coastguard Worker * Licensed under the Apache License, Version 2.0 (the "License"); 5*795d594fSAndroid Build Coastguard Worker * you may not use this file except in compliance with the License. 6*795d594fSAndroid Build Coastguard Worker * You may obtain a copy of the License at 7*795d594fSAndroid Build Coastguard Worker * 8*795d594fSAndroid Build Coastguard Worker * http://www.apache.org/licenses/LICENSE-2.0 9*795d594fSAndroid Build Coastguard Worker * 10*795d594fSAndroid Build Coastguard Worker * Unless required by applicable law or agreed to in writing, software 11*795d594fSAndroid Build Coastguard Worker * distributed under the License is distributed on an "AS IS" BASIS, 12*795d594fSAndroid Build Coastguard Worker * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13*795d594fSAndroid Build Coastguard Worker * See the License for the specific language governing permissions and 14*795d594fSAndroid Build Coastguard Worker * limitations under the License. 15*795d594fSAndroid Build Coastguard Worker */ 16*795d594fSAndroid Build Coastguard Worker 17*795d594fSAndroid Build Coastguard Worker public class HaddOther { 18*795d594fSAndroid Build Coastguard Worker private static final int N = 2 * 1024; 19*795d594fSAndroid Build Coastguard Worker private static final int M = N + 31; 20*795d594fSAndroid Build Coastguard Worker 21*795d594fSAndroid Build Coastguard Worker // Should be just shift right, not halving add. 22*795d594fSAndroid Build Coastguard Worker // 23*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_short2short(short[], short[]) loop_optimization (after) 24*795d594fSAndroid Build Coastguard Worker /// CHECK: VecShr 25*795d594fSAndroid Build Coastguard Worker 26*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_short2short(short[], short[]) loop_optimization (after) 27*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecHalvingAdd test_no_hadd_short2short(short[] a, short[] out)28*795d594fSAndroid Build Coastguard Worker private static void test_no_hadd_short2short(short[] a, short[] out) { 29*795d594fSAndroid Build Coastguard Worker int min_length = Math.min(out.length, a.length); 30*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < min_length; i++) { 31*795d594fSAndroid Build Coastguard Worker out[i] = (short) (a[i] >> 1); 32*795d594fSAndroid Build Coastguard Worker } 33*795d594fSAndroid Build Coastguard Worker } 34*795d594fSAndroid Build Coastguard Worker 35*795d594fSAndroid Build Coastguard Worker // This loop is not vectorized: shift right with a signed type is not supported. 36*795d594fSAndroid Build Coastguard Worker // 37*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_short2short_logical(short[], short[]) loop_optimization (after) 38*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecLoad 39*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecHalvingAdd test_no_hadd_short2short_logical(short[] a, short[] out)40*795d594fSAndroid Build Coastguard Worker private static void test_no_hadd_short2short_logical(short[] a, short[] out) { 41*795d594fSAndroid Build Coastguard Worker int min_length = Math.min(out.length, a.length); 42*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < min_length; i++) { 43*795d594fSAndroid Build Coastguard Worker out[i] = (short) (a[i] >>> 1); 44*795d594fSAndroid Build Coastguard Worker } 45*795d594fSAndroid Build Coastguard Worker } 46*795d594fSAndroid Build Coastguard Worker 47*795d594fSAndroid Build Coastguard Worker // This loop is not vectorized: mismatched packed type size. 48*795d594fSAndroid Build Coastguard Worker // 49*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_int2short(int[], short[]) loop_optimization (after) 50*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecLoad 51*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecHalvingAdd test_no_hadd_int2short(int[] a, short[] out)52*795d594fSAndroid Build Coastguard Worker private static void test_no_hadd_int2short(int[] a, short[] out) { 53*795d594fSAndroid Build Coastguard Worker int min_length = Math.min(out.length, a.length); 54*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < min_length; i++) { 55*795d594fSAndroid Build Coastguard Worker out[i] = (short) (a[i] >> 1); 56*795d594fSAndroid Build Coastguard Worker } 57*795d594fSAndroid Build Coastguard Worker } 58*795d594fSAndroid Build Coastguard Worker 59*795d594fSAndroid Build Coastguard Worker // Should be just shift right, not halving add. 60*795d594fSAndroid Build Coastguard Worker // 61*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_int2int(int[], int[]) loop_optimization (after) 62*795d594fSAndroid Build Coastguard Worker /// CHECK: VecShr 63*795d594fSAndroid Build Coastguard Worker 64*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_int2int(int[], int[]) loop_optimization (after) 65*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecHalvingAdd test_no_hadd_int2int(int[] a, int[] out)66*795d594fSAndroid Build Coastguard Worker private static void test_no_hadd_int2int(int[] a, int[] out) { 67*795d594fSAndroid Build Coastguard Worker int min_length = Math.min(out.length, a.length); 68*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < min_length; i++) { 69*795d594fSAndroid Build Coastguard Worker out[i] = a[i] >> 1; 70*795d594fSAndroid Build Coastguard Worker } 71*795d594fSAndroid Build Coastguard Worker } 72*795d594fSAndroid Build Coastguard Worker 73*795d594fSAndroid Build Coastguard Worker // Should be just add and shift right, not halving add. 74*795d594fSAndroid Build Coastguard Worker // 75*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_sum_cast(short[], short[], short[]) loop_optimization (after) 76*795d594fSAndroid Build Coastguard Worker /// CHECK: VecAdd 77*795d594fSAndroid Build Coastguard Worker /// CHECK: VecShr 78*795d594fSAndroid Build Coastguard Worker 79*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_sum_cast(short[], short[], short[]) loop_optimization (after) 80*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecHalvingAdd test_no_hadd_sum_cast(short[] a, short[] b, short[] out)81*795d594fSAndroid Build Coastguard Worker private static void test_no_hadd_sum_cast(short[] a, short[] b, short[] out) { 82*795d594fSAndroid Build Coastguard Worker int min_length = Math.min(out.length, Math.min(a.length, b.length)); 83*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < min_length; i++) { 84*795d594fSAndroid Build Coastguard Worker out[i] = (short) (((short) (a[i] + b[i])) >> 1); 85*795d594fSAndroid Build Coastguard Worker } 86*795d594fSAndroid Build Coastguard Worker } 87*795d594fSAndroid Build Coastguard Worker 88*795d594fSAndroid Build Coastguard Worker // This loop is not vectorized: mismatched packed type size. 89*795d594fSAndroid Build Coastguard Worker // 90*795d594fSAndroid Build Coastguard Worker /// CHECK-START-{ARM,ARM64}: void HaddOther.test_no_hadd_sum_cast_ints(int[], int[], int[]) loop_optimization (after) 91*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecLoad 92*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecHalvingAdd test_no_hadd_sum_cast_ints(int[] a, int[] b, int[] out)93*795d594fSAndroid Build Coastguard Worker private static void test_no_hadd_sum_cast_ints(int[] a, int[] b, int[] out) { 94*795d594fSAndroid Build Coastguard Worker int min_length = Math.min(out.length, Math.min(a.length, b.length)); 95*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < min_length; i++) { 96*795d594fSAndroid Build Coastguard Worker out[i] = (short) ((short) (a[i] + b[i]) >> 1); 97*795d594fSAndroid Build Coastguard Worker } 98*795d594fSAndroid Build Coastguard Worker } 99*795d594fSAndroid Build Coastguard Worker 100*795d594fSAndroid Build Coastguard Worker // Should be an add, followed by a halving add. 101*795d594fSAndroid Build Coastguard Worker // 102*795d594fSAndroid Build Coastguard Worker /// CHECK-START-ARM: void HaddOther.test_no_hadd_sum_cast_plus_const(short[], short[], short[]) loop_optimization (after) 103*795d594fSAndroid Build Coastguard Worker /// CHECK: VecAdd 104*795d594fSAndroid Build Coastguard Worker /// CHECK: VecHalvingAdd 105*795d594fSAndroid Build Coastguard Worker // 106*795d594fSAndroid Build Coastguard Worker /// CHECK-START-ARM64: void HaddOther.test_no_hadd_sum_cast_plus_const(short[], short[], short[]) loop_optimization (after) 107*795d594fSAndroid Build Coastguard Worker /// CHECK-IF: hasIsaFeature("sve") and os.environ.get('ART_FORCE_TRY_PREDICATED_SIMD') == 'true' 108*795d594fSAndroid Build Coastguard Worker // 109*795d594fSAndroid Build Coastguard Worker // HalvingAdd idiom is not supported for SVE. 110*795d594fSAndroid Build Coastguard Worker /// CHECK-NOT: VecHalvingAdd 111*795d594fSAndroid Build Coastguard Worker // 112*795d594fSAndroid Build Coastguard Worker /// CHECK-ELSE: 113*795d594fSAndroid Build Coastguard Worker // 114*795d594fSAndroid Build Coastguard Worker /// CHECK: VecAdd 115*795d594fSAndroid Build Coastguard Worker /// CHECK: VecHalvingAdd 116*795d594fSAndroid Build Coastguard Worker // 117*795d594fSAndroid Build Coastguard Worker /// CHECK-FI: test_no_hadd_sum_cast_plus_const(short[] a, short[] b, short[] out)118*795d594fSAndroid Build Coastguard Worker private static void test_no_hadd_sum_cast_plus_const(short[] a, short[] b, short[] out) { 119*795d594fSAndroid Build Coastguard Worker int min_length = Math.min(out.length, Math.min(a.length, b.length)); 120*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < min_length; i++) { 121*795d594fSAndroid Build Coastguard Worker out[i] = (short) (((short) (a[i] + b[i]) + 1) >> 1); 122*795d594fSAndroid Build Coastguard Worker } 123*795d594fSAndroid Build Coastguard Worker } 124*795d594fSAndroid Build Coastguard Worker main()125*795d594fSAndroid Build Coastguard Worker public static void main() { 126*795d594fSAndroid Build Coastguard Worker short[] sA = new short[M]; 127*795d594fSAndroid Build Coastguard Worker short[] sB = new short[M]; 128*795d594fSAndroid Build Coastguard Worker short[] sOut = new short[M]; 129*795d594fSAndroid Build Coastguard Worker int[] iA = new int[M]; 130*795d594fSAndroid Build Coastguard Worker int[] iB = new int[M]; 131*795d594fSAndroid Build Coastguard Worker int[] iOut = new int[M]; 132*795d594fSAndroid Build Coastguard Worker 133*795d594fSAndroid Build Coastguard Worker // Some interesting values. 134*795d594fSAndroid Build Coastguard Worker short[] interesting = { 135*795d594fSAndroid Build Coastguard Worker (short) 0x0000, 136*795d594fSAndroid Build Coastguard Worker (short) 0x0001, 137*795d594fSAndroid Build Coastguard Worker (short) 0x0002, 138*795d594fSAndroid Build Coastguard Worker (short) 0x1234, 139*795d594fSAndroid Build Coastguard Worker (short) 0x8000, 140*795d594fSAndroid Build Coastguard Worker (short) 0x8001, 141*795d594fSAndroid Build Coastguard Worker (short) 0x7fff, 142*795d594fSAndroid Build Coastguard Worker (short) 0xffff 143*795d594fSAndroid Build Coastguard Worker }; 144*795d594fSAndroid Build Coastguard Worker // Initialize cross-values to test all cases, and also 145*795d594fSAndroid Build Coastguard Worker // set up some extra values to exercise the cleanup loop. 146*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 147*795d594fSAndroid Build Coastguard Worker sA[i] = (short) i; 148*795d594fSAndroid Build Coastguard Worker sB[i] = interesting[i & 7]; 149*795d594fSAndroid Build Coastguard Worker iA[i] = i; 150*795d594fSAndroid Build Coastguard Worker iB[i] = interesting[i & 7]; 151*795d594fSAndroid Build Coastguard Worker } 152*795d594fSAndroid Build Coastguard Worker 153*795d594fSAndroid Build Coastguard Worker test_no_hadd_short2short(sA, sOut); 154*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 155*795d594fSAndroid Build Coastguard Worker short e = (short) (sA[i] >> 1); 156*795d594fSAndroid Build Coastguard Worker expectEquals(e, sOut[i]); 157*795d594fSAndroid Build Coastguard Worker } 158*795d594fSAndroid Build Coastguard Worker test_no_hadd_short2short_logical(sA, sOut); 159*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 160*795d594fSAndroid Build Coastguard Worker short e = (short) (sA[i] >>> 1); 161*795d594fSAndroid Build Coastguard Worker expectEquals(e, sOut[i]); 162*795d594fSAndroid Build Coastguard Worker } 163*795d594fSAndroid Build Coastguard Worker test_no_hadd_int2short(iA, sOut); 164*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 165*795d594fSAndroid Build Coastguard Worker short e = (short) (iA[i] >> 1); 166*795d594fSAndroid Build Coastguard Worker expectEquals(e, sOut[i]); 167*795d594fSAndroid Build Coastguard Worker } 168*795d594fSAndroid Build Coastguard Worker test_no_hadd_int2int(iA, iOut); 169*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 170*795d594fSAndroid Build Coastguard Worker int e = iA[i] >> 1; 171*795d594fSAndroid Build Coastguard Worker expectEquals(e, iOut[i]); 172*795d594fSAndroid Build Coastguard Worker } 173*795d594fSAndroid Build Coastguard Worker test_no_hadd_sum_cast(sA, sB, sOut); 174*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 175*795d594fSAndroid Build Coastguard Worker short e = (short) (((short) (sA[i] + sB[i])) >> 1); 176*795d594fSAndroid Build Coastguard Worker expectEquals(e, sOut[i]); 177*795d594fSAndroid Build Coastguard Worker } 178*795d594fSAndroid Build Coastguard Worker test_no_hadd_sum_cast_ints(iA, iB, iOut); 179*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 180*795d594fSAndroid Build Coastguard Worker int e = (short) ((short) (iA[i] + iB[i]) >> 1); 181*795d594fSAndroid Build Coastguard Worker expectEquals(e, iOut[i]); 182*795d594fSAndroid Build Coastguard Worker } 183*795d594fSAndroid Build Coastguard Worker test_no_hadd_sum_cast_plus_const(sA, sB, sOut); 184*795d594fSAndroid Build Coastguard Worker for (int i = 0; i < M; i++) { 185*795d594fSAndroid Build Coastguard Worker short e = (short) (((short) (sA[i] + sB[i]) + 1) >> 1); 186*795d594fSAndroid Build Coastguard Worker expectEquals(e, sOut[i]); 187*795d594fSAndroid Build Coastguard Worker } 188*795d594fSAndroid Build Coastguard Worker 189*795d594fSAndroid Build Coastguard Worker System.out.println("HaddOther passed"); 190*795d594fSAndroid Build Coastguard Worker } 191*795d594fSAndroid Build Coastguard Worker expectEquals(int expected, int result)192*795d594fSAndroid Build Coastguard Worker private static void expectEquals(int expected, int result) { 193*795d594fSAndroid Build Coastguard Worker if (expected != result) { 194*795d594fSAndroid Build Coastguard Worker throw new Error("Expected: " + expected + ", found: " + result); 195*795d594fSAndroid Build Coastguard Worker } 196*795d594fSAndroid Build Coastguard Worker } 197*795d594fSAndroid Build Coastguard Worker } 198