| /* |
| * Copyright (C) 2017 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| /** |
| * Functional tests for SIMD vectorization. |
| */ |
| public class Main { |
| |
| static byte[] a; |
| |
| // |
| // Arithmetic operations. |
| // |
| |
| /// CHECK-START: void Main.add(int) loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM: void Main.add(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecAdd loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM64: void Main.add(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecAdd loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-MIPS64: void Main.add(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecAdd loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| static void add(int x) { |
| for (int i = 0; i < 128; i++) |
| a[i] += x; |
| } |
| |
| /// CHECK-START: void Main.sub(int) loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM: void Main.sub(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecSub loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM64: void Main.sub(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecSub loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-MIPS64: void Main.sub(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecSub loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| static void sub(int x) { |
| for (int i = 0; i < 128; i++) |
| a[i] -= x; |
| } |
| |
| /// CHECK-START: void Main.mul(int) loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM: void Main.mul(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecMul loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM64: void Main.mul(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecMul loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-MIPS64: void Main.mul(int) loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecMul loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| static void mul(int x) { |
| for (int i = 0; i < 128; i++) |
| a[i] *= x; |
| } |
| |
| /// CHECK-START: void Main.div(int) loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START: void Main.div(int) loop_optimization (after) |
| // |
| // Not supported on any architecture. |
| // |
| static void div(int x) { |
| for (int i = 0; i < 128; i++) |
| a[i] /= x; |
| } |
| |
| /// CHECK-START: void Main.neg() loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM: void Main.neg() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecNeg loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM64: void Main.neg() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecNeg loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-MIPS64: void Main.neg() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecNeg loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| static void neg() { |
| for (int i = 0; i < 128; i++) |
| a[i] = (byte) -a[i]; |
| } |
| |
| /// CHECK-START: void Main.not() loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM: void Main.not() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecNot loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM64: void Main.not() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecNot loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-MIPS64: void Main.not() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecNot loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| static void not() { |
| for (int i = 0; i < 128; i++) |
| a[i] = (byte) ~a[i]; |
| } |
| |
| /// CHECK-START: void Main.shl4() loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM: void Main.shl4() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecShl loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM64: void Main.shl4() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecShl loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-MIPS64: void Main.shl4() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecShl loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| static void shl4() { |
| for (int i = 0; i < 128; i++) |
| a[i] <<= 4; |
| } |
| |
| /// CHECK-START: void Main.sar2() loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM: void Main.sar2() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecShr loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-ARM64: void Main.sar2() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecShr loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| // |
| /// CHECK-START-MIPS64: void Main.sar2() loop_optimization (after) |
| /// CHECK-DAG: VecLoad loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: VecShr loop:<<Loop>> outer_loop:none |
| /// CHECK-DAG: VecStore loop:<<Loop>> outer_loop:none |
| static void sar2() { |
| for (int i = 0; i < 128; i++) |
| a[i] >>= 2; |
| } |
| |
| /// CHECK-START: void Main.shr2() loop_optimization (before) |
| /// CHECK-DAG: ArrayGet loop:<<Loop:B\d+>> outer_loop:none |
| /// CHECK-DAG: ArraySet loop:<<Loop>> outer_loop:none |
| // |
| // TODO: would need signess flip. |
| /// CHECK-START: void Main.shr2() loop_optimization (after) |
| /// CHECK-NOT: VecUShr |
| static void shr2() { |
| for (int i = 0; i < 128; i++) |
| a[i] >>>= 2; |
| } |
| |
| // |
| // Shift sanity. |
| // |
| |
| static void sar31() { |
| for (int i = 0; i < 128; i++) |
| a[i] >>= 31; |
| } |
| |
| static void shr31() { |
| for (int i = 0; i < 128; i++) |
| a[i] >>>= 31; |
| } |
| |
| static void shr32() { |
| for (int i = 0; i < 128; i++) |
| a[i] >>>= 32; // 0, since & 31 |
| } |
| |
| static void shr33() { |
| for (int i = 0; i < 128; i++) |
| a[i] >>>= 33; // 1, since & 31 |
| } |
| |
| static void shl9() { |
| for (int i = 0; i < 128; i++) |
| a[i] <<= 9; // yields all-zeros |
| } |
| |
| // |
| // Loop bounds. |
| // |
| |
| static void bounds() { |
| for (int i = 1; i < 127; i++) |
| a[i] += 11; |
| } |
| |
| // |
| // Test Driver. |
| // |
| |
| public static void main(String[] args) { |
| // Set up. |
| a = new byte[128]; |
| for (int i = 0; i < 128; i++) { |
| a[i] = (byte) i; |
| } |
| // Arithmetic operations. |
| add(2); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte)(i + 2), a[i], "add"); |
| } |
| sub(2); |
| for (int i = 0; i < 128; i++) { |
| expectEquals(i, a[i], "sub"); |
| } |
| mul(2); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte)(i + i), a[i], "mul"); |
| } |
| div(2); |
| for (int i = 0; i < 128; i++) { |
| expectEquals(((byte)(i + i)) >> 1, a[i], "div"); |
| a[i] = (byte) i; // undo arithmetic wrap-around effects |
| } |
| neg(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals(-i, a[i], "neg"); |
| } |
| // Loop bounds. |
| bounds(); |
| expectEquals(0, a[0], "bounds0"); |
| for (int i = 1; i < 127; i++) { |
| expectEquals(11 - i, a[i], "bounds"); |
| } |
| expectEquals(-127, a[127], "bounds127"); |
| // Shifts. |
| for (int i = 0; i < 128; i++) { |
| a[i] = (byte) 0xff; |
| } |
| shl4(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0xf0, a[i], "shl4"); |
| } |
| sar2(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0xfc, a[i], "sar2"); |
| } |
| shr2(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0xff, a[i], "shr2"); // sic! |
| } |
| sar31(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0xff, a[i], "sar31"); |
| } |
| shr31(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals(0x01, a[i], "shr31"); |
| a[i] = (byte) 0x12; // reset |
| } |
| shr32(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0x12, a[i], "shr32"); |
| } |
| shr33(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0x09, a[i], "shr33"); |
| } |
| shl9(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0x00, a[i], "shl9"); |
| a[i] = (byte) 0xf0; // reset |
| } |
| not(); |
| for (int i = 0; i < 128; i++) { |
| expectEquals((byte) 0x0f, a[i], "not"); |
| } |
| // Done. |
| System.out.println("passed"); |
| } |
| |
| private static void expectEquals(int expected, int result, String action) { |
| if (expected != result) { |
| throw new Error("Expected: " + expected + ", found: " + result + " for " + action); |
| } |
| } |
| } |