summaryrefslogtreecommitdiffstats
path: root/test/CodeGenOpenCL/shifts.cl
diff options
context:
space:
mode:
Diffstat (limited to 'test/CodeGenOpenCL/shifts.cl')
-rw-r--r--test/CodeGenOpenCL/shifts.cl57
1 files changed, 57 insertions, 0 deletions
diff --git a/test/CodeGenOpenCL/shifts.cl b/test/CodeGenOpenCL/shifts.cl
new file mode 100644
index 0000000..015a777
--- /dev/null
+++ b/test/CodeGenOpenCL/shifts.cl
@@ -0,0 +1,57 @@
+// RUN: %clang_cc1 -x cl -O1 -emit-llvm %s -o - -triple x86_64-linux-gnu | FileCheck %s
+// OpenCL masks every shift amount to its low log2(N) bits (i.e. takes it modulo N), where N is the bit width of the shifted (element) type, before evaluating the shift.
+// Test this both for variables and constants evaluated in the front-end.
+
+
+//CHECK: @positiveShift32
+int positiveShift32(int a,int b) { // 32-bit left shift: one variable shift amount and one constant, out-of-range shift amount
+ //CHECK: [[M32:%.+]] = and i32 %b, 31
+ //CHECK-NEXT: [[C32:%.+]] = shl i32 %a, [[M32]]
+ int c = a<<b; // variable amount: the directives above expect b to be masked with 31 before the shl
+ int d = ((int)1)<<33; // constant amount: 33 & 31 == 1, so the expected folded value is 1 << 1 == 2
+ //CHECK-NEXT: [[E32:%.+]] = add nsw i32 [[C32]], 2
+ int e = c + d; // the constant 2 in the expected add is the folded value of d
+ //CHECK-NEXT: ret i32 [[E32]]
+ return e;
+}
+
+//CHECK: @positiveShift64
+long positiveShift64(long a,long b) { // 64-bit right shift: one variable shift amount and one constant, out-of-range shift amount
+ //CHECK: [[M64:%.+]] = and i64 %b, 63
+ //CHECK-NEXT: [[C64:%.+]] = ashr i64 %a, [[M64]]
+ long c = a>>b; // variable amount: the directives above expect b to be masked with 63 before the ashr
+ long d = ((long)8)>>65; // constant amount: 65 & 63 == 1, so the expected folded value is 8 >> 1 == 4
+ //CHECK-NEXT: [[E64:%.+]] = add nsw i64 [[C64]], 4
+ long e = c + d; // the constant 4 in the expected add is the folded value of d
+ //CHECK-NEXT: ret i64 [[E64]]
+ return e;
+}
+
+typedef __attribute__((ext_vector_type(4))) int int4; // four-element int vector type used by the vector shift tests in this file
+
+//CHECK: @vectorVectorTest
+int4 vectorVectorTest(int4 a,int4 b) { // vector << vector: shift amounts are expected to be masked per element
+ //CHECK: [[VM:%.+]] = and <4 x i32> %b, <i32 31, i32 31, i32 31, i32 31>
+ //CHECK-NEXT: [[VC:%.+]] = shl <4 x i32> %a, [[VM]]
+ int4 c = a << b; // variable amounts: the directives above expect each lane of b to be masked with 31
+ //CHECK-NEXT: [[VF:%.+]] = add <4 x i32> [[VC]], <i32 2, i32 4, i32 16, i32 8>
+ int4 d = {1, 1, 1, 1};
+ int4 e = {33, 34, -28, -29}; // low five bits per lane are 1, 2, 4, 3 (negative values included)
+ int4 f = c + (d << e); // constant part is expected to fold to {1<<1, 1<<2, 1<<4, 1<<3} == {2, 4, 16, 8}
+ //CHECK-NEXT: ret <4 x i32> [[VF]]
+ return f;
+}
+
+//CHECK: @vectorScalarTest
+int4 vectorScalarTest(int4 a,int b) { // vector << scalar: the scalar amount is expected to be splatted, then masked per element
+ //CHECK: [[SP0:%.+]] = insertelement <4 x i32> undef, i32 %b, i32 0
+ //CHECK: [[SP1:%.+]] = shufflevector <4 x i32> [[SP0]], <4 x i32> undef, <4 x i32> zeroinitializer
+ //CHECK: [[VSM:%.+]] = and <4 x i32> [[SP1]], <i32 31, i32 31, i32 31, i32 31>
+ //CHECK-NEXT: [[VSC:%.+]] = shl <4 x i32> %a, [[VSM]]
+ int4 c = a << b; // variable amount: expected IR broadcasts b to all four lanes before masking with 31
+ //CHECK-NEXT: [[VSF:%.+]] = add <4 x i32> [[VSC]], <i32 4, i32 4, i32 4, i32 4>
+ int4 d = {1, 1, 1, 1};
+ int4 f = c + (d << 34); // constant amount: 34 & 31 == 2, so every lane is expected to fold to 1 << 2 == 4
+ //CHECK-NEXT: ret <4 x i32> [[VSF]]
+ return f;
+}
OpenPOWER on IntegriCloud