summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--contrib/llvm/patches/patch-31-llvm-r222292-aarch64-no-neon.diff61
1 files changed, 61 insertions, 0 deletions
diff --git a/contrib/llvm/patches/patch-31-llvm-r222292-aarch64-no-neon.diff b/contrib/llvm/patches/patch-31-llvm-r222292-aarch64-no-neon.diff
new file mode 100644
index 0000000..c1120bb
--- /dev/null
+++ b/contrib/llvm/patches/patch-31-llvm-r222292-aarch64-no-neon.diff
@@ -0,0 +1,61 @@
+Pull in r222292 from upstream llvm trunk (by Weiming Zhao):
+
+ [Aarch64] Customer lowering of CTPOP to SIMD should check for NEON
+ availability
+
+This ensures llvm's AArch64 backend does not emit floating point
+instructions if they are disabled.
+
+Introduced here: http://svnweb.freebsd.org/changeset/base/276786
+
+Index: lib/Target/AArch64/AArch64ISelLowering.cpp
+===================================================================
+--- lib/Target/AArch64/AArch64ISelLowering.cpp
++++ lib/Target/AArch64/AArch64ISelLowering.cpp
+@@ -3062,6 +3062,9 @@ SDValue AArch64TargetLowering::LowerCTPOP(SDValue
+ AttributeSet::FunctionIndex, Attribute::NoImplicitFloat))
+ return SDValue();
+
++ if (!Subtarget->hasNEON())
++ return SDValue();
++
+ // While there is no integer popcount instruction, it can
+ // be more efficiently lowered to the following sequence that uses
+ // AdvSIMD registers/instructions as long as the copies to/from
+Index: test/CodeGen/AArch64/arm64-popcnt.ll
+===================================================================
+--- test/CodeGen/AArch64/arm64-popcnt.ll
++++ test/CodeGen/AArch64/arm64-popcnt.ll
+@@ -1,4 +1,5 @@
+ ; RUN: llc < %s -march=arm64 -aarch64-neon-syntax=apple | FileCheck %s
++; RUN: llc < %s -march=aarch64 -mattr -neon -aarch64-neon-syntax=apple | FileCheck -check-prefix=CHECK-NONEON %s
+
+ define i32 @cnt32_advsimd(i32 %x) nounwind readnone {
+ %cnt = tail call i32 @llvm.ctpop.i32(i32 %x)
+@@ -8,6 +9,13 @@ define i32 @cnt32_advsimd(i32 %x) nounwind readnon
+ ; CHECK: uaddlv.8b h0, v0
+ ; CHECK: fmov w0, s0
+ ; CHECK: ret
++; CHECK-NONEON-LABEL: cnt32_advsimd
++; CHECK-NONEON-NOT: 8b
++; CHECK-NONEON: and w{{[0-9]+}}, w{{[0-9]+}}, #0x55555555
++; CHECK-NONEON: and w{{[0-9]+}}, w{{[0-9]+}}, #0x33333333
++; CHECK-NONEON: and w{{[0-9]+}}, w{{[0-9]+}}, #0xf0f0f0f
++; CHECK-NONEON: mul
++
+ }
+
+ define i64 @cnt64_advsimd(i64 %x) nounwind readnone {
+@@ -18,6 +26,12 @@ define i64 @cnt64_advsimd(i64 %x) nounwind readnon
+ ; CHECK: uaddlv.8b h0, v0
+ ; CHECK: fmov w0, s0
+ ; CHECK: ret
++; CHECK-NONEON-LABEL: cnt64_advsimd
++; CHECK-NONEON-NOT: 8b
++; CHECK-NONEON: and x{{[0-9]+}}, x{{[0-9]+}}, #0x5555555555555555
++; CHECK-NONEON: and x{{[0-9]+}}, x{{[0-9]+}}, #0x3333333333333333
++; CHECK-NONEON: and x{{[0-9]+}}, x{{[0-9]+}}, #0xf0f0f0f0f0f0f0f
++; CHECK-NONEON: mul
+ }
+
+ ; Do not use AdvSIMD when -mno-implicit-float is specified.
OpenPOWER on IntegriCloud