add llvm patches

vchuravy · vchuravy · commit c581ef42e4e7 · 2019-12-24T07:52:44.000-05:00
diff --git a/deps/llvm.mk b/deps/llvm.mk
@@ -462,6 +462,8 @@ $(eval $(call LLVM_PATCH,llvm-8.0-D63688-wasm-isLocal)) # remove for 9.0
 $(eval $(call LLVM_PATCH,llvm-8.0-D55758-tablegen-cond)) # remove for 9.0
 $(eval $(call LLVM_PATCH,llvm-8.0-D59389-refactor-wmma)) # remove for 9.0
 $(eval $(call LLVM_PATCH,llvm-8.0-D59393-mma-ptx63-fix)) # remove for 9.0
+$(eval $(call LLVM_PATCH,llvm-8.0-D66657-codegen-degenerate)) # remove for 10.0
+$(eval $(call LLVM_PATCH,llvm-8.0-D71495-vectorize-freduce)) # remove for 10.0
 endif # LLVM_VER 8.0
 
 ifeq ($(LLVM_VER_SHORT),9.0)
@@ -476,6 +478,8 @@ $(eval $(call LLVM_PATCH,llvm8-WASM-addrspaces)) # WebAssembly
 $(eval $(call LLVM_PATCH,llvm-exegesis-mingw)) # mingw build
 $(eval $(call LLVM_PATCH,llvm-test-plugin-mingw)) # mingw build
 $(eval $(call LLVM_PATCH,llvm7-revert-D44485))
+$(eval $(call LLVM_PATCH,llvm-8.0-D66657-codegen-degenerate)) # remove for 10.0
+$(eval $(call LLVM_PATCH,llvm-8.0-D71495-vectorize-freduce)) # remove for 10.0
 endif # LLVM_VER 9.0
 
 
diff --git a/deps/patches/llvm-8.0-D66657-codegen-degenerate.patch b/deps/patches/llvm-8.0-D66657-codegen-degenerate.patch
@@ -0,0 +1,65 @@
+From 4c7e1defbddafcfcfe1211b041d43a36114a8f48 Mon Sep 17 00:00:00 2001
+From: Valentin Churavy <v.churavy@gmail.com>
+Date: Sat, 14 Dec 2019 10:33:30 -0500
+Subject: [PATCH 2/2] [CodegenPrepare] Guard against degenerate branches
+
+Summary:
+Guard against a potential crash observed in https://github.com/JuliaLang/julia/issues/32994#issuecomment-524249628
+If two branches are collapsed we can encounter a degenerate conditional branch `TBB==FBB`.
+The subsequent code assumes that they differ, so we skip such branches.
+
+Reviewers: ributzka, spatel
+
+Subscribers: loladiro, dexonsmith, hiraditya, llvm-commits
+
+Tags: #llvm
+
+Differential Revision: https://reviews.llvm.org/D66657
+---
+ llvm/lib/CodeGen/CodeGenPrepare.cpp            |  4 ++++
+ .../CodeGen/X86/codegen-prepare-collapse.ll    | 18 ++++++++++++++++++
+ 2 files changed, 22 insertions(+)
+ create mode 100644 llvm/test/CodeGen/X86/codegen-prepare-collapse.ll
+
+diff --git a/lib/CodeGen/CodeGenPrepare.cpp b/lib/CodeGen/CodeGenPrepare.cpp
+index c35f8666fa3..3647641c594 100644
+--- a/lib/CodeGen/CodeGenPrepare.cpp
++++ b/lib/CodeGen/CodeGenPrepare.cpp
+@@ -6929,6 +6929,10 @@ bool CodeGenPrepare::splitBranchCondition(Function &F) {
+     if (Br1->getMetadata(LLVMContext::MD_unpredictable))
+       continue;
+ 
++    // The merging of mostly empty BBs can cause a degenerate branch.
++    if (TBB == FBB)
++      continue;
++
+     unsigned Opc;
+     Value *Cond1, *Cond2;
+     if (match(LogicOp, m_And(m_OneUse(m_Value(Cond1)),
+diff --git a/test/CodeGen/X86/codegen-prepare-collapse.ll b/test/CodeGen/X86/codegen-prepare-collapse.ll
+new file mode 100644
+index 00000000000..18e3ef7afbd
+--- /dev/null
++++ b/test/CodeGen/X86/codegen-prepare-collapse.ll
+@@ -0,0 +1,18 @@
++; RUN: llc -fast-isel=true -O1 -mtriple=x86_64-unkown-linux-gnu -start-before=codegenprepare -stop-after=codegenprepare -o - < %s | FileCheck %s
++
++; CHECK-LABEL: @foo
++define void @foo() {
++top:
++; CHECK: br label %L34
++  br label %L34
++
++L34:                                              ; preds = %L34, %L34, %top
++  %.sroa.075.0 = phi i64 [ undef, %top ], [ undef, %L34 ], [ undef, %L34 ]
++  %0 = icmp sgt i8 undef, -1
++  %cond5896 = icmp eq i8 0, 2
++  %cond58 = and i1 %cond5896, %0
++; During codegenprepare such degenerate branches can occur and should not
++; lead to crashes.
++; CHECK: br label %L34
++  br i1 %cond58, label %L34, label %L34
++}
+-- 
+2.24.1
+
diff --git a/deps/patches/llvm-8.0-D71495-vectorize-freduce.patch b/deps/patches/llvm-8.0-D71495-vectorize-freduce.patch
@@ -0,0 +1,94 @@
+From 7c30e23f115ae285b497ef11af0153703111dff2 Mon Sep 17 00:00:00 2001
+From: Valentin Churavy <v.churavy@gmail.com>
+Date: Sun, 22 Dec 2019 14:25:50 -0500
+Subject: [PATCH 1/2] [SelectionDAG] Copy FP flags when visiting a binary
+ instruction.
+
+Summary:
+We noticed in Julia that the sequence below no longer turned into
+a sequence of FMA instructions in LLVM 7+, but it did in LLVM 6.
+
+```
+    %29 = fmul contract <4 x double> %wide.load, %wide.load16
+    %30 = fmul contract <4 x double> %wide.load13, %wide.load17
+    %31 = fmul contract <4 x double> %wide.load14, %wide.load18
+    %32 = fmul contract <4 x double> %wide.load15, %wide.load19
+    %33 = fadd fast <4 x double> %vec.phi, %29
+    %34 = fadd fast <4 x double> %vec.phi10, %30
+    %35 = fadd fast <4 x double> %vec.phi11, %31
+    %36 = fadd fast <4 x double> %vec.phi12, %32
+```
+
+Unlike Clang, Julia doesn't set the `unsafe-fp-math=true` function
+attribute, but rather emits more local instruction flags.
+
+This partially undoes https://reviews.llvm.org/D46854 and if required I can try to minimize the test further.
+
+Reviewers: spatel, mcberg2017
+
+Reviewed By: spatel
+
+Subscribers: chriselrod, merge_guards_bot, hiraditya, llvm-commits
+
+Tags: #llvm
+
+Differential Revision: https://reviews.llvm.org/D71495
+---
+ .../SelectionDAG/SelectionDAGBuilder.cpp      |  7 +++++
+ llvm/test/CodeGen/X86/fmf-reduction.ll        | 26 +++++++++++++++++++
+ 2 files changed, 33 insertions(+)
+ create mode 100644 llvm/test/CodeGen/X86/fmf-reduction.ll
+
+diff --git a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+index bfeb3d1bc2b..e6362c19691 100644
+--- a/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
++++ b/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+@@ -2833,6 +2833,13 @@ void SelectionDAGBuilder::visitBinary(const User &I, unsigned Opcode) {
+   if (isVectorReductionOp(&I)) {
+     Flags.setVectorReduction(true);
+     LLVM_DEBUG(dbgs() << "Detected a reduction operation:" << I << "\n");
++
++    // If no flags are set we will propagate the incoming flags; if any flags
++    // are set, we will intersect them with the incoming flags, so we need to
++    // copy the FMF flags here.
++    if (auto *FPOp = dyn_cast<FPMathOperator>(&I)) {
++      Flags.copyFMF(*FPOp);
++    }
+   }
+ 
+   SDValue Op1 = getValue(I.getOperand(0));
+diff --git a/test/CodeGen/X86/fmf-reduction.ll b/test/CodeGen/X86/fmf-reduction.ll
+new file mode 100644
+index 00000000000..1d669d2a924
+--- /dev/null
++++ b/test/CodeGen/X86/fmf-reduction.ll
+@@ -0,0 +1,26 @@
++; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
++; RUN: llc < %s -mtriple=x86_64-- -mattr=fma | FileCheck %s
++
++; Propagation of IR FMF should not drop flags when adding the DAG reduction flag.
++; This should include an FMA instruction, not separate FMUL/FADD.
++
++define double @julia_dotf(<4 x double> %x, <4 x double> %y, <4 x double> %z, i1 %t3) {
++; CHECK-LABEL: julia_dotf:
++; CHECK:       # %bb.0:
++; CHECK-NEXT:    vfmadd213pd {{.*#+}} ymm0 = (ymm1 * ymm0) + ymm2
++; CHECK-NEXT:    vextractf128 $1, %ymm0, %xmm1
++; CHECK-NEXT:    vaddpd %xmm1, %xmm0, %xmm0
++; CHECK-NEXT:    vpermilpd {{.*#+}} xmm1 = xmm0[1,0]
++; CHECK-NEXT:    vaddsd %xmm1, %xmm0, %xmm0
++; CHECK-NEXT:    vzeroupper
++; CHECK-NEXT:    retq
++  %t1 = fmul contract <4 x double> %x, %y
++  %t2 = fadd fast <4 x double> %z, %t1
++  %rdx.shuf = shufflevector <4 x double> %t2, <4 x double> undef, <4 x i32> <i32 2, i32 3, i32 undef, i32 undef>
++  %bin.rdx22 = fadd fast <4 x double> %t2, %rdx.shuf
++  %rdx.shuf23 = shufflevector <4 x double> %bin.rdx22, <4 x double> undef, <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef>
++  %bin.rdx24 = fadd fast <4 x double> %bin.rdx22, %rdx.shuf23
++  %t4 = extractelement <4 x double> %bin.rdx24, i32 0
++  ret double %t4
++}
++
+-- 
+2.24.1
+