summary | refs | log | tree | commit | diff
path: root/test/CodeGen/NVPTX/fma.ll
diff options
context:
space:
mode:
author: Justin Holewinski <jholewinski@nvidia.com> 2014-07-17 18:10:09 +0000
committer: Justin Holewinski <jholewinski@nvidia.com> 2014-07-17 18:10:09 +0000
commit: 11ae250ec9d1adbd15fec36ccaf6e01a0fb1e518 (patch)
tree: 4eeed8daf9971fb6defbc9fbddb6f33186eb47f1 /test/CodeGen/NVPTX/fma.ll
parent: 15865afcf777b2323d56e02a8d62e295fd21b7ed (diff)
[NVPTX] Improve handling of FP fusion
We now consider the FPOpFusion flag when determining whether to fuse ops. We also explicitly emit add.rn when fusion is disabled to prevent ptxas from fusing the operations on its own.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213287 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'test/CodeGen/NVPTX/fma.ll')
-rw-r--r-- test/CodeGen/NVPTX/fma.ll 2
1 file changed, 1 insertion, 1 deletion
diff --git a/test/CodeGen/NVPTX/fma.ll b/test/CodeGen/NVPTX/fma.ll
index 7716f77ef37..14b5c45b87d 100644
--- a/test/CodeGen/NVPTX/fma.ll
+++ b/test/CodeGen/NVPTX/fma.ll
@@ -1,4 +1,4 @@
-; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
+; RUN: llc < %s -march=nvptx -mcpu=sm_20 -fp-contract=fast | FileCheck %s
define ptx_device float @t1_f32(float %x, float %y, float %z) {
; CHECK: fma.rn.f32 %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}};