diff options
author | Justin Holewinski <jholewinski@nvidia.com> | 2014-07-17 18:10:09 +0000 |
---|---|---|
committer | Justin Holewinski <jholewinski@nvidia.com> | 2014-07-17 18:10:09 +0000 |
commit | 11ae250ec9d1adbd15fec36ccaf6e01a0fb1e518 (patch) | |
tree | 4eeed8daf9971fb6defbc9fbddb6f33186eb47f1 /test/CodeGen/NVPTX/fma.ll | |
parent | 15865afcf777b2323d56e02a8d62e295fd21b7ed (diff) |
[NVPTX] Improve handling of FP fusion
We now consider the FPOpFusion flag when determining whether
to fuse ops. We also explicitly emit add.rn when fusion is
disabled to prevent ptxas from fusing the operations on its
own.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@213287 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'test/CodeGen/NVPTX/fma.ll')
-rw-r--r-- | test/CodeGen/NVPTX/fma.ll | 2 |
1 files changed, 1 insertions, 1 deletions
diff --git a/test/CodeGen/NVPTX/fma.ll b/test/CodeGen/NVPTX/fma.ll
index 7716f77ef37..14b5c45b87d 100644
--- a/test/CodeGen/NVPTX/fma.ll
+++ b/test/CodeGen/NVPTX/fma.ll
@@ -1,4 +1,4 @@
-; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
+; RUN: llc < %s -march=nvptx -mcpu=sm_20 -fp-contract=fast | FileCheck %s
 
 define ptx_device float @t1_f32(float %x, float %y, float %z) {
 ; CHECK: fma.rn.f32 %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}};