From f51a22e815a7494cbe1aba25d275015a70b5c31d Mon Sep 17 00:00:00 2001
From: Justin Holewinski
Date: Fri, 28 Jun 2013 17:58:13 +0000
Subject: [NVPTX] Add (1.0 / sqrt(x)) => rsqrt(x) generation when allowable by FP flags

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@185178 91177308-0d34-0410-b5e6-96231b3b80d8
---
 test/CodeGen/NVPTX/rsqrt.ll | 13 +++++++++++++
 1 file changed, 13 insertions(+)
 create mode 100644 test/CodeGen/NVPTX/rsqrt.ll

(limited to 'test/CodeGen/NVPTX')

Reviewer notes (commentary only; not part of the commit message or the diff):
  * This view is limited to test/CodeGen/NVPTX, so only the new regression
    test is shown here; the code generation change named in the subject is
    not visible in this patch excerpt.
  * The test pipes the output of llc (run with -march=nvptx -mcpu=sm_20
    -nvptx-prec-divf32=1 -nvptx-prec-sqrtf32=0) into FileCheck.
  * @foo divides the constant 1.0 by the result of @llvm.nvvm.sqrt.f(%a);
    the single CHECK line requires "rsqrt.approx.f32" to appear in the
    llc output.
  * NOTE(review): the two -nvptx-prec-* options are presumably the "FP flags"
    the subject refers to; confirm their exact meaning against the backend
    sources before changing their values.
  * NOTE(review): line 13 of the new file is whitespace-only and the file has
    no trailing newline (see the marker after the hunk). The exact whitespace
    on that line could not be recovered from this export; verify against the
    repository before re-applying.

diff --git a/test/CodeGen/NVPTX/rsqrt.ll b/test/CodeGen/NVPTX/rsqrt.ll
new file mode 100644
index 0000000..d49eebe
--- /dev/null
+++ b/test/CodeGen/NVPTX/rsqrt.ll
@@ -0,0 +1,13 @@
+; RUN: llc < %s -march=nvptx -mcpu=sm_20 -nvptx-prec-divf32=1 -nvptx-prec-sqrtf32=0 | FileCheck %s
+
+target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64"
+
+declare float @llvm.nvvm.sqrt.f(float)
+
+define float @foo(float %a) {
+; CHECK: rsqrt.approx.f32
+  %val = tail call float @llvm.nvvm.sqrt.f(float %a)
+  %ret = fdiv float 1.0, %val
+  ret float %ret
+}
+ 
\ No newline at end of file
-- 
cgit v1.1