From: Justin Holewinski Date: Mon, 27 Jun 2016 20:22:22 +0000 (+0000) Subject: Only emit extension for zeroext/signext arguments if type is < 32 bits X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=76e2771df0365b053c249949da93e2f783a2d813;p=llvm Only emit extension for zeroext/signext arguments if type is < 32 bits Reviewers: jingyue, jlebar Subscribers: jholewinski Differential Revision: http://reviews.llvm.org/D21756 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@273922 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/lib/Target/NVPTX/NVPTXISelLowering.cpp b/lib/Target/NVPTX/NVPTXISelLowering.cpp index cdac1ac4695..7d457aff46c 100644 --- a/lib/Target/NVPTX/NVPTXISelLowering.cpp +++ b/lib/Target/NVPTX/NVPTXISelLowering.cpp @@ -1311,9 +1311,9 @@ SDValue NVPTXTargetLowering::LowerCall(TargetLowering::CallLoweringInfo &CLI, InFlag }; unsigned opcode = NVPTXISD::StoreParam; - if (Outs[OIdx].Flags.isZExt()) + if (Outs[OIdx].Flags.isZExt() && VT.getSizeInBits() < 32) opcode = NVPTXISD::StoreParamU32; - else if (Outs[OIdx].Flags.isSExt()) + else if (Outs[OIdx].Flags.isSExt() && VT.getSizeInBits() < 32) opcode = NVPTXISD::StoreParamS32; Chain = DAG.getMemIntrinsicNode(opcode, dl, CopyParamVTs, CopyParamOps, VT, MachinePointerInfo()); diff --git a/test/CodeGen/NVPTX/zeroext-32bit.ll b/test/CodeGen/NVPTX/zeroext-32bit.ll new file mode 100644 index 00000000000..c2f0ec4b144 --- /dev/null +++ b/test/CodeGen/NVPTX/zeroext-32bit.ll @@ -0,0 +1,26 @@ +; RUN: llc < %s -march=nvptx64 -mcpu=sm_30 | FileCheck %s + +; The zeroext attribute below should be silently ignored because +; we can pass a 32-bit integer across a function call without +; needing to extend it. 
+
+target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64"
+target triple = "nvptx64-unknown-cuda"
+
+; CHECK-LABEL: .visible .func zeroext_test
+; CHECK-NOT: cvt.u32.u16
+define void @zeroext_test() {
+  tail call void @call1(i32 zeroext 0) ; i32 argument is already 32 bits wide: no zero-extending cvt expected
+  ret void
+}
+
+declare void @call1(i32 zeroext)
+
+; CHECK-LABEL: .visible .func signext_test
+; CHECK-NOT: cvt.s32.s16
+define void @signext_test() {
+  tail call void @call2(i32 signext 0) ; uses signext so the sign-extension path is the one under test
+  ret void
+}
+
+declare void @call2(i32 signext)