From c689f67424dc0216fff82989d7ec168c9d252748 Mon Sep 17 00:00:00 2001 From: Artem Belevich Date: Sat, 1 Dec 2018 00:21:52 +0000 Subject: [PATCH] [NVPTX] Add lowering of i128 numbers as struct fields Addition to D34555 - override VTs computation with ComputePTXValueVTs for struct fields. Author: Denys Zariaiev Differential Revision: https://reviews.llvm.org/D55144 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@348057 91177308-0d34-0410-b5e6-96231b3b80d8 --- lib/Target/NVPTX/NVPTXISelLowering.cpp | 12 ++++++++++++ test/CodeGen/NVPTX/i128-struct.ll | 13 +++++++++++++ 2 files changed, 25 insertions(+) create mode 100644 test/CodeGen/NVPTX/i128-struct.ll diff --git a/lib/Target/NVPTX/NVPTXISelLowering.cpp b/lib/Target/NVPTX/NVPTXISelLowering.cpp index c352b9b9c9d..eceb4fc6d88 100644 --- a/lib/Target/NVPTX/NVPTXISelLowering.cpp +++ b/lib/Target/NVPTX/NVPTXISelLowering.cpp @@ -180,6 +180,18 @@ static void ComputePTXValueVTs(const TargetLowering &TLI, const DataLayout &DL, return; } + // Given a struct type, recursively traverse the elements with custom ComputePTXValueVTs. 
+ if (StructType *STy = dyn_cast<StructType>(Ty)) { + auto const *SL = DL.getStructLayout(STy); + auto ElementNum = 0; + for(auto *EI : STy->elements()) { + ComputePTXValueVTs(TLI, DL, EI, ValueVTs, Offsets, + StartingOffset + SL->getElementOffset(ElementNum)); + ++ElementNum; + } + return; + } + ComputeValueVTs(TLI, DL, Ty, TempVTs, &TempOffsets, StartingOffset); for (unsigned i = 0, e = TempVTs.size(); i != e; ++i) { EVT VT = TempVTs[i]; diff --git a/test/CodeGen/NVPTX/i128-struct.ll b/test/CodeGen/NVPTX/i128-struct.ll new file mode 100644 index 00000000000..c619be40f36 --- /dev/null +++ b/test/CodeGen/NVPTX/i128-struct.ll @@ -0,0 +1,13 @@ +; RUN: llc < %s -O0 -march=nvptx64 -mcpu=sm_20 | FileCheck %s + +; CHECK-LABEL: .visible .func (.param .align 16 .b8 func_retval0[32]) foo( +define { i128, i128 } @foo(i64 %a, i32 %b) { + %1 = sext i64 %a to i128 + %2 = sext i32 %b to i128 + %3 = insertvalue { i128, i128 } undef, i128 %1, 0 + %4 = insertvalue { i128, i128 } %3, i128 %2, 1 + + ; CHECK: st.param.v2.b64 [func_retval0+0], {%[[REG1:rd[0-9]+]], %[[REG2:rd[0-9]+]]}; + ; CHECK: st.param.v2.b64 [func_retval0+16], {%[[REG3:rd[0-9]+]], %[[REG4:rd[0-9]+]]}; + ret { i128, i128 } %4 +} -- 2.11.0