From b9e7253e391e90a1d0a91a2baa00254625a0d328 Mon Sep 17 00:00:00 2001 From: Haicheng Wu Date: Mon, 26 Mar 2018 16:47:37 +0000 Subject: [PATCH] [SLP] Add a test case. NFC. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@328546 91177308-0d34-0410-b5e6-96231b3b80d8 --- test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll | 38 ++++++++++++++++++++++ 1 file changed, 38 insertions(+) create mode 100644 test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll diff --git a/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll b/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll new file mode 100644 index 00000000000..8f50b8bedec --- /dev/null +++ b/test/Transforms/SLPVectorizer/AArch64/ext-trunc.ll @@ -0,0 +1,38 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py +; RUN: opt -S -slp-vectorizer -mtriple=aarch64--linux-gnu -instcombine < %s | FileCheck %s + +target datalayout = "e-m:e-i32:64-i128:128-n32:64-S128" + +declare void @foo(i64, i64, i64, i64) + +define void @test(<4 x i16> %a, <4 x i16> %b, i64* %p) { +; Make sure types of sub and its sources are not extended. +; CHECK-LABEL: @test( +; CHECK-NEXT: entry: +; CHECK-NEXT: [[Z0:%.*]] = zext <4 x i16> [[A:%.*]] to <4 x i64> +; CHECK-NEXT: [[Z1:%.*]] = zext <4 x i16> [[B:%.*]] to <4 x i64> +; CHECK-NEXT: [[SUB0:%.*]] = sub nsw <4 x i64> [[Z0]], [[Z1]] +; +entry: + %z0 = zext <4 x i16> %a to <4 x i32> + %z1 = zext <4 x i16> %b to <4 x i32> + %sub0 = sub <4 x i32> %z0, %z1 + %e0 = extractelement <4 x i32> %sub0, i32 0 + %s0 = sext i32 %e0 to i64 + %gep0 = getelementptr inbounds i64, i64* %p, i64 %s0 + %load0 = load i64, i64* %gep0 + %e1 = extractelement <4 x i32> %sub0, i32 1 + %s1 = sext i32 %e1 to i64 + %gep1 = getelementptr inbounds i64, i64* %p, i64 %s1 + %load1 = load i64, i64* %gep1 + %e2 = extractelement <4 x i32> %sub0, i32 2 + %s2 = sext i32 %e2 to i64 + %gep2 = getelementptr inbounds i64, i64* %p, i64 %s2 + %load2 = load i64, i64* %gep2 + %e3 = extractelement <4 x i32> %sub0, i32 3 + %s3 = sext i32 %e3 to i64 + %gep3 = getelementptr inbounds i64, i64* %p, i64 %s3 + %load3 = load i64, i64* %gep3 + call void @foo(i64 %load0, i64 %load1, i64 %load2, i64 %load3) + ret void +} -- 2.11.0