From: Pirama Arumuga Nainar Date: Fri, 8 Jan 2016 17:46:05 +0000 (+0000) Subject: Do not ASSERTZEXT for i16 result of bitcast from f16 operand X-Git-Url: http://demsky.eecs.uci.edu/git/?a=commitdiff_plain;h=0de8d7820f74ed70d2b737406be353e641d3e9f9;p=oota-llvm.git Do not ASSERTZEXT for i16 result of bitcast from f16 operand Summary: During legalization of i16, do not ASSERTZEXT the result of FP_TO_FP16. Directly return an FP_TO_FP16 node with return type as the promote-to-type of i16. This patch also removes an extraneous length check. This legalization should be valid even if integer and float types are of different lengths. This patch breaks a hard-float test for fp16 args. The test is changed to allow a vmov to zero-out the top bits, and also ensure that the return value is in an FP register. Reviewers: ab, jmolloy Subscribers: srhines, llvm-commits Differential Revision: http://reviews.llvm.org/D15438 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@257184 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp b/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp index cd114d668e2..74f80db6d01 100644 --- a/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp +++ b/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp @@ -262,12 +262,8 @@ SDValue DAGTypeLegalizer::PromoteIntRes_BITCAST(SDNode *N) { return DAG.getNode(ISD::ANY_EXTEND, dl, NOutVT, GetSoftenedFloat(InOp)); case TargetLowering::TypePromoteFloat: { // Convert the promoted float by hand. 
- if (NOutVT.bitsEq(NInVT)) { - SDValue PromotedOp = GetPromotedFloat(InOp); - SDValue Trunc = DAG.getNode(ISD::FP_TO_FP16, dl, NOutVT, PromotedOp); - return DAG.getNode(ISD::AssertZext, dl, NOutVT, Trunc, - DAG.getValueType(OutVT)); - } + SDValue PromotedOp = GetPromotedFloat(InOp); + return DAG.getNode(ISD::FP_TO_FP16, dl, NOutVT, PromotedOp); break; } case TargetLowering::TypeExpandInteger: diff --git a/test/CodeGen/ARM/fp16-args.ll b/test/CodeGen/ARM/fp16-args.ll index 31a20f85483..708fae7f9ff 100644 --- a/test/CodeGen/ARM/fp16-args.ll +++ b/test/CodeGen/ARM/fp16-args.ll @@ -32,9 +32,10 @@ entry: ; HARD: vcvtb.f32.f16 {{s[0-9]+}}, s1 ; HARD: vcvtb.f32.f16 {{s[0-9]+}}, s0 ; HARD: vadd.f32 {{s[0-9]+}}, {{s[0-9]+}}, {{s[0-9]+}} -; HARD: vcvtb.f16.f32 s0, {{s[0-9]+}} -; HARD-NOT: vmov -; HARD-NOT: uxth +; HARD: vcvtb.f16.f32 [[SREG:s[0-9]+]], {{s[0-9]+}} +; HARD-NEXT: vmov [[REG0:r[0-9]+]], [[SREG]] +; HARD-NEXT: uxth [[REG1:r[0-9]+]], [[REG0]] +; HARD-NEXT: vmov s0, [[REG1]] ; CHECK: bx lr } diff --git a/test/CodeGen/ARM/fp16-v3.ll b/test/CodeGen/ARM/fp16-v3.ll new file mode 100644 index 00000000000..6ed9c9d22c9 --- /dev/null +++ b/test/CodeGen/ARM/fp16-v3.ll @@ -0,0 +1,28 @@ +; RUN: llc -mattr=+fp16 < %s | FileCheck %s --check-prefix=CHECK + +target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64" +target triple = "armv7a--none-eabi" + +; CHECK-LABEL: test_vec3: +; CHECK: vcvtb.f32.f16 +; CHECK: vcvt.f32.s32 +; CHECK: vadd.f32 +; CHECK-NEXT: vcvtb.f16.f32 [[SREG:s[0-9]+]], {{.*}} +; CHECK-NEXT: vmov [[RREG1:r[0-9]+]], [[SREG]] +; CHECK-NEXT: uxth [[RREG2:r[0-9]+]], [[RREG1]] +; CHECK-NEXT: pkhbt [[RREG3:r[0-9]+]], [[RREG1]], [[RREG1]], lsl #16 +; CHECK-DAG: strh [[RREG1]], [r0, #4] +; CHECK-DAG: vmov [[DREG:d[0-9]+]], [[RREG3]], [[RREG2]] +; CHECK-DAG: vst1.32 {[[DREG]][0]}, [r0:32] +; CHECK-NEXT: bx lr +define void @test_vec3(<3 x half>* %arr, i32 %i) #0 { + %H = sitofp i32 %i to half + %S = fadd half %H, 0xH4A00 + %1 = insertelement <3 x half> 
undef, half %S, i32 0 + %2 = insertelement <3 x half> %1, half %S, i32 1 + %3 = insertelement <3 x half> %2, half %S, i32 2 + store <3 x half> %3, <3 x half>* %arr, align 8 + ret void +} + +attributes #0 = { nounwind }