2018-12-05 04:14:57 +08:00
|
|
|
; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64le-unknown-unknown \
|
2018-07-13 04:18:57 +08:00
|
|
|
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
|
|
|
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s | FileCheck %s
|
2018-12-05 04:14:57 +08:00
|
|
|
; RUN: llc -relocation-model=pic -mcpu=pwr9 -mtriple=powerpc64-unknown-unknown \
|
2018-07-13 04:18:57 +08:00
|
|
|
; RUN: -enable-ppc-quad-precision -verify-machineinstrs \
|
|
|
|
; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s \
|
2018-07-05 14:51:38 +08:00
|
|
|
; RUN: | FileCheck -check-prefix=CHECK-BE %s
|
|
|
|
|
|
|
|
; Testing homogeneous aggregates.
|
|
|
|
|
|
|
|
%struct.With9fp128params = type { fp128, fp128, fp128, fp128, fp128, fp128,
|
|
|
|
fp128, fp128, fp128 }
|
|
|
|
|
|
|
|
@a1 = common local_unnamed_addr global [3 x fp128] zeroinitializer, align 16
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readonly
|
|
|
|
define fp128 @testArray_01(fp128* nocapture readonly %sa) {
|
|
|
|
; CHECK-LABEL: testArray_01:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: lxv v2, 32(r3)
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testArray_01:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: lxv v2, 32(r3)
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%arrayidx = getelementptr inbounds fp128, fp128* %sa, i64 2
|
|
|
|
%0 = load fp128, fp128* %arrayidx, align 16
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readonly
|
|
|
|
define fp128 @testArray_02() {
|
|
|
|
; CHECK-LABEL: testArray_02:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: addis r3, r2, .LC0@toc@ha
|
|
|
|
; CHECK-NEXT: ld r3, .LC0@toc@l(r3)
|
|
|
|
; CHECK-NEXT: lxv v2, 32(r3)
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testArray_02:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: lxv v2, 32(r3)
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%0 = load fp128, fp128* getelementptr inbounds ([3 x fp128], [3 x fp128]* @a1,
|
|
|
|
i64 0, i64 2), align 16
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testStruct_01(fp128 inreg returned %a.coerce) {
|
|
|
|
; CHECK-LABEL: testStruct_01:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testStruct_01:
|
|
|
|
; CHECK-BE: # %bb.0: # %entry
|
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
ret fp128 %a.coerce
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testStruct_02([8 x fp128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testStruct_02:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: vmr v2, v9
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testStruct_02:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: vmr v2, v9
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.7.extract = extractvalue [8 x fp128] %a.coerce, 7
|
|
|
|
ret fp128 %a.coerce.fca.7.extract
|
|
|
|
}
|
|
|
|
|
|
|
|
; Since we can only pass a max of 8 float128 value in VSX registers, ensure we
|
|
|
|
; store to stack if passing more.
|
|
|
|
; Function Attrs: norecurse nounwind readonly
|
|
|
|
define fp128 @testStruct_03(%struct.With9fp128params* byval nocapture readonly
|
|
|
|
align 16 %a) {
|
|
|
|
; CHECK-LABEL: testStruct_03:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2019-07-02 11:28:52 +08:00
|
|
|
; CHECK: lxv v2, 128(r1)
|
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later.
Summary:
A number of optimizations are inhibited by single-use TokenFactors not
being merged into the TokenFactor using it. This makes we consider if
we can do the merge immediately.
Most tests changes here are due to the change in visitation causing
minor reorderings and associated reassociation of paired memory
operations.
CodeGen tests with non-reordering changes:
X86/aligned-variadic.ll -- memory-based add folded into stored leaq
value.
X86/constant-combiners.ll -- Optimizes out overlap between stores.
X86/pr40631_deadstore_elision -- folds constant byte store into
preceding quad word constant store.
Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet
Reviewed By: courbet
Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59260
llvm-svn: 356068
2019-03-14 01:07:09 +08:00
|
|
|
; CHECK-DAG: std r10, 88(r1)
|
|
|
|
; CHECK-DAG: std r9, 80(r1)
|
|
|
|
; CHECK-DAG: std r8, 72(r1)
|
|
|
|
; CHECK-DAG: std r7, 64(r1)
|
|
|
|
; CHECK-DAG: std r6, 56(r1)
|
|
|
|
; CHECK-DAG: std r5, 48(r1)
|
|
|
|
; CHECK-DAG: std r4, 40(r1)
|
|
|
|
; CHECK-DAG: std r3, 32(r1)
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testStruct_03:
|
|
|
|
; CHECK-BE: # %bb.0: # %entry
|
2019-07-02 11:28:52 +08:00
|
|
|
; CHECK-BE: lxv v2, 144(r1)
|
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later.
Summary:
A number of optimizations are inhibited by single-use TokenFactors not
being merged into the TokenFactor using it. This makes we consider if
we can do the merge immediately.
Most tests changes here are due to the change in visitation causing
minor reorderings and associated reassociation of paired memory
operations.
CodeGen tests with non-reordering changes:
X86/aligned-variadic.ll -- memory-based add folded into stored leaq
value.
X86/constant-combiners.ll -- Optimizes out overlap between stores.
X86/pr40631_deadstore_elision -- folds constant byte store into
preceding quad word constant store.
Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet
Reviewed By: courbet
Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59260
llvm-svn: 356068
2019-03-14 01:07:09 +08:00
|
|
|
; CHECK-BE-DAG: std r10, 104(r1)
|
|
|
|
; CHECK-BE-DAG: std r9, 96(r1)
|
|
|
|
; CHECK-BE-DAG: std r8, 88(r1)
|
|
|
|
; CHECK-BE-DAG: std r7, 80(r1)
|
|
|
|
; CHECK-BE-DAG: std r6, 72(r1)
|
|
|
|
; CHECK-BE-DAG: std r5, 64(r1)
|
|
|
|
; CHECK-BE-DAG: std r4, 56(r1)
|
|
|
|
; CHECK-BE-DAG: std r3, 48(r1)
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a7 = getelementptr inbounds %struct.With9fp128params,
|
|
|
|
%struct.With9fp128params* %a, i64 0, i32 6
|
|
|
|
%0 = load fp128, fp128* %a7, align 16
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testStruct_04([8 x fp128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testStruct_04:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: vmr v2, v5
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testStruct_04:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: vmr v2, v5
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.3.extract = extractvalue [8 x fp128] %a.coerce, 3
|
|
|
|
ret fp128 %a.coerce.fca.3.extract
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testHUnion_01([1 x fp128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testHUnion_01:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testHUnion_01:
|
|
|
|
; CHECK-BE: # %bb.0: # %entry
|
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.0.extract = extractvalue [1 x fp128] %a.coerce, 0
|
|
|
|
ret fp128 %a.coerce.fca.0.extract
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testHUnion_02([3 x fp128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testHUnion_02:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testHUnion_02:
|
|
|
|
; CHECK-BE: # %bb.0: # %entry
|
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.0.extract = extractvalue [3 x fp128] %a.coerce, 0
|
|
|
|
ret fp128 %a.coerce.fca.0.extract
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testHUnion_03([3 x fp128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testHUnion_03:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: vmr v2, v3
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testHUnion_03:
|
|
|
|
; CHECK-BE: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE-NEXT: vmr v2, v3
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.1.extract = extractvalue [3 x fp128] %a.coerce, 1
|
|
|
|
ret fp128 %a.coerce.fca.1.extract
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testHUnion_04([3 x fp128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testHUnion_04:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: vmr v2, v4
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testHUnion_04:
|
|
|
|
; CHECK-BE: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE-NEXT: vmr v2, v4
|
2018-07-05 14:51:38 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.2.extract = extractvalue [3 x fp128] %a.coerce, 2
|
|
|
|
ret fp128 %a.coerce.fca.2.extract
|
|
|
|
}
|
|
|
|
|
|
|
|
; Testing mixed member aggregates.
|
2018-07-05 14:29:28 +08:00
|
|
|
|
|
|
|
%struct.MixedC = type { i32, %struct.SA, float, [12 x i8] }
|
|
|
|
%struct.SA = type { double, fp128, <4 x float> }
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testMixedAggregate([3 x i128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testMixedAggregate:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: mtvsrdd v2, r8, r7
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testMixedAggregate:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: mtvsrdd v2, r8, r7
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.2.extract = extractvalue [3 x i128] %a.coerce, 2
|
|
|
|
%0 = bitcast i128 %a.coerce.fca.2.extract to fp128
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testMixedAggregate_02([4 x i128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testMixedAggregate_02:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: mtvsrdd v2, r6, r5
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testMixedAggregate_02:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: mtvsrdd v2, r6, r5
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.1.extract = extractvalue [4 x i128] %a.coerce, 1
|
|
|
|
%0 = bitcast i128 %a.coerce.fca.1.extract to fp128
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testMixedAggregate_03([4 x i128] %sa.coerce) {
|
|
|
|
; CHECK-LABEL: testMixedAggregate_03:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2019-01-03 13:04:18 +08:00
|
|
|
; CHECK: mtvsrwa v2, r3
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK: xscvsdqp v2, v2
|
2019-01-03 13:04:18 +08:00
|
|
|
; CHECK: mtvsrdd v3, r6, r5
|
|
|
|
; CHECK: xsaddqp v2, v3, v2
|
|
|
|
; CHECK: mtvsrd v[[REG1:[0-9]+]], r10
|
|
|
|
; CHECK: xscvsdqp v[[REG:[0-9]+]], v[[REG1]]
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK: xsaddqp v2, v2, v[[REG]]
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%sa.coerce.fca.0.extract = extractvalue [4 x i128] %sa.coerce, 0
|
|
|
|
%sa.sroa.0.0.extract.trunc = trunc i128 %sa.coerce.fca.0.extract to i32
|
|
|
|
%sa.coerce.fca.1.extract = extractvalue [4 x i128] %sa.coerce, 1
|
|
|
|
%sa.coerce.fca.3.extract = extractvalue [4 x i128] %sa.coerce, 3
|
|
|
|
%sa.sroa.6.48.extract.shift = lshr i128 %sa.coerce.fca.3.extract, 64
|
|
|
|
%sa.sroa.6.48.extract.trunc = trunc i128 %sa.sroa.6.48.extract.shift to i64
|
|
|
|
%conv = sitofp i32 %sa.sroa.0.0.extract.trunc to fp128
|
|
|
|
%0 = bitcast i128 %sa.coerce.fca.1.extract to fp128
|
|
|
|
%add = fadd fp128 %0, %conv
|
|
|
|
%conv2 = sitofp i64 %sa.sroa.6.48.extract.trunc to fp128
|
|
|
|
%add3 = fadd fp128 %add, %conv2
|
|
|
|
ret fp128 %add3
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readonly
|
|
|
|
define fp128 @testNestedAggregate(%struct.MixedC* byval nocapture readonly align 16 %a) {
|
|
|
|
; CHECK-LABEL: testNestedAggregate:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later.
Summary:
A number of optimizations are inhibited by single-use TokenFactors not
being merged into the TokenFactor using it. This makes we consider if
we can do the merge immediately.
Most tests changes here are due to the change in visitation causing
minor reorderings and associated reassociation of paired memory
operations.
CodeGen tests with non-reordering changes:
X86/aligned-variadic.ll -- memory-based add folded into stored leaq
value.
X86/constant-combiners.ll -- Optimizes out overlap between stores.
X86/pr40631_deadstore_elision -- folds constant byte store into
preceding quad word constant store.
Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet
Reviewed By: courbet
Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59260
llvm-svn: 356068
2019-03-14 01:07:09 +08:00
|
|
|
; CHECK-DAG: std r8, 72(r1)
|
|
|
|
; CHECK-DAG: std r7, 64(r1)
|
2019-07-02 11:28:52 +08:00
|
|
|
; CHECK: lxv v2, 64(r1)
|
|
|
|
; CHECK-DAG: std r10, 88(r1)
|
|
|
|
; CHECK-DAG: std r9, 80(r1)
|
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later.
Summary:
A number of optimizations are inhibited by single-use TokenFactors not
being merged into the TokenFactor using it. This makes we consider if
we can do the merge immediately.
Most tests changes here are due to the change in visitation causing
minor reorderings and associated reassociation of paired memory
operations.
CodeGen tests with non-reordering changes:
X86/aligned-variadic.ll -- memory-based add folded into stored leaq
value.
X86/constant-combiners.ll -- Optimizes out overlap between stores.
X86/pr40631_deadstore_elision -- folds constant byte store into
preceding quad word constant store.
Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet
Reviewed By: courbet
Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59260
llvm-svn: 356068
2019-03-14 01:07:09 +08:00
|
|
|
; CHECK-DAG: std r6, 56(r1)
|
|
|
|
; CHECK-DAG: std r5, 48(r1)
|
|
|
|
; CHECK-DAG: std r4, 40(r1)
|
|
|
|
; CHECK-DAG: std r3, 32(r1)
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testNestedAggregate:
|
|
|
|
; CHECK-BE: # %bb.0: # %entry
|
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later.
Summary:
A number of optimizations are inhibited by single-use TokenFactors not
being merged into the TokenFactor using it. This makes we consider if
we can do the merge immediately.
Most tests changes here are due to the change in visitation causing
minor reorderings and associated reassociation of paired memory
operations.
CodeGen tests with non-reordering changes:
X86/aligned-variadic.ll -- memory-based add folded into stored leaq
value.
X86/constant-combiners.ll -- Optimizes out overlap between stores.
X86/pr40631_deadstore_elision -- folds constant byte store into
preceding quad word constant store.
Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet
Reviewed By: courbet
Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59260
llvm-svn: 356068
2019-03-14 01:07:09 +08:00
|
|
|
; CHECK-BE-DAG: std r8, 88(r1)
|
|
|
|
; CHECK-BE-DAG: std r7, 80(r1)
|
2019-07-02 11:28:52 +08:00
|
|
|
; CHECK-BE-NEXT: lxv v2, 80(r1)
|
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later.
Summary:
A number of optimizations are inhibited by single-use TokenFactors not
being merged into the TokenFactor using it. This makes we consider if
we can do the merge immediately.
Most tests changes here are due to the change in visitation causing
minor reorderings and associated reassociation of paired memory
operations.
CodeGen tests with non-reordering changes:
X86/aligned-variadic.ll -- memory-based add folded into stored leaq
value.
X86/constant-combiners.ll -- Optimizes out overlap between stores.
X86/pr40631_deadstore_elision -- folds constant byte store into
preceding quad word constant store.
Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet
Reviewed By: courbet
Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59260
llvm-svn: 356068
2019-03-14 01:07:09 +08:00
|
|
|
; CHECK-BE-DAG: std r10, 104(r1)
|
|
|
|
; CHECK-BE-DAG: std r9, 96(r1)
|
|
|
|
; CHECK-BE-DAG: std r6, 72(r1)
|
|
|
|
; CHECK-BE-DAG: std r5, 64(r1)
|
|
|
|
; CHECK-BE-DAG: std r4, 56(r1)
|
|
|
|
; CHECK-BE-DAG: std r3, 48(r1)
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%c = getelementptr inbounds %struct.MixedC, %struct.MixedC* %a, i64 0, i32 1, i32 1
|
|
|
|
%0 = load fp128, fp128* %c, align 16
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testUnion_01([1 x i128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testUnion_01:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: mtvsrdd v2, r4, r3
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testUnion_01:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: mtvsrdd v2, r4, r3
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0
|
|
|
|
%0 = bitcast i128 %a.coerce.fca.0.extract to fp128
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testUnion_02([1 x i128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testUnion_02:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: mtvsrdd v2, r4, r3
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testUnion_02:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: mtvsrdd v2, r4, r3
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.0.extract = extractvalue [1 x i128] %a.coerce, 0
|
|
|
|
%0 = bitcast i128 %a.coerce.fca.0.extract to fp128
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
|
|
define fp128 @testUnion_03([4 x i128] %a.coerce) {
|
|
|
|
; CHECK-LABEL: testUnion_03:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: mtvsrdd v2, r8, r7
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
|
|
|
|
; CHECK-BE-LABEL: testUnion_03:
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-BE: mtvsrdd v2, r8, r7
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-BE-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%a.coerce.fca.2.extract = extractvalue [4 x i128] %a.coerce, 2
|
|
|
|
%0 = bitcast i128 %a.coerce.fca.2.extract to fp128
|
|
|
|
ret fp128 %0
|
|
|
|
}
|
|
|
|
|
|
|
|
; Function Attrs: nounwind
|
|
|
|
define fp128 @sum_float128(i32 signext %count, ...) {
|
|
|
|
; CHECK-LABEL: sum_float128:
|
|
|
|
; CHECK: # %bb.0: # %entry
|
[DAGCombiner] If a TokenFactor would be merged into its user, consider the user later.
Summary:
A number of optimizations are inhibited by single-use TokenFactors not
being merged into the TokenFactor using it. This makes we consider if
we can do the merge immediately.
Most tests changes here are due to the change in visitation causing
minor reorderings and associated reassociation of paired memory
operations.
CodeGen tests with non-reordering changes:
X86/aligned-variadic.ll -- memory-based add folded into stored leaq
value.
X86/constant-combiners.ll -- Optimizes out overlap between stores.
X86/pr40631_deadstore_elision -- folds constant byte store into
preceding quad word constant store.
Reviewers: RKSimon, craig.topper, spatel, efriedma, courbet
Reviewed By: courbet
Subscribers: dylanmckay, sdardis, nemanjai, jvesely, nhaehnle, javed.absar, eraman, hiraditya, kbarton, jrtc27, atanasyan, jsji, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59260
llvm-svn: 356068
2019-03-14 01:07:09 +08:00
|
|
|
; CHECK-DAG: std r10, 88(r1)
|
|
|
|
; CHECK-DAG: std r9, 80(r1)
|
|
|
|
; CHECK-DAG: std r8, 72(r1)
|
|
|
|
; CHECK-DAG: std r7, 64(r1)
|
|
|
|
; CHECK-DAG: std r6, 56(r1)
|
|
|
|
; CHECK-DAG: std r4, 40(r1)
|
|
|
|
; CHECK-DAG: cmpwi cr0, r3, 1
|
|
|
|
; CHECK-DAG: std r5, 48(r1)
|
|
|
|
; CHECK-DAG: addis [[REG:r[0-9]+]], r2, .LCPI17_0@toc@ha
|
|
|
|
; CHECK-DAG: addi [[REG1:r[0-9]+]], [[REG]], .LCPI17_0@toc@l
|
|
|
|
; CHECK-DAG: lxvx v2, 0, [[REG1]]
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: bltlr cr0
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: # %bb.1: # %if.end
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: addi r3, r1, 40
|
|
|
|
; CHECK-NEXT: lxvx v3, 0, r3
|
|
|
|
; CHECK-NEXT: xsaddqp v2, v3, v2
|
2019-01-03 13:04:18 +08:00
|
|
|
; CHECK-NEXT: addi [[REG2:r[0-9]+]], r1, 72
|
|
|
|
; CHECK-NEXT: std [[REG2]], -8(r1)
|
2018-07-13 04:18:57 +08:00
|
|
|
; CHECK-NEXT: lxv v3, 16(r3)
|
|
|
|
; CHECK-NEXT: xsaddqp v2, v2, v3
|
2018-07-05 14:29:28 +08:00
|
|
|
; CHECK-NEXT: blr
|
|
|
|
entry:
|
|
|
|
%ap = alloca i8*, align 8
|
|
|
|
%0 = bitcast i8** %ap to i8*
|
|
|
|
call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull %0) #2
|
|
|
|
%cmp = icmp slt i32 %count, 1
|
|
|
|
br i1 %cmp, label %cleanup, label %if.end
|
|
|
|
|
|
|
|
if.end: ; preds = %entry
|
|
|
|
call void @llvm.va_start(i8* nonnull %0)
|
|
|
|
%argp.cur = load i8*, i8** %ap, align 8
|
|
|
|
%argp.next = getelementptr inbounds i8, i8* %argp.cur, i64 16
|
|
|
|
%1 = bitcast i8* %argp.cur to fp128*
|
|
|
|
%2 = load fp128, fp128* %1, align 8
|
|
|
|
%add = fadd fp128 %2, 0xL00000000000000000000000000000000
|
|
|
|
%argp.next3 = getelementptr inbounds i8, i8* %argp.cur, i64 32
|
|
|
|
store i8* %argp.next3, i8** %ap, align 8
|
|
|
|
%3 = bitcast i8* %argp.next to fp128*
|
|
|
|
%4 = load fp128, fp128* %3, align 8
|
|
|
|
%add4 = fadd fp128 %add, %4
|
|
|
|
call void @llvm.va_end(i8* nonnull %0)
|
|
|
|
br label %cleanup
|
|
|
|
|
|
|
|
cleanup: ; preds = %entry, %if.end
|
|
|
|
%retval.0 = phi fp128 [ %add4, %if.end ], [ 0xL00000000000000000000000000000000, %entry ]
|
|
|
|
call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull %0) #2
|
|
|
|
ret fp128 %retval.0
|
|
|
|
}
|
|
|
|
|
|
|
|
declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #1
|
|
|
|
declare void @llvm.va_start(i8*) #2
|
|
|
|
declare void @llvm.va_end(i8*) #2
|
|
|
|
declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #1
|