2015-09-23 01:22:58 +08:00
|
|
|
; RUN: llc < %s -mtriple=armv7-apple-ios -verify-machineinstrs | FileCheck %s --check-prefix=CHECK --check-prefix CHECK-ARMV7
|
|
|
|
; RUN: llc < %s -mtriple=thumbv7-apple-ios -verify-machineinstrs | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-T2
|
2013-10-25 17:30:20 +08:00
|
|
|
; RUN: llc < %s -mtriple=thumbv6-apple-ios -verify-machineinstrs | FileCheck %s --check-prefix=CHECK-T1
|
2016-11-04 05:49:08 +08:00
|
|
|
; RUN: llc < %s -mtriple=thumbv6-apple-ios -verify-machineinstrs -mcpu=cortex-m0 | FileCheck %s --check-prefix=CHECK-T1-M0
|
2014-08-21 22:35:47 +08:00
|
|
|
; RUN: llc < %s -mtriple=thumbv7--none-eabi -thread-model single -verify-machineinstrs | FileCheck %s --check-prefix=CHECK-BAREMETAL
|
2011-05-28 07:54:00 +08:00
|
|
|
|
2014-10-15 06:12:14 +08:00
|
|
|
target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64"
|
|
|
|
|
2011-05-28 07:54:00 +08:00
|
|
|
define void @func(i32 %argc, i8** %argv) nounwind {
|
|
|
|
entry:
|
|
|
|
%argc.addr = alloca i32 ; <i32*> [#uses=1]
|
|
|
|
%argv.addr = alloca i8** ; <i8***> [#uses=1]
|
|
|
|
%val1 = alloca i32 ; <i32*> [#uses=2]
|
|
|
|
%val2 = alloca i32 ; <i32*> [#uses=15]
|
|
|
|
%andt = alloca i32 ; <i32*> [#uses=2]
|
|
|
|
%ort = alloca i32 ; <i32*> [#uses=2]
|
|
|
|
%xort = alloca i32 ; <i32*> [#uses=2]
|
|
|
|
%old = alloca i32 ; <i32*> [#uses=18]
|
|
|
|
%temp = alloca i32 ; <i32*> [#uses=2]
|
|
|
|
store i32 %argc, i32* %argc.addr
|
|
|
|
store i8** %argv, i8*** %argv.addr
|
|
|
|
store i32 0, i32* %val1
|
|
|
|
store i32 31, i32* %val2
|
|
|
|
store i32 3855, i32* %andt
|
|
|
|
store i32 3855, i32* %ort
|
|
|
|
store i32 3855, i32* %xort
|
|
|
|
store i32 4, i32* %temp
|
2015-02-28 05:17:42 +08:00
|
|
|
%tmp = load i32, i32* %temp
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: add
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_add_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_add_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: add
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%0 = atomicrmw add i32* %val1, i32 %tmp monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %0, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: sub
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_sub_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_sub_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: sub
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%1 = atomicrmw sub i32* %val2, i32 30 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %1, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: add
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_add_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_add_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: add
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%2 = atomicrmw add i32* %val2, i32 1 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %2, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: sub
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_sub_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_sub_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: sub
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%3 = atomicrmw sub i32* %val2, i32 1 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %3, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: and
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_and_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_and_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: and
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%4 = atomicrmw and i32* %andt, i32 4080 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %4, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: or
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_or_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_or_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: or
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%5 = atomicrmw or i32* %ort, i32 4080 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %5, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: eor
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_xor_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_xor_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: eor
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%6 = atomicrmw xor i32* %xort, i32 4080 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %6, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_min_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_min_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%7 = atomicrmw min i32* %val2, i32 16 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %7, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-12-21 11:04:10 +08:00
|
|
|
%neg = sub i32 0, 1
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_min_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_min_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%8 = atomicrmw min i32* %val2, i32 %neg monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %8, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_max_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_max_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%9 = atomicrmw max i32* %val2, i32 1 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %9, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: ldrex
|
[ARM] Lower lower saturate to 0 and lower saturate to -1 using bit-operations
Summary:
Expressions of the form x < 0 ? 0 : x; and x < -1 ? -1 : x can be lowered using bit-operations instead of branching or conditional moves
In Thumb mode this results in a two-instruction sequence, a shift followed by a bic or an orr, while in ARM/Thumb2 mode, which has a flexible second operand, the shift can be folded into a single bic/orr instruction. In most cases this results in smaller code and possibly fewer branches, and in no case is the code larger than before.
Patch by Martin Svanfeldt
Reviewers: fhahn, pbarrio, rogfer01
Reviewed By: pbarrio, rogfer01
Subscribers: chrib, yroux, eugenis, efriedma, rogfer01, aemerson, javed.absar, kristof.beyls, llvm-commits
Differential Revision: https://reviews.llvm.org/D42574
llvm-svn: 326333
2018-03-01 01:13:07 +08:00
|
|
|
; CHECK: bic
|
|
|
|
; CHECK-NOT: cmp
|
2011-05-28 07:54:00 +08:00
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_max_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_max_4
|
[ARM] Lower lower saturate to 0 and lower saturate to -1 using bit-operations
Summary:
Expressions of the form x < 0 ? 0 : x; and x < -1 ? -1 : x can be lowered using bit-operations instead of branching or conditional moves
In Thumb mode this results in a two-instruction sequence, a shift followed by a bic or an orr, while in ARM/Thumb2 mode, which has a flexible second operand, the shift can be folded into a single bic/orr instruction. In most cases this results in smaller code and possibly fewer branches, and in no case is the code larger than before.
Patch by Martin Svanfeldt
Reviewers: fhahn, pbarrio, rogfer01
Reviewed By: pbarrio, rogfer01
Subscribers: chrib, yroux, eugenis, efriedma, rogfer01, aemerson, javed.absar, kristof.beyls, llvm-commits
Differential Revision: https://reviews.llvm.org/D42574
llvm-svn: 326333
2018-03-01 01:13:07 +08:00
|
|
|
; CHECK-BAREMETAL: bic
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-09-27 04:27:49 +08:00
|
|
|
%10 = atomicrmw max i32* %val2, i32 0 monotonic
|
2011-05-28 07:54:00 +08:00
|
|
|
store i32 %10, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-12-21 11:04:10 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umin_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umin_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-21 11:04:10 +08:00
|
|
|
%11 = atomicrmw umin i32* %val2, i32 16 monotonic
|
|
|
|
store i32 %11, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-12-21 11:04:10 +08:00
|
|
|
%uneg = sub i32 0, 1
|
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umin_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umin_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-21 11:04:10 +08:00
|
|
|
%12 = atomicrmw umin i32* %val2, i32 %uneg monotonic
|
|
|
|
store i32 %12, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-12-21 11:04:10 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umax_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umax_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-21 11:04:10 +08:00
|
|
|
%13 = atomicrmw umax i32* %val2, i32 1 monotonic
|
|
|
|
store i32 %13, i32* %old
|
[DAG] Improve Aliasing of operations to static alloca
Re-recommitting after landing DAG extension-crash fix.
Recommitting after adding check to avoid miscomputing alias information
on addresses of the same base but different subindices.
Memory accesses offset from frame indices may alias, e.g., we
may merge write from function arguments passed on the stack when they
are contiguous. As a result, when checking aliasing, we consider the
underlying frame index's offset from the stack pointer.
Static allocs are realized as stack objects in SelectionDAG, but its
offset is not set until post-DAG causing DAGCombiner's alias check to
consider access to static allocas to frequently alias. Modify isAlias
to consider access between static allocas and access from other frame
objects to be considered aliasing.
Many test changes are included here. Most are fixes for tests which
indirectly relied on our aliasing ability and needed to be modified to
preserve their original intent.
The remaining tests have minor improvements due to relaxed
ordering. The exception is CodeGen/X86/2011-10-19-widen_vselect.ll
which has a minor degradation even though the pre-legalized DAG is
improved.
Reviewers: rnk, mkuper, jonpa, hfinkel, uweigand
Reviewed By: rnk
Subscribers: sdardis, nemanjai, javed.absar, llvm-commits
Differential Revision: https://reviews.llvm.org/D33345
llvm-svn: 308350
2017-07-19 04:06:24 +08:00
|
|
|
call void asm sideeffect "", "~{memory},~{dirflag},~{fpsr},~{flags}"()
|
2011-12-21 11:04:10 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umax_4
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umax_4
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-21 11:04:10 +08:00
|
|
|
%14 = atomicrmw umax i32* %val2, i32 0 monotonic
|
|
|
|
store i32 %14, i32* %old
|
|
|
|
|
|
|
|
ret void
|
2011-05-28 07:54:00 +08:00
|
|
|
}
|
2011-12-22 02:56:22 +08:00
|
|
|
|
[SelectionDAG] Compute known bits of CopyFromReg
Summary:
Teach SelectionDAG how to compute known bits of ISD::CopyFromReg if
the virtual reg used has one def only.
This can be particularly useful when calling isBaseWithConstantOffset()
with the ISD::CopyFromReg argument, as more optimizations may get enabled
in the result.
Also add a missing truncation on X86, found by testing of this patch.
Change-Id: Id1c9fceec862d118c54a5b53adf72ada5d6daefa
Reviewers: bogner, craig.topper, RKSimon
Reviewed By: RKSimon
Subscribers: lebedev.ri, nemanjai, jvesely, nhaehnle, javed.absar, jsji, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59535
llvm-svn: 357745
2019-04-05 15:44:09 +08:00
|
|
|
; func2: unsigned min/max atomicrmw operations on an i16 stack slot that is
; initialised from the %int_val argument. Four operations are issued in order:
; umin 16, umin %uneg, umax 1, umax 0; each result is stored to %old.
; Every operation is preceded by the patterns expected for it: an
; ldrex / cmp / strex sequence for the generic armv7/thumbv7 prefix, a call to
; the matching ___sync_fetch_and_u{min,max}_2 routine for the two thumbv6
; prefixes, and a cmp with no __sync reference for the bare-metal prefix.
define void @func2(i16 %int_val) nounwind {
|
2011-12-22 02:56:22 +08:00
|
|
|
entry:
|
|
|
|
%val = alloca i16
|
|
|
|
%old = alloca i16
|
[SelectionDAG] Compute known bits of CopyFromReg
Summary:
Teach SelectionDAG how to compute known bits of ISD::CopyFromReg if
the virtual reg used has one def only.
This can be particularly useful when calling isBaseWithConstantOffset()
with the ISD::CopyFromReg argument, as more optimizations may get enabled
in the result.
Also add a missing truncation on X86, found by testing of this patch.
Change-Id: Id1c9fceec862d118c54a5b53adf72ada5d6daefa
Reviewers: bogner, craig.topper, RKSimon
Reviewed By: RKSimon
Subscribers: lebedev.ri, nemanjai, jvesely, nhaehnle, javed.absar, jsji, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59535
llvm-svn: 357745
2019-04-05 15:44:09 +08:00
|
|
|
store i16 %int_val, i16* %val
|
2011-12-22 02:56:22 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umin_2
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umin_2
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-22 02:56:22 +08:00
|
|
|
%0 = atomicrmw umin i16* %val, i16 16 monotonic
|
|
|
|
store i16 %0, i16* %old
|
[SelectionDAG] Compute known bits of CopyFromReg
Summary:
Teach SelectionDAG how to compute known bits of ISD::CopyFromReg if
the virtual reg used has one def only.
This can be particularly useful when calling isBaseWithConstantOffset()
with the ISD::CopyFromReg argument, as more optimizations may get enabled
in the result.
Also add a missing truncation on X86, found by testing of this patch.
Change-Id: Id1c9fceec862d118c54a5b53adf72ada5d6daefa
Reviewers: bogner, craig.topper, RKSimon
Reviewed By: RKSimon
Subscribers: lebedev.ri, nemanjai, jvesely, nhaehnle, javed.absar, jsji, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59535
llvm-svn: 357745
2019-04-05 15:44:09 +08:00
|
|
|
%uneg = sub i16 0, 2
|
2011-12-22 02:56:22 +08:00
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umin_2
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umin_2
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-22 02:56:22 +08:00
|
|
|
%1 = atomicrmw umin i16* %val, i16 %uneg monotonic
|
|
|
|
store i16 %1, i16* %old
|
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umax_2
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umax_2
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-22 02:56:22 +08:00
|
|
|
%2 = atomicrmw umax i16* %val, i16 1 monotonic
|
|
|
|
store i16 %2, i16* %old
|
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umax_2
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umax_2
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-22 02:56:22 +08:00
|
|
|
%3 = atomicrmw umax i16* %val, i16 0 monotonic
|
|
|
|
store i16 %3, i16* %old
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; func3: the i8 counterpart of the unsigned min/max test. The stack slot %val
; is initialised to 31 and then updated by umin 16, umin %uneg, umax 1 and
; umax 0; each result is stored to %old.
; Expected patterns per operation: ldrex / cmp / strex for the generic
; armv7/thumbv7 prefix, a call to ___sync_fetch_and_u{min,max}_1 for the two
; thumbv6 prefixes, and a cmp with no __sync reference for the bare-metal
; prefix. Note that the patterns for the second umin appear before the
; definition of %uneg rather than directly before the atomicrmw.
define void @func3() nounwind {
|
|
|
|
entry:
|
|
|
|
%val = alloca i8
|
|
|
|
%old = alloca i8
|
|
|
|
store i8 31, i8* %val
|
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umin_1
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umin_1
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-22 02:56:22 +08:00
|
|
|
%0 = atomicrmw umin i8* %val, i8 16 monotonic
|
|
|
|
store i8 %0, i8* %old
|
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umin_1
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umin_1
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
[SelectionDAG] Compute known bits of CopyFromReg
Summary:
Teach SelectionDAG how to compute known bits of ISD::CopyFromReg if
the virtual reg used has one def only.
This can be particularly useful when calling isBaseWithConstantOffset()
with the ISD::CopyFromReg argument, as more optimizations may get enabled
in the result.
Also add a missing truncation on X86, found by testing of this patch.
Change-Id: Id1c9fceec862d118c54a5b53adf72ada5d6daefa
Reviewers: bogner, craig.topper, RKSimon
Reviewed By: RKSimon
Subscribers: lebedev.ri, nemanjai, jvesely, nhaehnle, javed.absar, jsji, jdoerfert, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59535
llvm-svn: 357745
2019-04-05 15:44:09 +08:00
|
|
|
%uneg = sub i8 0, 2
|
2011-12-22 02:56:22 +08:00
|
|
|
%1 = atomicrmw umin i8* %val, i8 %uneg monotonic
|
|
|
|
store i8 %1, i8* %old
|
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umax_1
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umax_1
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-22 02:56:22 +08:00
|
|
|
%2 = atomicrmw umax i8* %val, i8 1 monotonic
|
|
|
|
store i8 %2, i8* %old
|
|
|
|
; CHECK: ldrex
|
|
|
|
; CHECK: cmp
|
|
|
|
; CHECK: strex
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: bl ___sync_fetch_and_umax_1
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: bl ___sync_fetch_and_umax_1
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL: cmp
|
|
|
|
; CHECK-BAREMETAL-NOT: __sync
|
2011-12-22 02:56:22 +08:00
|
|
|
%3 = atomicrmw umax i8* %val, i8 0 monotonic
|
|
|
|
store i8 %3, i8* %old
|
|
|
|
ret void
|
|
|
|
}
|
2012-08-31 10:08:34 +08:00
|
|
|
|
|
|
|
; func4: a single monotonic atomicrmw add of 1 through the pointer argument,
; whose result is returned. The patterns below first locate the function name
; in the output and then require that r4 is not mentioned afterwards, up to
; the next positive match for the generic prefix.
; CHECK: func4
|
|
|
|
; This function should not need to use callee-saved registers.
|
|
|
|
; rdar://problem/12203728
|
|
|
|
; CHECK-NOT: r4
|
|
|
|
define i32 @func4(i32* %p) nounwind optsize ssp {
|
|
|
|
entry:
|
|
|
|
%0 = atomicrmw add i32* %p, i32 1 monotonic
|
|
|
|
ret i32 %0
|
|
|
|
}
|
2014-04-03 21:06:54 +08:00
|
|
|
|
|
|
|
; test_cmpxchg_fail_order: cmpxchg with seq_cst success ordering and monotonic
; failure ordering; the function returns element 0 of the result pair.
; The armv7 patterns expect: an initial ldrex / cmp / bne to the failure
; block, a dmb ish before the store loop, strex / cmp / beq to the success
; block, a reload and compare that branches back to the loop, a failure block
; containing clrex and a return, and a success block containing dmb ish and a
; return. The thumbv7 patterns follow the same shape but expect the success
; path as predicated dmbeq / bxeq instructions instead of a separate block.
define i32 @test_cmpxchg_fail_order(i32 *%addr, i32 %desired, i32 %new) {
|
|
|
|
; CHECK-LABEL: test_cmpxchg_fail_order:
|
|
|
|
|
IR: add "cmpxchg weak" variant to support permitted failure.
This commit adds a weak variant of the cmpxchg operation, as described
in C++11. A cmpxchg instruction with this modifier is permitted to
fail to store, even if the comparison indicated it should.
As a result, cmpxchg instructions must return a flag indicating
success in addition to their original iN value loaded. Thus, for
uniformity *all* cmpxchg instructions now return "{ iN, i1 }". The
second flag is 1 when the store succeeded.
At the DAG level, a new ATOMIC_CMP_SWAP_WITH_SUCCESS node has been
added as the natural representation for the new cmpxchg instructions.
It is a strong cmpxchg.
By default this gets Expanded to the existing ATOMIC_CMP_SWAP during
Legalization, so existing backends should see no change in behaviour.
If they wish to deal with the enhanced node instead, they can call
setOperationAction on it. Beware: as a node with 2 results, it cannot
be selected from TableGen.
Currently, no use is made of the extra information provided in this
patch. Test updates are almost entirely adapting the input IR to the
new scheme.
Summary for out of tree users:
------------------------------
+ Legacy Bitcode files are upgraded during read.
+ Legacy assembly IR files will be invalid.
+ Front-ends must adapt to different type for "cmpxchg".
+ Backends should be unaffected by default.
llvm-svn: 210903
2014-06-13 22:24:07 +08:00
|
|
|
%pair = cmpxchg i32* %addr, i32 %desired, i32 %new seq_cst monotonic
|
|
|
|
%oldval = extractvalue { i32, i1 } %pair, 0
|
2018-02-28 00:59:10 +08:00
|
|
|
; CHECK-ARMV7: mov r[[ADDR:[0-9]+]], r0
|
|
|
|
; CHECK-ARMV7: ldrex [[OLDVAL:r[0-9]+]], [r0]
|
2015-09-23 01:22:58 +08:00
|
|
|
; CHECK-ARMV7: cmp [[OLDVAL]], r1
|
|
|
|
; CHECK-ARMV7: bne [[FAIL_BB:\.?LBB[0-9]+_[0-9]+]]
|
2016-02-23 04:55:50 +08:00
|
|
|
; CHECK-ARMV7: dmb ish
|
|
|
|
; CHECK-ARMV7: [[LOOP_BB:\.?LBB.*]]:
|
2015-09-23 01:22:58 +08:00
|
|
|
; CHECK-ARMV7: strex [[SUCCESS:r[0-9]+]], r2, [r[[ADDR]]]
|
|
|
|
; CHECK-ARMV7: cmp [[SUCCESS]], #0
|
2016-02-23 04:55:50 +08:00
|
|
|
; CHECK-ARMV7: beq [[SUCCESS_BB:\.?LBB.*]]
|
|
|
|
; CHECK-ARMV7: ldrex [[OLDVAL]], [r[[ADDR]]]
|
|
|
|
; CHECK-ARMV7: cmp [[OLDVAL]], r1
|
|
|
|
; CHECK-ARMV7: beq [[LOOP_BB]]
|
2015-09-23 01:22:58 +08:00
|
|
|
; CHECK-ARMV7: [[FAIL_BB]]:
|
|
|
|
; CHECK-ARMV7: clrex
|
|
|
|
; CHECK-ARMV7: bx lr
|
2016-02-23 04:55:50 +08:00
|
|
|
; CHECK-ARMV7: [[SUCCESS_BB]]:
|
|
|
|
; CHECK-ARMV7: dmb ish
|
|
|
|
; CHECK-ARMV7: bx lr
|
2015-09-23 01:22:58 +08:00
|
|
|
|
2018-02-28 00:59:10 +08:00
|
|
|
; CHECK-T2: mov r[[ADDR:[0-9]+]], r0
|
|
|
|
; CHECK-T2: ldrex [[OLDVAL:r[0-9]+]], [r0]
|
2015-09-23 01:22:58 +08:00
|
|
|
; CHECK-T2: cmp [[OLDVAL]], r1
|
2016-02-23 04:55:50 +08:00
|
|
|
; CHECK-T2: bne [[FAIL_BB:\.?LBB.*]]
|
|
|
|
; CHECK-T2: dmb ish
|
|
|
|
; CHECK-T2: [[LOOP_BB:\.?LBB.*]]:
|
2015-09-23 01:22:58 +08:00
|
|
|
; CHECK-T2: strex [[SUCCESS:r[0-9]+]], r2, [r[[ADDR]]]
|
|
|
|
; CHECK-T2: cmp [[SUCCESS]], #0
|
|
|
|
; CHECK-T2: dmbeq ish
|
|
|
|
; CHECK-T2: bxeq lr
|
2016-02-23 04:55:50 +08:00
|
|
|
; CHECK-T2: ldrex [[OLDVAL]], [r[[ADDR]]]
|
|
|
|
; CHECK-T2: cmp [[OLDVAL]], r1
|
|
|
|
; CHECK-T2: beq [[LOOP_BB]]
|
|
|
|
; CHECK-T2: clrex
|
2014-04-03 21:06:54 +08:00
|
|
|
|
|
|
|
ret i32 %oldval
|
|
|
|
}
|
|
|
|
|
|
|
|
; test_cmpxchg_fail_order1: cmpxchg with acquire ordering for both success and
; failure; the function returns element 0 of the result pair.
; The patterns require that no dmb ish appears before the loop label, then
; expect the ldrex / cmp / bne / strex / cmp / bne loop, a dmb ish followed by
; a return on the success path, and a failure block that starts with clrex and
; is likewise followed by dmb ish and a return.
define i32 @test_cmpxchg_fail_order1(i32 *%addr, i32 %desired, i32 %new) {
|
|
|
|
; CHECK-LABEL: test_cmpxchg_fail_order1:
|
|
|
|
|
IR: add "cmpxchg weak" variant to support permitted failure.
This commit adds a weak variant of the cmpxchg operation, as described
in C++11. A cmpxchg instruction with this modifier is permitted to
fail to store, even if the comparison indicated it should.
As a result, cmpxchg instructions must return a flag indicating
success in addition to their original iN value loaded. Thus, for
uniformity *all* cmpxchg instructions now return "{ iN, i1 }". The
second flag is 1 when the store succeeded.
At the DAG level, a new ATOMIC_CMP_SWAP_WITH_SUCCESS node has been
added as the natural representation for the new cmpxchg instructions.
It is a strong cmpxchg.
By default this gets Expanded to the existing ATOMIC_CMP_SWAP during
Legalization, so existing backends should see no change in behaviour.
If they wish to deal with the enhanced node instead, they can call
setOperationAction on it. Beware: as a node with 2 results, it cannot
be selected from TableGen.
Currently, no use is made of the extra information provided in this
patch. Test updates are almost entirely adapting the input IR to the
new scheme.
Summary for out of tree users:
------------------------------
+ Legacy Bitcode files are upgraded during read.
+ Legacy assembly IR files will be invalid.
+ Front-ends must adapt to different type for "cmpxchg".
+ Backends should be unaffected by default.
llvm-svn: 210903
2014-06-13 22:24:07 +08:00
|
|
|
%pair = cmpxchg i32* %addr, i32 %desired, i32 %new acquire acquire
|
|
|
|
%oldval = extractvalue { i32, i1 } %pair, 0
|
2014-04-03 21:06:54 +08:00
|
|
|
; CHECK-NOT: dmb ish
|
|
|
|
; CHECK: [[LOOP_BB:\.?LBB[0-9]+_1]]:
|
|
|
|
; CHECK: ldrex [[OLDVAL:r[0-9]+]], [r[[ADDR:[0-9]+]]]
|
|
|
|
; CHECK: cmp [[OLDVAL]], r1
|
2015-09-23 01:22:58 +08:00
|
|
|
; CHECK: bne [[FAIL_BB:\.?LBB[0-9]+_[0-9]+]]
|
2014-04-03 21:06:54 +08:00
|
|
|
; CHECK: strex [[SUCCESS:r[0-9]+]], r2, [r[[ADDR]]]
|
|
|
|
; CHECK: cmp [[SUCCESS]], #0
|
|
|
|
; CHECK: bne [[LOOP_BB]]
|
2017-02-01 07:48:32 +08:00
|
|
|
; CHECK: dmb ish
|
|
|
|
; CHECK: bx lr
|
2015-09-23 01:22:58 +08:00
|
|
|
; CHECK: [[FAIL_BB]]:
|
|
|
|
; CHECK-NEXT: clrex
|
2014-04-03 21:06:54 +08:00
|
|
|
; CHECK: dmb ish
|
|
|
|
; CHECK: bx lr
|
|
|
|
|
|
|
|
ret i32 %oldval
|
|
|
|
}
|
2014-08-21 22:35:47 +08:00
|
|
|
|
|
|
|
; load_load_add_acquire: two acquire atomic i32 loads (from %mem1 and %mem2)
; whose values are added and returned.
; The generic armv7/thumbv7 patterns expect each ldr to be followed by a dmb
; and the sum to land in r0; the cortex-m0 patterns expect the same ldr / dmb
; pairs. The plain thumbv6 patterns instead expect two references to
; ___sync_val_compare_and_swap_4. The bare-metal patterns expect both loads
; and the add with no dmb between them.
define i32 @load_load_add_acquire(i32* %mem1, i32* %mem2) nounwind {
|
|
|
|
; CHECK-LABEL: load_load_add_acquire
|
2015-02-28 05:17:42 +08:00
|
|
|
%val1 = load atomic i32, i32* %mem1 acquire, align 4
|
|
|
|
%val2 = load atomic i32, i32* %mem2 acquire, align 4
|
2014-08-21 22:35:47 +08:00
|
|
|
%tmp = add i32 %val1, %val2
|
|
|
|
|
|
|
|
; CHECK: ldr {{r[0-9]}}, [r0]
|
|
|
|
; CHECK: dmb
|
|
|
|
; CHECK: ldr {{r[0-9]}}, [r1]
|
|
|
|
; CHECK: dmb
|
|
|
|
; CHECK: add r0,
|
|
|
|
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: ldr {{r[0-9]}}, [r0]
|
|
|
|
; CHECK-T1-M0: dmb
|
|
|
|
; CHECK-T1-M0: ldr {{r[0-9]}}, [r1]
|
|
|
|
; CHECK-T1-M0: dmb
|
|
|
|
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: ___sync_val_compare_and_swap_4
|
|
|
|
; CHECK-T1: ___sync_val_compare_and_swap_4
|
2014-08-21 22:35:47 +08:00
|
|
|
|
|
|
|
; CHECK-BAREMETAL: ldr {{r[0-9]}}, [r0]
|
|
|
|
; CHECK-BAREMETAL-NOT: dmb
|
|
|
|
; CHECK-BAREMETAL: ldr {{r[0-9]}}, [r1]
|
|
|
|
; CHECK-BAREMETAL-NOT: dmb
|
|
|
|
; CHECK-BAREMETAL: add r0,
|
|
|
|
|
|
|
|
ret i32 %tmp
|
|
|
|
}
|
|
|
|
|
|
|
|
; store_store_release: two release atomic i32 stores, %val1 to %mem1 followed
; by %val2 to %mem2.
; The generic armv7/thumbv7 and cortex-m0 patterns expect a dmb ahead of each
; str. The plain thumbv6 patterns expect two references to
; ___sync_lock_test_and_set. The bare-metal patterns expect both stores with
; no dmb ahead of either.
define void @store_store_release(i32* %mem1, i32 %val1, i32* %mem2, i32 %val2) {
|
|
|
|
; CHECK-LABEL: store_store_release
|
|
|
|
store atomic i32 %val1, i32* %mem1 release, align 4
|
|
|
|
store atomic i32 %val2, i32* %mem2 release, align 4
|
|
|
|
|
|
|
|
; CHECK: dmb
|
|
|
|
; CHECK: str r1, [r0]
|
|
|
|
; CHECK: dmb
|
|
|
|
; CHECK: str r3, [r2]
|
|
|
|
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: ___sync_lock_test_and_set
|
|
|
|
; CHECK-T1: ___sync_lock_test_and_set
|
2014-08-21 22:35:47 +08:00
|
|
|
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: dmb
|
|
|
|
; CHECK-T1-M0: str r1, [r0]
|
|
|
|
; CHECK-T1-M0: dmb
|
|
|
|
; CHECK-T1-M0: str r3, [r2]
|
|
|
|
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL-NOT: dmb
|
2018-07-04 21:28:39 +08:00
|
|
|
; CHECK-BAREMETAL: str r1, [r0]
|
2014-08-21 22:35:47 +08:00
|
|
|
; CHECK-BAREMETAL-NOT: dmb
|
2018-07-04 21:28:39 +08:00
|
|
|
; CHECK-BAREMETAL: str r3, [r2]
|
2014-08-21 22:35:47 +08:00
|
|
|
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; load_fence_store_monotonic: a monotonic atomic load from %mem1, a seq_cst
; fence, then a monotonic atomic store of the loaded value to %mem2.
; The generic armv7/thumbv7 and cortex-m0 patterns expect ldr, dmb, str with
; the stored register being the one that was loaded. The plain thumbv6
; patterns accept either a dmb or a call to ___sync_synchronize between the
; load and the store. The bare-metal patterns expect the load and store with
; no dmb between them.
define void @load_fence_store_monotonic(i32* %mem1, i32* %mem2) {
|
|
|
|
; CHECK-LABEL: load_fence_store_monotonic
|
2015-02-28 05:17:42 +08:00
|
|
|
%val = load atomic i32, i32* %mem1 monotonic, align 4
|
2014-08-21 22:35:47 +08:00
|
|
|
fence seq_cst
|
|
|
|
store atomic i32 %val, i32* %mem2 monotonic, align 4
|
|
|
|
|
|
|
|
; CHECK: ldr [[R0:r[0-9]]], [r0]
|
|
|
|
; CHECK: dmb
|
|
|
|
; CHECK: str [[R0]], [r1]
|
|
|
|
|
2016-11-04 05:49:08 +08:00
|
|
|
; CHECK-T1-M0: ldr [[R0:r[0-9]]], [r0]
|
|
|
|
; CHECK-T1-M0: dmb
|
|
|
|
; CHECK-T1-M0: str [[R0]], [r1]
|
|
|
|
|
2016-05-11 03:17:47 +08:00
|
|
|
; CHECK-T1: ldr [[R0:r[0-9]]], [{{r[0-9]+}}]
|
|
|
|
; CHECK-T1: {{dmb|bl ___sync_synchronize}}
|
|
|
|
; CHECK-T1: str [[R0]], [{{r[0-9]+}}]
|
2014-08-21 22:35:47 +08:00
|
|
|
|
|
|
|
; CHECK-BAREMETAL: ldr [[R0:r[0-9]]], [r0]
|
|
|
|
; CHECK-BAREMETAL-NOT: dmb
|
|
|
|
; CHECK-BAREMETAL: str [[R0]], [r1]
|
|
|
|
|
|
|
|
ret void
|
|
|
|
}
|