2012-04-09 09:43:17 +08:00
|
|
|
; RUN: llc < %s -march=x86 -mtriple=i386-linux-gnu | FileCheck -check-prefix=X32_LINUX %s
|
|
|
|
; RUN: llc < %s -march=x86-64 -mtriple=x86_64-linux-gnu | FileCheck -check-prefix=X64_LINUX %s
|
|
|
|
; RUN: llc < %s -march=x86 -mtriple=x86-pc-win32 | FileCheck -check-prefix=X32_WIN %s
|
|
|
|
; RUN: llc < %s -march=x86-64 -mtriple=x86_64-pc-win32 | FileCheck -check-prefix=X64_WIN %s
|
|
|
|
|
|
|
|
@i1 = thread_local global i32 15
|
|
|
|
@i2 = external thread_local global i32
|
|
|
|
@i3 = internal thread_local global i32 15
|
|
|
|
@i4 = hidden thread_local global i32 15
|
|
|
|
@i5 = external hidden thread_local global i32
|
|
|
|
@s1 = thread_local global i16 15
|
|
|
|
@b1 = thread_local global i8 0
|
|
|
|
|
|
|
|
define i32 @f1() {
|
|
|
|
; X32_LINUX: f1:
|
|
|
|
; X32_LINUX: movl %gs:i1@NTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f1:
|
|
|
|
; X64_LINUX: movl %fs:i1@TPOFF, %eax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f1:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: movl _i1@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f1:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: movl i1@SECREL(%rax), %eax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i32* @i1
|
|
|
|
ret i32 %tmp1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32* @f2() {
|
|
|
|
; X32_LINUX: f2:
|
|
|
|
; X32_LINUX: movl %gs:0, %eax
|
|
|
|
; X32_LINUX-NEXT: leal i1@NTPOFF(%eax), %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f2:
|
|
|
|
; X64_LINUX: movq %fs:0, %rax
|
|
|
|
; X64_LINUX-NEXT: leaq i1@TPOFF(%rax), %rax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f2:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: leal _i1@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f2:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: leaq i1@SECREL(%rax), %rax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
ret i32* @i1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @f3() nounwind {
|
|
|
|
; X32_LINUX: f3:
|
|
|
|
; X32_LINUX: movl i2@INDNTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: movl %gs:(%eax), %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f3:
|
|
|
|
; X64_LINUX: movq i2@GOTTPOFF(%rip), %rax
|
|
|
|
; X64_LINUX-NEXT: movl %fs:(%rax), %eax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f3:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: movl _i2@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f3:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: movl i2@SECREL(%rax), %eax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i32* @i2
|
|
|
|
ret i32 %tmp1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32* @f4() {
|
|
|
|
; X32_LINUX: f4:
|
|
|
|
; X32_LINUX: movl %gs:0, %eax
|
|
|
|
; X32_LINUX-NEXT: addl i2@INDNTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f4:
|
|
|
|
; X64_LINUX: movq %fs:0, %rax
|
|
|
|
; X64_LINUX-NEXT: addq i2@GOTTPOFF(%rip), %rax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f4:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: leal _i2@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f4:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: leaq i2@SECREL(%rax), %rax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
ret i32* @i2
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @f5() nounwind {
|
|
|
|
; X32_LINUX: f5:
|
|
|
|
; X32_LINUX: movl %gs:i3@NTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f5:
|
|
|
|
; X64_LINUX: movl %fs:i3@TPOFF, %eax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f5:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: movl _i3@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f5:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: movl i3@SECREL(%rax), %eax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i32* @i3
|
|
|
|
ret i32 %tmp1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32* @f6() {
|
|
|
|
; X32_LINUX: f6:
|
|
|
|
; X32_LINUX: movl %gs:0, %eax
|
|
|
|
; X32_LINUX-NEXT: leal i3@NTPOFF(%eax), %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f6:
|
|
|
|
; X64_LINUX: movq %fs:0, %rax
|
|
|
|
; X64_LINUX-NEXT: leaq i3@TPOFF(%rax), %rax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f6:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: leal _i3@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f6:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: leaq i3@SECREL(%rax), %rax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
ret i32* @i3
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @f7() {
|
|
|
|
; X32_LINUX: f7:
|
|
|
|
; X32_LINUX: movl %gs:i4@NTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f7:
|
|
|
|
; X64_LINUX: movl %fs:i4@TPOFF, %eax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i32* @i4
|
|
|
|
ret i32 %tmp1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32* @f8() {
|
|
|
|
; X32_LINUX: f8:
|
|
|
|
; X32_LINUX: movl %gs:0, %eax
|
|
|
|
; X32_LINUX-NEXT: leal i4@NTPOFF(%eax), %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f8:
|
|
|
|
; X64_LINUX: movq %fs:0, %rax
|
|
|
|
; X64_LINUX-NEXT: leaq i4@TPOFF(%rax), %rax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
ret i32* @i4
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @f9() {
|
|
|
|
; X32_LINUX: f9:
|
|
|
|
; X32_LINUX: movl %gs:i5@NTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f9:
|
|
|
|
; X64_LINUX: movl %fs:i5@TPOFF, %eax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i32* @i5
|
|
|
|
ret i32 %tmp1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32* @f10() {
|
|
|
|
; X32_LINUX: f10:
|
|
|
|
; X32_LINUX: movl %gs:0, %eax
|
|
|
|
; X32_LINUX-NEXT: leal i5@NTPOFF(%eax), %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f10:
|
|
|
|
; X64_LINUX: movq %fs:0, %rax
|
|
|
|
; X64_LINUX-NEXT: leaq i5@TPOFF(%rax), %rax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
ret i32* @i5
|
|
|
|
}
|
|
|
|
|
|
|
|
define i16 @f11() {
|
|
|
|
; X32_LINUX: f11:
|
|
|
|
; X32_LINUX: movzwl %gs:s1@NTPOFF, %eax
|
|
|
|
; Why is this kill line here, but no where else?
|
|
|
|
; X32_LINUX-NEXT: # kill
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f11:
|
|
|
|
; X64_LINUX: movzwl %fs:s1@TPOFF, %eax
|
|
|
|
; X64_LINUX-NEXT: # kill
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f11:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: movzwl _s1@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: # kill
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f11:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: movzwl s1@SECREL(%rax), %eax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: # kill
|
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i16* @s1
|
|
|
|
ret i16 %tmp1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @f12() {
|
|
|
|
; X32_LINUX: f12:
|
|
|
|
; X32_LINUX: movswl %gs:s1@NTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f12:
|
|
|
|
; X64_LINUX: movswl %fs:s1@TPOFF, %eax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f12:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: movswl _s1@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f12:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: movswl s1@SECREL(%rax), %eax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i16* @s1
|
|
|
|
%tmp2 = sext i16 %tmp1 to i32
|
|
|
|
ret i32 %tmp2
|
|
|
|
}
|
|
|
|
|
|
|
|
define i8 @f13() {
|
|
|
|
; X32_LINUX: f13:
|
|
|
|
; X32_LINUX: movb %gs:b1@NTPOFF, %al
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f13:
|
|
|
|
; X64_LINUX: movb %fs:b1@TPOFF, %al
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f13:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: movb _b1@SECREL(%eax), %al
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f13:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: movb b1@SECREL(%rax), %al
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i8* @b1
|
|
|
|
ret i8 %tmp1
|
|
|
|
}
|
|
|
|
|
|
|
|
define i32 @f14() {
|
|
|
|
; X32_LINUX: f14:
|
|
|
|
; X32_LINUX: movsbl %gs:b1@NTPOFF, %eax
|
|
|
|
; X32_LINUX-NEXT: ret
|
|
|
|
; X64_LINUX: f14:
|
|
|
|
; X64_LINUX: movsbl %fs:b1@TPOFF, %eax
|
|
|
|
; X64_LINUX-NEXT: ret
|
|
|
|
; X32_WIN: f14:
|
|
|
|
; X32_WIN: movl __tls_index, %eax
|
|
|
|
; X32_WIN-NEXT: movl %fs:__tls_array, %ecx
|
|
|
|
; X32_WIN-NEXT: movl (%ecx,%eax,4), %eax
|
|
|
|
; X32_WIN-NEXT: movsbl _b1@SECREL(%eax), %eax
|
|
|
|
; X32_WIN-NEXT: ret
|
|
|
|
; X64_WIN: f14:
|
|
|
|
; X64_WIN: movl _tls_index(%rip), %eax
|
|
|
|
; X64_WIN-NEXT: movq %gs:88, %rcx
|
|
|
|
; X64_WIN-NEXT: movq (%rcx,%rax,8), %rax
|
Cleanup and relax a restriction on the matching of global offsets into
x86 addressing modes. This allows PIE-based TLS offsets to fit directly
into an addressing mode immediate offset, which is the last remaining
code quality issue from PR12380. With this patch, that PR is completely
fixed.
To understand why this patch is correct to match these offsets into
addressing mode immediates, break it down by cases:
1) 32-bit is trivially correct, and unmodified here.
2) 64-bit non-small mode is unchanged and never matches.
3) 64-bit small PIC code which is RIP-relative is handled specially in
the match to try to fit RIP into the base register. If it fails, it
now early exits. This behavior is unchanged by the patch.
4) 64-bit small non-PIC code which is not RIP-relative continues to work
as it did before. The reason these immediates are safe is because the
ABI ensures they fit in small mode. This behavior is unchanged.
5) 64-bit small PIC code which is *not* using RIP-relative addressing.
This is the only case changed by the patch, and the primary place you
see it is in TLS, either the win64 section offset TLS or Linux
local-exec TLS model in a PIC compilation. Here the ABI again ensures
that the immediates fit because we are in small mode, and any other
operations required due to the PIC relocation model have been handled
externally to the Wrapper node (extra loads etc are made around the
wrapper node in ISelLowering).
I've tested this as much as I can comparing it with GCC's output, and
everything appears safe. I discussed this with Anton and it made sense
to him at least at face value. That said, if there are issues with PIC
code after this patch, yell and we can revert it.
llvm-svn: 154304
2012-04-09 10:13:06 +08:00
|
|
|
; X64_WIN-NEXT: movsbl b1@SECREL(%rax), %eax
|
2012-04-09 09:43:17 +08:00
|
|
|
; X64_WIN-NEXT: ret
|
|
|
|
|
|
|
|
entry:
|
|
|
|
%tmp1 = load i8* @b1
|
|
|
|
%tmp2 = sext i8 %tmp1 to i32
|
|
|
|
ret i32 %tmp2
|
|
|
|
}
|
|
|
|
|