2015-06-06 00:11:14 +08:00
|
|
|
; RUN: llc < %s -march=bpfel -show-mc-encoding | FileCheck %s
|
BPF backend
Summary:
V8->V9:
- cleanup tests
V7->V8:
- addressed feedback from David:
- switched to range-based 'for' loops
- fixed formatting of tests
V6->V7:
- rebased and adjusted AsmPrinter args
- CamelCased .td, fixed formatting, cleaned up names, removed unused patterns
- diffstat: 3 files changed, 203 insertions(+), 227 deletions(-)
V5->V6:
- addressed feedback from Chandler:
- reinstated full verbose standard banner in all files
- fixed variables that were not in CamelCase
- fixed names of #ifdef in header files
- removed redundant braces in if/else chains with single statements
- fixed comments
- removed trailing empty line
- dropped debug annotations from tests
- diffstat of these changes:
46 files changed, 456 insertions(+), 469 deletions(-)
V4->V5:
- fix setLoadExtAction() interface
- clang-formatted everything where it made sense
V3->V4:
- added CODE_OWNERS entry for BPF backend
V2->V3:
- fix metadata in tests
V1->V2:
- addressed feedback from Tom and Matt
- removed top level change to configure (now everything via 'experimental-backend')
- reworked error reporting via DiagnosticInfo (similar to R600)
- added a few more tests
- added cmake build
- added Triple::bpf
- tested on linux and darwin
V1 cover letter:
---------------------
Recently Linux gained a "universal in-kernel virtual machine", which is called
eBPF or extended BPF. The name comes from "Berkeley Packet Filter", since
the new instruction set is based on it.
This patch adds a new backend that emits the extended BPF instruction set.
The concept and development are covered by the following articles:
http://lwn.net/Articles/599755/
http://lwn.net/Articles/575531/
http://lwn.net/Articles/603983/
http://lwn.net/Articles/606089/
http://lwn.net/Articles/612878/
One of the use cases: dtrace/systemtap alternative.
bpf syscall manpage:
https://git.kernel.org/cgit/linux/kernel/git/torvalds/linux.git/commit/?id=b4fc1a460f3017e958e6a8ea560ea0afd91bf6fe
instruction set description and differences vs classic BPF:
http://git.kernel.org/cgit/linux/kernel/git/torvalds/linux.git/tree/Documentation/networking/filter.txt
Short summary of instruction set:
- 64-bit registers
R0 - return value from in-kernel function, and exit value for BPF program
R1 - R5 - arguments from BPF program to in-kernel function
R6 - R9 - callee saved registers that in-kernel function will preserve
R10 - read-only frame pointer to access stack
- two-operand instructions like +, -, *, mov, load/store
- implicit prologue/epilogue (invisible stack pointer)
- no floating point, no simd
Short history of extended BPF in kernel:
interpreter in 3.15, x64 JIT in 3.16, arm64 JIT, verifier, bpf syscall in 3.18, more to come in the future.
It's a very small and simple backend.
There is no support for global variables, arbitrary function calls, floating point, varargs,
exceptions, indirect jumps, arbitrary pointer arithmetic, alloca, etc.
From C front-end point of view it's very restricted. It's done on purpose, since kernel
rejects all programs that it cannot prove safe. It rejects programs with loops
and with memory accesses via arbitrary pointers. When kernel accepts the program it is
guaranteed that program will terminate and will not crash the kernel.
This patch implements all 'must have' bits. There are several things on TODO list,
so this is not the end of development.
Most of the code is boilerplate code, copy-pasted from other backends.
The only odd things are the lack of < and <= instructions, specialized load_byte intrinsics
and 'compare and goto' as a single instruction.
Current instruction set is fixed, but more instructions can be added in the future.
Signed-off-by: Alexei Starovoitov <alexei.starovoitov@gmail.com>
Subscribers: majnemer, chandlerc, echristo, joerg, pete, rengolin, kristof.beyls, arsenm, t.p.northover, tstellarAMD, aemerson, llvm-commits
Differential Revision: http://reviews.llvm.org/D6494
llvm-svn: 227008
2015-01-25 01:51:26 +08:00
|
|
|
|
|
|
|
; Caller side of the test: invokes each f_* callee with constant arguments.
; The FileCheck expectations inside the body look for every constant being
; loaded into r1, r2, r3 (in argument order) ahead of the matching call.
; NOTE(review): attribute group #0 is referenced here but is not defined in
; the visible part of the file - confirm it exists or is not required.
define void @test() #0 {
|
|
|
|
entry:
|
|
|
|
; CHECK: test:
|
|
|
|
|
|
|
|
; Single i16 argument: expected as a plain immediate move into r1.
; CHECK: mov r1, 123 # encoding: [0xb7,0x01,0x00,0x00,0x7b,0x00,0x00,0x00]
|
|
|
|
; CHECK: call f_i16
|
|
|
|
call void @f_i16(i16 123)
|
|
|
|
|
|
|
|
; Single i32 argument: 12345678 is 0xBC614E, which shows up as the bytes
; 0x4e,0x61,0xbc in the expected encoding.
; CHECK: mov r1, 12345678 # encoding: [0xb7,0x01,0x00,0x00,0x4e,0x61,0xbc,0x00]
|
|
|
|
; CHECK: call f_i32
|
|
|
|
call void @f_i32(i32 12345678)
|
|
|
|
|
|
|
|
; Single i64 argument: 72623859790382856 is 0x0102030405060708, so every byte
; of the immediate is distinct and its placement in the 16-byte ld_64
; encoding is visible.
; CHECK: ld_64 r1, 72623859790382856 # encoding: [0x18,0x01,0x00,0x00,0x08,0x07,0x06,0x05,0x00,0x00,0x00,0x00,0x04,0x03,0x02,0x01]
|
|
|
|
; CHECK: call f_i64
|
|
|
|
call void @f_i64(i64 72623859790382856)
|
|
|
|
|
|
|
|
; Two i32 arguments: expected in r1 and r2.
; CHECK: mov r1, 1234
|
|
|
|
; CHECK: mov r2, 5678
|
|
|
|
; CHECK: call f_i32_i32
|
|
|
|
call void @f_i32_i32(i32 1234, i32 5678)
|
|
|
|
|
|
|
|
; Mixed i16/i32/i16 arguments: expected in r1, r2, r3.
; CHECK: mov r1, 2
|
|
|
|
; CHECK: mov r2, 3
|
|
|
|
; CHECK: mov r3, 4
|
|
|
|
; CHECK: call f_i16_i32_i16
|
|
|
|
call void @f_i16_i32_i16(i16 2, i32 3, i16 4)
|
|
|
|
|
|
|
|
; Mixed i16/i64/i16 arguments: the i64 in the middle is expected to be
; loaded with ld_64 rather than mov.
; CHECK: mov r1, 5
|
|
|
|
; CHECK: ld_64 r2, 7262385979038285
|
|
|
|
; CHECK: mov r3, 6
|
|
|
|
; CHECK: call f_i16_i64_i16
|
|
|
|
call void @f_i16_i64_i16(i16 5, i64 7262385979038285, i16 6)
|
|
|
|
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Zero-initialized common globals used as store targets by the f_* callees.
; NOTE(review): @g_i32 and @g_i64 are declared with less than their natural
; alignment (2 and 4), and some stores in the callees state a larger
; alignment than declared here - presumably deliberate; confirm before
; changing either side.
@g_i16 = common global i16 0, align 2
|
|
|
|
@g_i32 = common global i32 0, align 2
|
|
|
|
@g_i64 = common global i64 0, align 4
|
|
|
|
|
|
|
|
; Callee taking one i16: performs a volatile store of %a to @g_i16.
; The expectation is a single halfword store (sth) of r1 at offset 0 of an
; address held in r2.
define void @f_i16(i16 %a) #0 {
|
|
|
|
; CHECK: f_i16:
|
|
|
|
; CHECK: sth 0(r2), r1 # encoding: [0x6b,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
|
|
|
|
store volatile i16 %a, i16* @g_i16, align 2
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Callee taking one i32: performs a volatile store of %a to @g_i32 with the
; store annotated align 2. The expectations look for two halfword stores,
; at offsets 0 and 2, instead of one word store.
define void @f_i32(i32 %a) #0 {
|
|
|
|
; CHECK: f_i32:
|
|
|
|
; CHECK: sth 0(r2), r1 # encoding: [0x6b,0x12,0x00,0x00,0x00,0x00,0x00,0x00]
|
|
|
|
; CHECK: sth 2(r2), r1 # encoding: [0x6b,0x12,0x02,0x00,0x00,0x00,0x00,0x00]
|
|
|
|
store volatile i32 %a, i32* @g_i32, align 2
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Callee taking one i64: performs a volatile store of %a to @g_i64.
; The expectations look for two word stores (stw), at offsets 0 and 4.
; NOTE(review): the store is annotated align 2 while the expected output
; uses word-sized stores; presumably this follows from @g_i64 being
; declared align 4 - confirm.
define void @f_i64(i64 %a) #0 {
|
|
|
|
; CHECK: f_i64:
|
|
|
|
; CHECK: stw 0(r2), r1
|
|
|
|
; CHECK: stw 4(r2), r1 # encoding: [0x63,0x12,0x04,0x00,0x00,0x00,0x00,0x00]
|
|
|
|
store volatile i64 %a, i64* @g_i64, align 2
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Callee taking two i32 values: stores %a and then %b to @g_i32, both as
; volatile stores. The expectations look for one word store per argument,
; from r1 and then r2, through an address held in r3.
; NOTE(review): both stores state align 4 although @g_i32 is declared
; align 2 in this file - presumably intentional so that a single stw is
; produced; confirm.
define void @f_i32_i32(i32 %a, i32 %b) #0 {
|
|
|
|
; CHECK: f_i32_i32:
|
|
|
|
; CHECK: stw 0(r3), r1
|
|
|
|
store volatile i32 %a, i32* @g_i32, align 4
|
|
|
|
; CHECK: stw 0(r3), r2
|
|
|
|
store volatile i32 %b, i32* @g_i32, align 4
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Callee taking i16, i32, i16: stores %a to @g_i16, %b to @g_i32, then %c to
; @g_i16, all as volatile stores. The expectations look for the three
; arguments being stored from r1, r2 and r3 in that order.
; NOTE(review): the expected i32 store uses r1 as its base address, i.e. the
; register that carried %a is expected to be reused once %a has been
; stored - confirm this is still the allocator's choice when updating.
define void @f_i16_i32_i16(i16 %a, i32 %b, i16 %c) #0 {
|
|
|
|
; CHECK: f_i16_i32_i16:
|
|
|
|
; CHECK: sth 0(r4), r1
|
|
|
|
store volatile i16 %a, i16* @g_i16, align 2
|
|
|
|
; CHECK: stw 0(r1), r2
|
|
|
|
store volatile i32 %b, i32* @g_i32, align 4
|
|
|
|
; CHECK: sth 0(r4), r3
|
|
|
|
store volatile i16 %c, i16* @g_i16, align 2
|
|
|
|
ret void
|
|
|
|
}
|
|
|
|
|
|
|
|
; Callee taking i16, i64, i16: stores %a to @g_i16, %b to @g_i64, then %c to
; @g_i16, all as volatile stores. The expectations look for the i64 being
; written with a single doubleword store (std) from r2, between the two
; halfword stores from r1 and r3.
; NOTE(review): the i64 store states align 8 although @g_i64 is declared
; align 4 in this file - presumably intentional so that a single std is
; produced; confirm.
define void @f_i16_i64_i16(i16 %a, i64 %b, i16 %c) #0 {
|
|
|
|
; CHECK: f_i16_i64_i16:
|
|
|
|
; CHECK: sth 0(r4), r1
|
|
|
|
store volatile i16 %a, i16* @g_i16, align 2
|
|
|
|
; CHECK: std 0(r1), r2 # encoding: [0x7b,0x21,0x00,0x00,0x00,0x00,0x00,0x00]
|
|
|
|
store volatile i64 %b, i64* @g_i64, align 8
|
|
|
|
; CHECK: sth 0(r4), r3
|
|
|
|
store volatile i16 %c, i16* @g_i16, align 2
|
|
|
|
ret void
|
|
|
|
}
|