forked from OSchip/llvm-project
[WebAssembly] memory.copy
Summary: Depends on D57495. Reviewers: aheejin, dschuff Subscribers: sbc100, jgravelle-google, hiraditya, sunfish Differential Revision: https://reviews.llvm.org/D57498 llvm-svn: 353127
This commit is contained in:
parent
1a17032b78
commit
d99af23765
|
@ -25,5 +25,6 @@ HANDLE_NODETYPE(VEC_SHL)
|
|||
HANDLE_NODETYPE(VEC_SHR_S)
|
||||
HANDLE_NODETYPE(VEC_SHR_U)
|
||||
HANDLE_NODETYPE(THROW)
|
||||
HANDLE_NODETYPE(MEMORY_COPY)
|
||||
|
||||
// add memory opcodes starting at ISD::FIRST_TARGET_MEMORY_OPCODE here...
|
||||
|
|
|
@ -243,6 +243,12 @@ WebAssemblyTargetLowering::WebAssemblyTargetLowering(
|
|||
setOperationAction(ISD::INTRINSIC_VOID, MVT::Other, Custom);
|
||||
|
||||
setMaxAtomicSizeInBitsSupported(64);
|
||||
|
||||
if (Subtarget->hasBulkMemory()) {
|
||||
// Using memory.copy is always better than using multiple loads and stores
|
||||
MaxStoresPerMemcpy = 1;
|
||||
MaxStoresPerMemcpyOptSize = 1;
|
||||
}
|
||||
}
|
||||
|
||||
TargetLowering::AtomicExpansionKind
|
||||
|
|
|
@ -0,0 +1,39 @@
|
|||
// WebAssemblyInstrBulkMemory.td - bulk memory codegen support --*- tablegen -*-
|
||||
//
|
||||
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
// See https://llvm.org/LICENSE.txt for license information.
|
||||
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
//
|
||||
//===----------------------------------------------------------------------===//
|
||||
///
|
||||
/// \file
|
||||
/// WebAssembly bulk memory codegen constructs.
|
||||
///
|
||||
//===----------------------------------------------------------------------===//
|
||||
|
||||
// Instruction requiring HasBulkMemory and the bulk memory prefix byte
|
||||
multiclass BULK_I<dag oops_r, dag iops_r, dag oops_s, dag iops_s,
|
||||
list<dag> pattern_r, string asmstr_r = "",
|
||||
string asmstr_s = "", bits<32> simdop = -1> {
|
||||
defm "" : I<oops_r, iops_r, oops_s, iops_s, pattern_r, asmstr_r, asmstr_s,
|
||||
!or(0xfc00, !and(0xff, simdop))>,
|
||||
Requires<[HasBulkMemory]>;
|
||||
}
|
||||
|
||||
// Bespoke types and nodes for bulk memory ops
|
||||
def wasm_memcpy_t : SDTypeProfile<0, 3,
|
||||
[SDTCisPtrTy<0>, SDTCisPtrTy<1>, SDTCisInt<2>]
|
||||
>;
|
||||
def wasm_memcpy : SDNode<"WebAssemblyISD::MEMORY_COPY", wasm_memcpy_t,
|
||||
[SDNPHasChain, SDNPMayLoad, SDNPMayStore]>;
|
||||
|
||||
//===----------------------------------------------------------------------===//
|
||||
// memory.copy
|
||||
//===----------------------------------------------------------------------===//
|
||||
|
||||
let mayLoad = 1, mayStore = 1 in
|
||||
defm MEMORY_COPY : BULK_I<(outs), (ins I32:$dst, I32:$src, I32:$len),
|
||||
(outs), (ins),
|
||||
[(wasm_memcpy I32:$dst, I32:$src, I32:$len)],
|
||||
"memory.copy\t$dst, $src, $len",
|
||||
"memory.copy", 0x0a>;
|
|
@ -315,3 +315,4 @@ include "WebAssemblyInstrFloat.td"
|
|||
include "WebAssemblyInstrAtomics.td"
|
||||
include "WebAssemblyInstrSIMD.td"
|
||||
include "WebAssemblyInstrExceptRef.td"
|
||||
include "WebAssemblyInstrBulkMemory.td"
|
||||
|
|
|
@ -17,3 +17,16 @@ using namespace llvm;
|
|||
#define DEBUG_TYPE "wasm-selectiondag-info"
|
||||
|
||||
WebAssemblySelectionDAGInfo::~WebAssemblySelectionDAGInfo() = default; // anchor
|
||||
|
||||
SDValue WebAssemblySelectionDAGInfo::EmitTargetCodeForMemcpy(
|
||||
SelectionDAG &DAG, const SDLoc &DL, SDValue Chain, SDValue Op1, SDValue Op2,
|
||||
SDValue Op3, unsigned Align, bool isVolatile, bool AlwaysInline,
|
||||
MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo) const {
|
||||
if (!DAG.getMachineFunction()
|
||||
.getSubtarget<WebAssemblySubtarget>()
|
||||
.hasBulkMemory())
|
||||
return SDValue();
|
||||
|
||||
return DAG.getNode(WebAssemblyISD::MEMORY_COPY, DL, MVT::Other, Chain, Op1,
|
||||
Op2, Op3);
|
||||
}
|
||||
|
|
|
@ -22,6 +22,12 @@ namespace llvm {
|
|||
class WebAssemblySelectionDAGInfo final : public SelectionDAGTargetInfo {
|
||||
public:
|
||||
~WebAssemblySelectionDAGInfo() override;
|
||||
SDValue EmitTargetCodeForMemcpy(SelectionDAG &DAG, const SDLoc &dl,
|
||||
SDValue Chain, SDValue Op1, SDValue Op2,
|
||||
SDValue Op3, unsigned Align, bool isVolatile,
|
||||
bool AlwaysInline,
|
||||
MachinePointerInfo DstPtrInfo,
|
||||
MachinePointerInfo SrcPtrInfo) const override;
|
||||
};
|
||||
|
||||
} // end namespace llvm
|
||||
|
|
|
@ -1,7 +1,54 @@
|
|||
; RUN: llc < %s -asm-verbose=false -verify-machineinstrs -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers -mattr=+bulk-memory
|
||||
; RUN: llc < %s -asm-verbose=false -verify-machineinstrs -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers -mattr=+bulk-memory | FileCheck %s --check-prefixes CHECK,BULK-MEM
|
||||
; RUN: llc < %s -asm-verbose=false -verify-machineinstrs -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers -mattr=-bulk-memory | FileCheck %s --check-prefixes CHECK,NO-BULK-MEM
|
||||
|
||||
; Test that basic bulk memory codegen works correctly
|
||||
; TODO: implement basic bulk memory codegen
|
||||
|
||||
target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128"
|
||||
target triple = "wasm32-unknown-unknown"
|
||||
|
||||
; CHECK-LABEL: memcpy_i8:
|
||||
; NO-BULK-MEM-NOT: memory.copy
|
||||
; BULK-MEM-NEXT: .functype memcpy_i8 (i32, i32, i32) -> ()
|
||||
; BULK-MEM-NEXT: memory.copy $0, $1, $2
|
||||
; BULK-MEM-NEXT: return
|
||||
declare void @llvm.memcpy.p0i8.p0i8.i32(
|
||||
i8* %dest, i8* %src, i32 %len, i1 %volatile
|
||||
)
|
||||
define void @memcpy_i8(i8* %dest, i8* %src, i32 %len) {
|
||||
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dest, i8* %src, i32 %len, i1 0)
|
||||
ret void
|
||||
}
|
||||
|
||||
; CHECK-LABEL: memcpy_i32:
|
||||
; NO-BULK-MEM-NOT: memory.copy
|
||||
; BULK-MEM-NEXT: .functype memcpy_i32 (i32, i32, i32) -> ()
|
||||
; BULK-MEM-NEXT: memory.copy $0, $1, $2
|
||||
; BULK-MEM-NEXT: return
|
||||
declare void @llvm.memcpy.p0i32.p0i32.i32(
|
||||
i32* %dest, i32* %src, i32 %len, i1 %volatile
|
||||
)
|
||||
define void @memcpy_i32(i32* %dest, i32* %src, i32 %len) {
|
||||
call void @llvm.memcpy.p0i32.p0i32.i32(i32* %dest, i32* %src, i32 %len, i1 0)
|
||||
ret void
|
||||
}
|
||||
|
||||
; CHECK-LABEL: memcpy_1:
|
||||
; CHECK-NEXT: .functype memcpy_1 (i32, i32) -> ()
|
||||
; CHECK-NEXT: i32.load8_u $push[[L0:[0-9]+]]=, 0($1)
|
||||
; CHECK-NEXT: i32.store8 0($0), $pop[[L0]]
|
||||
; CHECK-NEXT: return
|
||||
define void @memcpy_1(i8* %dest, i8* %src) {
|
||||
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dest, i8* %src, i32 1, i1 0)
|
||||
ret void
|
||||
}
|
||||
|
||||
; CHECK-LABEL: memcpy_1024:
|
||||
; NO-BULK-MEM-NOT: memory.copy
|
||||
; BULK-MEM-NEXT: .functype memcpy_1024 (i32, i32) -> ()
|
||||
; BULK-MEM-NEXT: i32.const $push[[L0:[0-9]+]]=, 1024
|
||||
; BULK-MEM-NEXT: memory.copy $0, $1, $pop[[L0]]
|
||||
; BULK-MEM-NEXT: return
|
||||
define void @memcpy_1024(i8* %dest, i8* %src) {
|
||||
call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dest, i8* %src, i32 1024, i1 0)
|
||||
ret void
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue