You've already forked linux-packaging-mono
acceptance-tests
data
docs
external
Newtonsoft.Json
api-doc-tools
api-snapshot
aspnetwebstack
bdwgc
binary-reference-assemblies
bockbuild
boringssl
cecil
cecil-legacy
corefx
corert
helix-binaries
ikdasm
ikvm
illinker-test-assets
linker
llvm-project
clang
clang-tools-extra
compiler-rt
eng
libcxx
libcxxabi
libunwind
lld
lldb
llvm
bindings
cmake
docs
examples
include
lib
Analysis
AsmParser
BinaryFormat
Bitcode
CodeGen
DebugInfo
Demangle
ExecutionEngine
FuzzMutate
Fuzzer
IR
IRReader
LTO
LineEditor
Linker
MC
Object
ObjectYAML
Option
Passes
ProfileData
Support
TableGen
Target
AArch64
AMDGPU
ARC
ARM
AsmParser
Disassembler
InstPrinter
MCTargetDesc
TargetInfo
Utils
A15SDOptimizer.cpp
ARM.h
ARM.td
ARMAsmPrinter.cpp
ARMAsmPrinter.h
ARMBaseInstrInfo.cpp.REMOVED.git-id
ARMBaseInstrInfo.h
ARMBaseRegisterInfo.cpp
ARMBaseRegisterInfo.h
ARMBasicBlockInfo.h
ARMCallLowering.cpp
ARMCallLowering.h
ARMCallingConv.h
ARMCallingConv.td
ARMComputeBlockSize.cpp
ARMConstantIslandPass.cpp
ARMConstantPoolValue.cpp
ARMConstantPoolValue.h
ARMExpandPseudoInsts.cpp
ARMFastISel.cpp.REMOVED.git-id
ARMFeatures.h
ARMFrameLowering.cpp
ARMFrameLowering.h
ARMHazardRecognizer.cpp
ARMHazardRecognizer.h
ARMISelDAGToDAG.cpp.REMOVED.git-id
ARMISelLowering.cpp.REMOVED.git-id
ARMISelLowering.h
ARMInstrFormats.td
ARMInstrInfo.cpp
ARMInstrInfo.h
ARMInstrInfo.td.REMOVED.git-id
ARMInstrNEON.td.REMOVED.git-id
ARMInstrThumb.td
ARMInstrThumb2.td.REMOVED.git-id
ARMInstrVFP.td
ARMInstructionSelector.cpp
ARMLegalizerInfo.cpp
ARMLegalizerInfo.h
ARMLoadStoreOptimizer.cpp
ARMMCInstLower.cpp
ARMMachineFunctionInfo.cpp
ARMMachineFunctionInfo.h
ARMMacroFusion.cpp
ARMMacroFusion.h
ARMOptimizeBarriersPass.cpp
ARMPerfectShuffle.h.REMOVED.git-id
ARMRegisterBankInfo.cpp
ARMRegisterBankInfo.h
ARMRegisterBanks.td
ARMRegisterInfo.cpp
ARMRegisterInfo.h
ARMRegisterInfo.td
ARMSchedule.td
ARMScheduleA57.td
ARMScheduleA57WriteRes.td
ARMScheduleA8.td
ARMScheduleA9.td.REMOVED.git-id
ARMScheduleM3.td
ARMScheduleR52.td
ARMScheduleSwift.td
ARMScheduleV6.td
ARMSelectionDAGInfo.cpp
ARMSelectionDAGInfo.h
ARMSubtarget.cpp
ARMSubtarget.h
ARMSystemRegister.td
ARMTargetMachine.cpp
ARMTargetMachine.h
ARMTargetObjectFile.cpp
ARMTargetObjectFile.h
ARMTargetTransformInfo.cpp
ARMTargetTransformInfo.h
CMakeLists.txt
LICENSE.TXT
LLVMBuild.txt
MLxExpansionPass.cpp
README-Thumb.txt
README-Thumb2.txt
README.txt
Thumb1FrameLowering.cpp
Thumb1FrameLowering.h
Thumb1InstrInfo.cpp
Thumb1InstrInfo.h
Thumb2ITBlockPass.cpp
Thumb2InstrInfo.cpp
Thumb2InstrInfo.h
Thumb2SizeReduction.cpp
ThumbRegisterInfo.cpp
ThumbRegisterInfo.h
AVR
BPF
Hexagon
Lanai
MSP430
Mips
NVPTX
Nios2
PowerPC
RISCV
Sparc
SystemZ
WebAssembly
X86
XCore
CMakeLists.txt
LLVMBuild.txt
README.txt
Target.cpp
TargetIntrinsicInfo.cpp
TargetLoweringObjectFile.cpp
TargetMachine.cpp
TargetMachineC.cpp
Testing
ToolDrivers
Transforms
WindowsManifest
XRay
CMakeLists.txt
LLVMBuild.txt
projects
resources
runtimes
scripts
test
tools
unittests
utils
.arcconfig
.clang-format
.clang-tidy
.gitattributes
.gitignore
CMakeLists.txt
CODE_OWNERS.TXT
CREDITS.TXT
LICENSE.TXT
LLVMBuild.txt
README.txt
RELEASE_TESTERS.TXT
configure
llvm.spec.in
version.txt.in
nuget
openmp
polly
Directory.Build.props
Directory.Build.targets
NuGet.config
azure-pipelines.yml
build.cmd
build.sh
dir.common.props
global.json
llvm.proj
mxe-Win64.cmake.in
nuget-buildtasks
nunit-lite
roslyn-binaries
rx
xunit-binaries
how-to-bump-roslyn-binaries.md
ikvm-native
llvm
m4
man
mcs
mono
msvc
netcore
po
runtime
samples
scripts
support
tools
COPYING.LIB
LICENSE
Makefile.am
Makefile.in
NEWS
README.md
acinclude.m4
aclocal.m4
autogen.sh
code_of_conduct.md
compile
config.guess
config.h.in
config.rpath
config.sub
configure.REMOVED.git-id
configure.ac.REMOVED.git-id
depcomp
install-sh
ltmain.sh.REMOVED.git-id
missing
mkinstalldirs
mono-uninstalled.pc.in
test-driver
winconfig.h
257 lines
9.2 KiB
C++
257 lines
9.2 KiB
C++
//===-- ARMSelectionDAGInfo.cpp - ARM SelectionDAG Info -------------------===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements the ARMSelectionDAGInfo class.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "ARMTargetMachine.h"
|
|
#include "llvm/CodeGen/SelectionDAG.h"
|
|
#include "llvm/IR/DerivedTypes.h"
|
|
using namespace llvm;
|
|
|
|
#define DEBUG_TYPE "arm-selectiondag-info"
|
|
|
|
// Emit, if possible, a specialized version of the given Libcall. Typically this
|
|
// means selecting the appropriately aligned version, but we also convert memset
|
|
// of 0 into memclr.
|
|
SDValue ARMSelectionDAGInfo::EmitSpecializedLibcall(
|
|
SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src,
|
|
SDValue Size, unsigned Align, RTLIB::Libcall LC) const {
|
|
const ARMSubtarget &Subtarget =
|
|
DAG.getMachineFunction().getSubtarget<ARMSubtarget>();
|
|
const ARMTargetLowering *TLI = Subtarget.getTargetLowering();
|
|
|
|
// Only use a specialized AEABI function if the default version of this
|
|
// Libcall is an AEABI function.
|
|
if (std::strncmp(TLI->getLibcallName(LC), "__aeabi", 7) != 0)
|
|
return SDValue();
|
|
|
|
// Translate RTLIB::Libcall to AEABILibcall. We only do this in order to be
|
|
// able to translate memset to memclr and use the value to index the function
|
|
// name array.
|
|
enum {
|
|
AEABI_MEMCPY = 0,
|
|
AEABI_MEMMOVE,
|
|
AEABI_MEMSET,
|
|
AEABI_MEMCLR
|
|
} AEABILibcall;
|
|
switch (LC) {
|
|
case RTLIB::MEMCPY:
|
|
AEABILibcall = AEABI_MEMCPY;
|
|
break;
|
|
case RTLIB::MEMMOVE:
|
|
AEABILibcall = AEABI_MEMMOVE;
|
|
break;
|
|
case RTLIB::MEMSET:
|
|
AEABILibcall = AEABI_MEMSET;
|
|
if (ConstantSDNode *ConstantSrc = dyn_cast<ConstantSDNode>(Src))
|
|
if (ConstantSrc->getZExtValue() == 0)
|
|
AEABILibcall = AEABI_MEMCLR;
|
|
break;
|
|
default:
|
|
return SDValue();
|
|
}
|
|
|
|
// Choose the most-aligned libcall variant that we can
|
|
enum {
|
|
ALIGN1 = 0,
|
|
ALIGN4,
|
|
ALIGN8
|
|
} AlignVariant;
|
|
if ((Align & 7) == 0)
|
|
AlignVariant = ALIGN8;
|
|
else if ((Align & 3) == 0)
|
|
AlignVariant = ALIGN4;
|
|
else
|
|
AlignVariant = ALIGN1;
|
|
|
|
TargetLowering::ArgListTy Args;
|
|
TargetLowering::ArgListEntry Entry;
|
|
Entry.Ty = DAG.getDataLayout().getIntPtrType(*DAG.getContext());
|
|
Entry.Node = Dst;
|
|
Args.push_back(Entry);
|
|
if (AEABILibcall == AEABI_MEMCLR) {
|
|
Entry.Node = Size;
|
|
Args.push_back(Entry);
|
|
} else if (AEABILibcall == AEABI_MEMSET) {
|
|
// Adjust parameters for memset, EABI uses format (ptr, size, value),
|
|
// GNU library uses (ptr, value, size)
|
|
// See RTABI section 4.3.4
|
|
Entry.Node = Size;
|
|
Args.push_back(Entry);
|
|
|
|
// Extend or truncate the argument to be an i32 value for the call.
|
|
if (Src.getValueType().bitsGT(MVT::i32))
|
|
Src = DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, Src);
|
|
else if (Src.getValueType().bitsLT(MVT::i32))
|
|
Src = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i32, Src);
|
|
|
|
Entry.Node = Src;
|
|
Entry.Ty = Type::getInt32Ty(*DAG.getContext());
|
|
Entry.IsSExt = false;
|
|
Args.push_back(Entry);
|
|
} else {
|
|
Entry.Node = Src;
|
|
Args.push_back(Entry);
|
|
|
|
Entry.Node = Size;
|
|
Args.push_back(Entry);
|
|
}
|
|
|
|
char const *FunctionNames[4][3] = {
|
|
{ "__aeabi_memcpy", "__aeabi_memcpy4", "__aeabi_memcpy8" },
|
|
{ "__aeabi_memmove", "__aeabi_memmove4", "__aeabi_memmove8" },
|
|
{ "__aeabi_memset", "__aeabi_memset4", "__aeabi_memset8" },
|
|
{ "__aeabi_memclr", "__aeabi_memclr4", "__aeabi_memclr8" }
|
|
};
|
|
TargetLowering::CallLoweringInfo CLI(DAG);
|
|
CLI.setDebugLoc(dl)
|
|
.setChain(Chain)
|
|
.setLibCallee(
|
|
TLI->getLibcallCallingConv(LC), Type::getVoidTy(*DAG.getContext()),
|
|
DAG.getExternalSymbol(FunctionNames[AEABILibcall][AlignVariant],
|
|
TLI->getPointerTy(DAG.getDataLayout())),
|
|
std::move(Args))
|
|
.setDiscardResult();
|
|
std::pair<SDValue,SDValue> CallResult = TLI->LowerCallTo(CLI);
|
|
|
|
return CallResult.second;
|
|
}
|
|
|
|
SDValue ARMSelectionDAGInfo::EmitTargetCodeForMemcpy(
|
|
SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src,
|
|
SDValue Size, unsigned Align, bool isVolatile, bool AlwaysInline,
|
|
MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo) const {
|
|
const ARMSubtarget &Subtarget =
|
|
DAG.getMachineFunction().getSubtarget<ARMSubtarget>();
|
|
// Do repeated 4-byte loads and stores. To be improved.
|
|
// This requires 4-byte alignment.
|
|
if ((Align & 3) != 0)
|
|
return SDValue();
|
|
// This requires the copy size to be a constant, preferably
|
|
// within a subtarget-specific limit.
|
|
ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
|
|
if (!ConstantSize)
|
|
return EmitSpecializedLibcall(DAG, dl, Chain, Dst, Src, Size, Align,
|
|
RTLIB::MEMCPY);
|
|
uint64_t SizeVal = ConstantSize->getZExtValue();
|
|
if (!AlwaysInline && SizeVal > Subtarget.getMaxInlineSizeThreshold())
|
|
return EmitSpecializedLibcall(DAG, dl, Chain, Dst, Src, Size, Align,
|
|
RTLIB::MEMCPY);
|
|
|
|
unsigned BytesLeft = SizeVal & 3;
|
|
unsigned NumMemOps = SizeVal >> 2;
|
|
unsigned EmittedNumMemOps = 0;
|
|
EVT VT = MVT::i32;
|
|
unsigned VTSize = 4;
|
|
unsigned i = 0;
|
|
// Emit a maximum of 4 loads in Thumb1 since we have fewer registers
|
|
const unsigned MaxLoadsInLDM = Subtarget.isThumb1Only() ? 4 : 6;
|
|
SDValue TFOps[6];
|
|
SDValue Loads[6];
|
|
uint64_t SrcOff = 0, DstOff = 0;
|
|
|
|
// FIXME: We should invent a VMEMCPY pseudo-instruction that lowers to
|
|
// VLDM/VSTM and make this code emit it when appropriate. This would reduce
|
|
// pressure on the general purpose registers. However this seems harder to map
|
|
// onto the register allocator's view of the world.
|
|
|
|
// The number of MEMCPY pseudo-instructions to emit. We use up to
|
|
// MaxLoadsInLDM registers per mcopy, which will get lowered into ldm/stm
|
|
// later on. This is a lower bound on the number of MEMCPY operations we must
|
|
// emit.
|
|
unsigned NumMEMCPYs = (NumMemOps + MaxLoadsInLDM - 1) / MaxLoadsInLDM;
|
|
|
|
// Code size optimisation: do not inline memcpy if expansion results in
|
|
// more instructions than the libary call.
|
|
if (NumMEMCPYs > 1 && DAG.getMachineFunction().getFunction().optForMinSize()) {
|
|
return SDValue();
|
|
}
|
|
|
|
SDVTList VTs = DAG.getVTList(MVT::i32, MVT::i32, MVT::Other, MVT::Glue);
|
|
|
|
for (unsigned I = 0; I != NumMEMCPYs; ++I) {
|
|
// Evenly distribute registers among MEMCPY operations to reduce register
|
|
// pressure.
|
|
unsigned NextEmittedNumMemOps = NumMemOps * (I + 1) / NumMEMCPYs;
|
|
unsigned NumRegs = NextEmittedNumMemOps - EmittedNumMemOps;
|
|
|
|
Dst = DAG.getNode(ARMISD::MEMCPY, dl, VTs, Chain, Dst, Src,
|
|
DAG.getConstant(NumRegs, dl, MVT::i32));
|
|
Src = Dst.getValue(1);
|
|
Chain = Dst.getValue(2);
|
|
|
|
DstPtrInfo = DstPtrInfo.getWithOffset(NumRegs * VTSize);
|
|
SrcPtrInfo = SrcPtrInfo.getWithOffset(NumRegs * VTSize);
|
|
|
|
EmittedNumMemOps = NextEmittedNumMemOps;
|
|
}
|
|
|
|
if (BytesLeft == 0)
|
|
return Chain;
|
|
|
|
// Issue loads / stores for the trailing (1 - 3) bytes.
|
|
auto getRemainingValueType = [](unsigned BytesLeft) {
|
|
return (BytesLeft >= 2) ? MVT::i16 : MVT::i8;
|
|
};
|
|
auto getRemainingSize = [](unsigned BytesLeft) {
|
|
return (BytesLeft >= 2) ? 2 : 1;
|
|
};
|
|
|
|
unsigned BytesLeftSave = BytesLeft;
|
|
i = 0;
|
|
while (BytesLeft) {
|
|
VT = getRemainingValueType(BytesLeft);
|
|
VTSize = getRemainingSize(BytesLeft);
|
|
Loads[i] = DAG.getLoad(VT, dl, Chain,
|
|
DAG.getNode(ISD::ADD, dl, MVT::i32, Src,
|
|
DAG.getConstant(SrcOff, dl, MVT::i32)),
|
|
SrcPtrInfo.getWithOffset(SrcOff));
|
|
TFOps[i] = Loads[i].getValue(1);
|
|
++i;
|
|
SrcOff += VTSize;
|
|
BytesLeft -= VTSize;
|
|
}
|
|
Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
|
|
makeArrayRef(TFOps, i));
|
|
|
|
i = 0;
|
|
BytesLeft = BytesLeftSave;
|
|
while (BytesLeft) {
|
|
VT = getRemainingValueType(BytesLeft);
|
|
VTSize = getRemainingSize(BytesLeft);
|
|
TFOps[i] = DAG.getStore(Chain, dl, Loads[i],
|
|
DAG.getNode(ISD::ADD, dl, MVT::i32, Dst,
|
|
DAG.getConstant(DstOff, dl, MVT::i32)),
|
|
DstPtrInfo.getWithOffset(DstOff));
|
|
++i;
|
|
DstOff += VTSize;
|
|
BytesLeft -= VTSize;
|
|
}
|
|
return DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
|
|
makeArrayRef(TFOps, i));
|
|
}
|
|
|
|
SDValue ARMSelectionDAGInfo::EmitTargetCodeForMemmove(
|
|
SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src,
|
|
SDValue Size, unsigned Align, bool isVolatile,
|
|
MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo) const {
|
|
return EmitSpecializedLibcall(DAG, dl, Chain, Dst, Src, Size, Align,
|
|
RTLIB::MEMMOVE);
|
|
}
|
|
|
|
SDValue ARMSelectionDAGInfo::EmitTargetCodeForMemset(
|
|
SelectionDAG &DAG, const SDLoc &dl, SDValue Chain, SDValue Dst, SDValue Src,
|
|
SDValue Size, unsigned Align, bool isVolatile,
|
|
MachinePointerInfo DstPtrInfo) const {
|
|
return EmitSpecializedLibcall(DAG, dl, Chain, Dst, Src, Size, Align,
|
|
RTLIB::MEMSET);
|
|
}
|