10b57cec5SDimitry Andric //===-- AMDGPUMachineFunctionInfo.cpp ---------------------------------------=//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric
90b57cec5SDimitry Andric #include "AMDGPUMachineFunction.h"
100b57cec5SDimitry Andric #include "AMDGPUPerfHintAnalysis.h"
11af732203SDimitry Andric #include "AMDGPUSubtarget.h"
120b57cec5SDimitry Andric #include "llvm/CodeGen/MachineModuleInfo.h"
13af732203SDimitry Andric #include "llvm/Target/TargetMachine.h"
140b57cec5SDimitry Andric
150b57cec5SDimitry Andric using namespace llvm;
160b57cec5SDimitry Andric
AMDGPUMachineFunction(const MachineFunction & MF)17af732203SDimitry Andric AMDGPUMachineFunction::AMDGPUMachineFunction(const MachineFunction &MF)
18af732203SDimitry Andric : MachineFunctionInfo(), Mode(MF.getFunction()),
19af732203SDimitry Andric IsEntryFunction(
20af732203SDimitry Andric AMDGPU::isEntryFunctionCC(MF.getFunction().getCallingConv())),
21af732203SDimitry Andric IsModuleEntryFunction(
22af732203SDimitry Andric AMDGPU::isModuleEntryFunctionCC(MF.getFunction().getCallingConv())),
235ffd83dbSDimitry Andric NoSignedZerosFPMath(MF.getTarget().Options.NoSignedZerosFPMath) {
240b57cec5SDimitry Andric const AMDGPUSubtarget &ST = AMDGPUSubtarget::get(MF);
250b57cec5SDimitry Andric
260b57cec5SDimitry Andric // FIXME: Should initialize KernArgSize based on ExplicitKernelArgOffset,
270b57cec5SDimitry Andric // except reserved size is not correctly aligned.
280b57cec5SDimitry Andric const Function &F = MF.getFunction();
290b57cec5SDimitry Andric
300b57cec5SDimitry Andric Attribute MemBoundAttr = F.getFnAttribute("amdgpu-memory-bound");
31*5f7ddb14SDimitry Andric MemoryBound = MemBoundAttr.getValueAsBool();
320b57cec5SDimitry Andric
330b57cec5SDimitry Andric Attribute WaveLimitAttr = F.getFnAttribute("amdgpu-wave-limiter");
34*5f7ddb14SDimitry Andric WaveLimiter = WaveLimitAttr.getValueAsBool();
350b57cec5SDimitry Andric
360b57cec5SDimitry Andric CallingConv::ID CC = F.getCallingConv();
370b57cec5SDimitry Andric if (CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL)
380b57cec5SDimitry Andric ExplicitKernArgSize = ST.getExplicitKernArgSize(F, MaxKernArgAlign);
390b57cec5SDimitry Andric }
400b57cec5SDimitry Andric
allocateLDSGlobal(const DataLayout & DL,const GlobalVariable & GV)410b57cec5SDimitry Andric unsigned AMDGPUMachineFunction::allocateLDSGlobal(const DataLayout &DL,
425ffd83dbSDimitry Andric const GlobalVariable &GV) {
430b57cec5SDimitry Andric auto Entry = LocalMemoryObjects.insert(std::make_pair(&GV, 0));
440b57cec5SDimitry Andric if (!Entry.second)
450b57cec5SDimitry Andric return Entry.first->second;
460b57cec5SDimitry Andric
475ffd83dbSDimitry Andric Align Alignment =
485ffd83dbSDimitry Andric DL.getValueOrABITypeAlignment(GV.getAlign(), GV.getValueType());
490b57cec5SDimitry Andric
500b57cec5SDimitry Andric /// TODO: We should sort these to minimize wasted space due to alignment
510b57cec5SDimitry Andric /// padding. Currently the padding is decided by the first encountered use
520b57cec5SDimitry Andric /// during lowering.
53af732203SDimitry Andric unsigned Offset = StaticLDSSize = alignTo(StaticLDSSize, Alignment);
540b57cec5SDimitry Andric
550b57cec5SDimitry Andric Entry.first->second = Offset;
56af732203SDimitry Andric StaticLDSSize += DL.getTypeAllocSize(GV.getValueType());
57af732203SDimitry Andric
58af732203SDimitry Andric // Update the LDS size considering the padding to align the dynamic shared
59af732203SDimitry Andric // memory.
60af732203SDimitry Andric LDSSize = alignTo(StaticLDSSize, DynLDSAlign);
610b57cec5SDimitry Andric
620b57cec5SDimitry Andric return Offset;
630b57cec5SDimitry Andric }
64af732203SDimitry Andric
allocateModuleLDSGlobal(const Module * M)65*5f7ddb14SDimitry Andric void AMDGPUMachineFunction::allocateModuleLDSGlobal(const Module *M) {
66*5f7ddb14SDimitry Andric if (isModuleEntryFunction()) {
67*5f7ddb14SDimitry Andric const GlobalVariable *GV = M->getNamedGlobal("llvm.amdgcn.module.lds");
68*5f7ddb14SDimitry Andric if (GV) {
69*5f7ddb14SDimitry Andric unsigned Offset = allocateLDSGlobal(M->getDataLayout(), *GV);
70*5f7ddb14SDimitry Andric (void)Offset;
71*5f7ddb14SDimitry Andric assert(Offset == 0 &&
72*5f7ddb14SDimitry Andric "Module LDS expected to be allocated before other LDS");
73*5f7ddb14SDimitry Andric }
74*5f7ddb14SDimitry Andric }
75*5f7ddb14SDimitry Andric }
76*5f7ddb14SDimitry Andric
setDynLDSAlign(const DataLayout & DL,const GlobalVariable & GV)77af732203SDimitry Andric void AMDGPUMachineFunction::setDynLDSAlign(const DataLayout &DL,
78af732203SDimitry Andric const GlobalVariable &GV) {
79af732203SDimitry Andric assert(DL.getTypeAllocSize(GV.getValueType()).isZero());
80af732203SDimitry Andric
81af732203SDimitry Andric Align Alignment =
82af732203SDimitry Andric DL.getValueOrABITypeAlignment(GV.getAlign(), GV.getValueType());
83af732203SDimitry Andric if (Alignment <= DynLDSAlign)
84af732203SDimitry Andric return;
85af732203SDimitry Andric
86af732203SDimitry Andric LDSSize = alignTo(StaticLDSSize, Alignment);
87af732203SDimitry Andric DynLDSAlign = Alignment;
88af732203SDimitry Andric }
89