AMDGPUMachineFunction.cpp revision 360660
//===-- AMDGPUMachineFunction.cpp -------------------------------------------=//
2263348Sjmmv//
3263348Sjmmv// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4263348Sjmmv// See https://llvm.org/LICENSE.txt for license information.
5263348Sjmmv// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6263348Sjmmv//
7263348Sjmmv//===----------------------------------------------------------------------===//
8263348Sjmmv
9263348Sjmmv#include "AMDGPUMachineFunction.h"
10263348Sjmmv#include "AMDGPUSubtarget.h"
11263348Sjmmv#include "AMDGPUPerfHintAnalysis.h"
12263348Sjmmv#include "llvm/CodeGen/MachineModuleInfo.h"
13263348Sjmmv
14263348Sjmmvusing namespace llvm;
15263348Sjmmv
16263348SjmmvAMDGPUMachineFunction::AMDGPUMachineFunction(const MachineFunction &MF) :
17263348Sjmmv  MachineFunctionInfo(),
18263348Sjmmv  LocalMemoryObjects(),
19263348Sjmmv  ExplicitKernArgSize(0),
20263348Sjmmv  MaxKernArgAlign(0),
21263348Sjmmv  LDSSize(0),
22263348Sjmmv  IsEntryFunction(AMDGPU::isEntryFunctionCC(MF.getFunction().getCallingConv())),
23263348Sjmmv  NoSignedZerosFPMath(MF.getTarget().Options.NoSignedZerosFPMath),
24263348Sjmmv  MemoryBound(false),
25263348Sjmmv  WaveLimiter(false) {
26263348Sjmmv  const AMDGPUSubtarget &ST = AMDGPUSubtarget::get(MF);
27263348Sjmmv
28263348Sjmmv  // FIXME: Should initialize KernArgSize based on ExplicitKernelArgOffset,
29263348Sjmmv  // except reserved size is not correctly aligned.
30263348Sjmmv  const Function &F = MF.getFunction();
31263348Sjmmv
32263348Sjmmv  Attribute MemBoundAttr = F.getFnAttribute("amdgpu-memory-bound");
33  MemoryBound = MemBoundAttr.isStringAttribute() &&
34                MemBoundAttr.getValueAsString() == "true";
35
36  Attribute WaveLimitAttr = F.getFnAttribute("amdgpu-wave-limiter");
37  WaveLimiter = WaveLimitAttr.isStringAttribute() &&
38                WaveLimitAttr.getValueAsString() == "true";
39
40  CallingConv::ID CC = F.getCallingConv();
41  if (CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL)
42    ExplicitKernArgSize = ST.getExplicitKernArgSize(F, MaxKernArgAlign);
43}
44
45unsigned AMDGPUMachineFunction::allocateLDSGlobal(const DataLayout &DL,
46                                                  const GlobalValue &GV) {
47  auto Entry = LocalMemoryObjects.insert(std::make_pair(&GV, 0));
48  if (!Entry.second)
49    return Entry.first->second;
50
51  unsigned Align = GV.getAlignment();
52  if (Align == 0)
53    Align = DL.getABITypeAlignment(GV.getValueType());
54
55  /// TODO: We should sort these to minimize wasted space due to alignment
56  /// padding. Currently the padding is decided by the first encountered use
57  /// during lowering.
58  unsigned Offset = LDSSize = alignTo(LDSSize, Align);
59
60  Entry.first->second = Offset;
61  LDSSize += DL.getTypeAllocSize(GV.getValueType());
62
63  return Offset;
64}
65