//===- AMDGPULDSUtils.cpp -------------------------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // AMDGPU LDS related helper utility functions. // //===----------------------------------------------------------------------===// #include "AMDGPULDSUtils.h" #include "AMDGPU.h" #include "Utils/AMDGPUBaseInfo.h" #include "llvm/ADT/DepthFirstIterator.h" #include "llvm/ADT/SetVector.h" #include "llvm/IR/Constants.h" #include "llvm/IR/ReplaceConstant.h" using namespace llvm; namespace llvm { namespace AMDGPU { bool isKernelCC(const Function *Func) { return AMDGPU::isModuleEntryFunctionCC(Func->getCallingConv()); } Align getAlign(DataLayout const &DL, const GlobalVariable *GV) { return DL.getValueOrABITypeAlignment(GV->getPointerAlignment(DL), GV->getValueType()); } static void collectFunctionUses(User *U, const Function *F, SetVector &InstUsers) { SmallVector Stack{U}; while (!Stack.empty()) { U = Stack.pop_back_val(); if (auto *I = dyn_cast(U)) { if (I->getFunction() == F) InstUsers.insert(I); continue; } if (!isa(U)) continue; append_range(Stack, U->users()); } } void replaceConstantUsesInFunction(ConstantExpr *C, const Function *F) { SetVector InstUsers; collectFunctionUses(C, F, InstUsers); for (Instruction *I : InstUsers) { convertConstantExprsToInstructions(I, C); } } static bool shouldLowerLDSToStruct(const GlobalVariable &GV, const Function *F) { // We are not interested in kernel LDS lowering for module LDS itself. if (F && GV.getName() == "llvm.amdgcn.module.lds") return false; bool Ret = false; SmallPtrSet Visited; SmallVector Stack(GV.users()); assert(!F || isKernelCC(F)); while (!Stack.empty()) { const User *V = Stack.pop_back_val(); Visited.insert(V); if (isa(V)) { // This use of the LDS variable is the initializer of a global variable. // This is ill formed. The address of an LDS variable is kernel dependent // and unknown until runtime. It can't be written to a global variable. continue; } if (auto *I = dyn_cast(V)) { const Function *UF = I->getFunction(); if (UF == F) { // Used from this kernel, we want to put it into the structure. Ret = true; } else if (!F) { // For module LDS lowering, lowering is required if the user instruction // is from non-kernel function. Ret |= !isKernelCC(UF); } continue; } // User V should be a constant, recursively visit users of V. assert(isa(V) && "Expected a constant."); append_range(Stack, V->users()); } return Ret; } std::vector findVariablesToLower(Module &M, const Function *F) { std::vector LocalVars; for (auto &GV : M.globals()) { if (GV.getType()->getPointerAddressSpace() != AMDGPUAS::LOCAL_ADDRESS) { continue; } if (!GV.hasInitializer()) { // addrspace(3) without initializer implies cuda/hip extern __shared__ // the semantics for such a variable appears to be that all extern // __shared__ variables alias one another, in which case this transform // is not required continue; } if (!isa(GV.getInitializer())) { // Initializers are unimplemented for LDS address space. // Leave such variables in place for consistent error reporting. continue; } if (GV.isConstant()) { // A constant undef variable can't be written to, and any load is // undef, so it should be eliminated by the optimizer. It could be // dropped by the back end if not. This pass skips over it. continue; } if (!shouldLowerLDSToStruct(GV, F)) { continue; } LocalVars.push_back(&GV); } return LocalVars; } } // end namespace AMDGPU } // end namespace llvm