2017-08-09 01:53:55 +02:00
|
|
|
//===- AMDGPUAliasAnalysis ------------------------------------------------===//
|
2017-03-18 00:56:58 +01:00
|
|
|
//
|
2019-01-19 09:50:56 +01:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2017-03-18 00:56:58 +01:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
/// \file
|
|
|
|
/// This is the AMGPU address space based alias analysis pass.
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "AMDGPUAliasAnalysis.h"
|
2017-06-06 13:49:48 +02:00
|
|
|
#include "llvm/Analysis/ValueTracking.h"
|
2020-12-09 13:06:50 +01:00
|
|
|
#include "llvm/IR/Instructions.h"
|
2017-03-18 00:56:58 +01:00
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
|
|
|
|
#define DEBUG_TYPE "amdgpu-aa"
|
|
|
|
|
2020-12-29 21:30:25 +01:00
|
|
|
AnalysisKey AMDGPUAA::Key;
|
|
|
|
|
2017-03-18 00:56:58 +01:00
|
|
|
// Register this pass...
|
|
|
|
char AMDGPUAAWrapperPass::ID = 0;
|
2018-11-07 21:26:42 +01:00
|
|
|
char AMDGPUExternalAAWrapper::ID = 0;
|
2017-08-09 01:53:55 +02:00
|
|
|
|
2017-03-18 00:56:58 +01:00
|
|
|
INITIALIZE_PASS(AMDGPUAAWrapperPass, "amdgpu-aa",
|
|
|
|
"AMDGPU Address space based Alias Analysis", false, true)
|
|
|
|
|
2018-11-07 21:26:42 +01:00
|
|
|
INITIALIZE_PASS(AMDGPUExternalAAWrapper, "amdgpu-aa-wrapper",
|
|
|
|
"AMDGPU Address space based Alias Analysis Wrapper", false, true)
|
|
|
|
|
2017-03-18 00:56:58 +01:00
|
|
|
ImmutablePass *llvm::createAMDGPUAAWrapperPass() {
|
|
|
|
return new AMDGPUAAWrapperPass();
|
|
|
|
}
|
|
|
|
|
2018-11-07 21:26:42 +01:00
|
|
|
ImmutablePass *llvm::createAMDGPUExternalAAWrapperPass() {
|
|
|
|
return new AMDGPUExternalAAWrapper();
|
|
|
|
}
|
|
|
|
|
2017-03-18 00:56:58 +01:00
|
|
|
void AMDGPUAAWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {
|
|
|
|
AU.setPreservesAll();
|
|
|
|
}
|
|
|
|
|
2018-09-11 06:00:49 +02:00
|
|
|
static AliasResult getAliasResult(unsigned AS1, unsigned AS2) {
|
2019-03-18 15:44:28 +01:00
|
|
|
static_assert(AMDGPUAS::MAX_AMDGPU_ADDRESS <= 7, "Addr space out of range");
|
2018-08-31 07:49:54 +02:00
|
|
|
|
2018-09-11 06:00:49 +02:00
|
|
|
if (AS1 > AMDGPUAS::MAX_AMDGPU_ADDRESS || AS2 > AMDGPUAS::MAX_AMDGPU_ADDRESS)
|
2021-03-05 11:58:13 +01:00
|
|
|
return AliasResult::MayAlias;
|
|
|
|
|
|
|
|
#define ASMay AliasResult::MayAlias
|
|
|
|
#define ASNo AliasResult::NoAlias
|
|
|
|
// This array is indexed by address space value enum elements 0 ... to 7
|
|
|
|
static const AliasResult ASAliasRules[8][8] = {
|
|
|
|
/* Flat Global Region Group Constant Private Const32 Buf Fat Ptr */
|
|
|
|
/* Flat */ {ASMay, ASMay, ASNo, ASMay, ASMay, ASMay, ASMay, ASMay},
|
|
|
|
/* Global */ {ASMay, ASMay, ASNo, ASNo, ASMay, ASNo, ASMay, ASMay},
|
|
|
|
/* Region */ {ASNo, ASNo, ASMay, ASNo, ASNo, ASNo, ASNo, ASNo},
|
|
|
|
/* Group */ {ASMay, ASNo, ASNo, ASMay, ASNo, ASNo, ASNo, ASNo},
|
|
|
|
/* Constant */ {ASMay, ASMay, ASNo, ASNo, ASNo, ASNo, ASMay, ASMay},
|
|
|
|
/* Private */ {ASMay, ASNo, ASNo, ASNo, ASNo, ASMay, ASNo, ASNo},
|
|
|
|
/* Constant 32-bit */ {ASMay, ASMay, ASNo, ASNo, ASMay, ASNo, ASNo, ASMay},
|
|
|
|
/* Buffer Fat Ptr */ {ASMay, ASMay, ASNo, ASNo, ASMay, ASNo, ASMay, ASMay}
|
|
|
|
};
|
|
|
|
#undef ASMay
|
|
|
|
#undef ASNo
|
2017-03-31 21:26:23 +02:00
|
|
|
|
2018-09-11 06:00:49 +02:00
|
|
|
return ASAliasRules[AS1][AS2];
|
2017-03-27 16:04:01 +02:00
|
|
|
}
|
|
|
|
|
2017-03-18 00:56:58 +01:00
|
|
|
AliasResult AMDGPUAAResult::alias(const MemoryLocation &LocA,
|
[AliasAnalysis] Second prototype to cache BasicAA / anyAA state.
Summary:
Adding contained caching to AliasAnalysis. BasicAA is currently the only one using it.
AA changes:
- This patch is pulling the caches from BasicAAResults to AAResults, meaning the getModRefInfo call benefits from the IsCapturedCache as well when in "batch mode".
- All AAResultBase implementations add the QueryInfo member to all APIs. AAResults APIs maintain wrapper APIs such that all alias()/getModRefInfo call sites are unchanged.
- AA now provides a BatchAAResults type as a wrapper to AAResults. It keeps the AAResults instance and a QueryInfo instantiated to batch mode. It delegates all work to the AAResults instance with the batched QueryInfo. More API wrappers may be needed in BatchAAResults; only the minimum needed is currently added.
MemorySSA changes:
- All walkers are now templated on the AA used (AliasAnalysis=AAResults or BatchAAResults).
- At build time, we optimize uses; now we create a local walker (lives only as long as OptimizeUses does) using BatchAAResults.
- All Walkers have an internal AA and only use that now, never the AA in MemorySSA. The Walkers receive the AA they will use when built.
- The walker we use for queries after the build is instantiated on AliasAnalysis and is built after building MemorySSA and setting AA.
- All static methods doing walking are now templated on AliasAnalysisType if they are used both during build and after. If used only during build, the method now only takes a BatchAAResults. If used only after build, the method now takes an AliasAnalysis.
Subscribers: sanjoy, arsenm, jvesely, nhaehnle, jlebar, george.burgess.iv, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59315
llvm-svn: 356783
2019-03-22 18:22:19 +01:00
|
|
|
const MemoryLocation &LocB,
|
|
|
|
AAQueryInfo &AAQI) {
|
2017-03-18 00:56:58 +01:00
|
|
|
unsigned asA = LocA.Ptr->getType()->getPointerAddressSpace();
|
|
|
|
unsigned asB = LocB.Ptr->getType()->getPointerAddressSpace();
|
|
|
|
|
2018-09-11 06:00:49 +02:00
|
|
|
AliasResult Result = getAliasResult(asA, asB);
|
2021-03-05 11:58:13 +01:00
|
|
|
if (Result == AliasResult::NoAlias)
|
2018-09-11 06:00:49 +02:00
|
|
|
return Result;
|
2017-03-18 00:56:58 +01:00
|
|
|
|
2020-10-09 00:46:00 +02:00
|
|
|
// In general, FLAT (generic) pointers could be aliased to LOCAL or PRIVATE
|
|
|
|
// pointers. However, as LOCAL or PRIVATE pointers point to local objects, in
|
|
|
|
// certain cases, it's still viable to check whether a FLAT pointer won't
|
|
|
|
// alias to a LOCAL or PRIVATE pointer.
|
|
|
|
MemoryLocation A = LocA;
|
|
|
|
MemoryLocation B = LocB;
|
|
|
|
// Canonicalize the location order to simplify the following alias check.
|
|
|
|
if (asA != AMDGPUAS::FLAT_ADDRESS) {
|
|
|
|
std::swap(asA, asB);
|
|
|
|
std::swap(A, B);
|
|
|
|
}
|
|
|
|
if (asA == AMDGPUAS::FLAT_ADDRESS &&
|
|
|
|
(asB == AMDGPUAS::LOCAL_ADDRESS || asB == AMDGPUAS::PRIVATE_ADDRESS)) {
|
|
|
|
const auto *ObjA =
|
2021-02-14 21:24:36 +01:00
|
|
|
getUnderlyingObject(A.Ptr->stripPointerCastsForAliasAnalysis());
|
2020-10-09 00:46:00 +02:00
|
|
|
if (const LoadInst *LI = dyn_cast<LoadInst>(ObjA)) {
|
|
|
|
// If a generic pointer is loaded from the constant address space, it
|
|
|
|
// could only be a GLOBAL or CONSTANT one as that address space is soley
|
|
|
|
// prepared on the host side, where only GLOBAL or CONSTANT variables are
|
|
|
|
// visible. Note that this even holds for regular functions.
|
|
|
|
if (LI->getPointerAddressSpace() == AMDGPUAS::CONSTANT_ADDRESS)
|
2021-03-05 11:58:13 +01:00
|
|
|
return AliasResult::NoAlias;
|
2020-10-09 00:46:00 +02:00
|
|
|
} else if (const Argument *Arg = dyn_cast<Argument>(ObjA)) {
|
|
|
|
const Function *F = Arg->getParent();
|
|
|
|
switch (F->getCallingConv()) {
|
|
|
|
case CallingConv::AMDGPU_KERNEL:
|
|
|
|
// In the kernel function, kernel arguments won't alias to (local)
|
|
|
|
// variables in shared or private address space.
|
2021-03-05 11:58:13 +01:00
|
|
|
return AliasResult::NoAlias;
|
2020-10-09 00:46:00 +02:00
|
|
|
default:
|
|
|
|
// TODO: In the regular function, if that local variable in the
|
|
|
|
// location B is not captured, that argument pointer won't alias to it
|
|
|
|
// as well.
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-03-18 00:56:58 +01:00
|
|
|
// Forward the query to the next alias analysis.
|
[AliasAnalysis] Second prototype to cache BasicAA / anyAA state.
Summary:
Adding contained caching to AliasAnalysis. BasicAA is currently the only one using it.
AA changes:
- This patch is pulling the caches from BasicAAResults to AAResults, meaning the getModRefInfo call benefits from the IsCapturedCache as well when in "batch mode".
- All AAResultBase implementations add the QueryInfo member to all APIs. AAResults APIs maintain wrapper APIs such that all alias()/getModRefInfo call sites are unchanged.
- AA now provides a BatchAAResults type as a wrapper to AAResults. It keeps the AAResults instance and a QueryInfo instantiated to batch mode. It delegates all work to the AAResults instance with the batched QueryInfo. More API wrappers may be needed in BatchAAResults; only the minimum needed is currently added.
MemorySSA changes:
- All walkers are now templated on the AA used (AliasAnalysis=AAResults or BatchAAResults).
- At build time, we optimize uses; now we create a local walker (lives only as long as OptimizeUses does) using BatchAAResults.
- All Walkers have an internal AA and only use that now, never the AA in MemorySSA. The Walkers receive the AA they will use when built.
- The walker we use for queries after the build is instantiated on AliasAnalysis and is built after building MemorySSA and setting AA.
- All static methods doing walking are now templated on AliasAnalysisType if they are used both during build and after. If used only during build, the method now only takes a BatchAAResults. If used only after build, the method now takes an AliasAnalysis.
Subscribers: sanjoy, arsenm, jvesely, nhaehnle, jlebar, george.burgess.iv, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59315
llvm-svn: 356783
2019-03-22 18:22:19 +01:00
|
|
|
return AAResultBase::alias(LocA, LocB, AAQI);
|
2017-03-18 00:56:58 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
bool AMDGPUAAResult::pointsToConstantMemory(const MemoryLocation &Loc,
|
[AliasAnalysis] Second prototype to cache BasicAA / anyAA state.
Summary:
Adding contained caching to AliasAnalysis. BasicAA is currently the only one using it.
AA changes:
- This patch is pulling the caches from BasicAAResults to AAResults, meaning the getModRefInfo call benefits from the IsCapturedCache as well when in "batch mode".
- All AAResultBase implementations add the QueryInfo member to all APIs. AAResults APIs maintain wrapper APIs such that all alias()/getModRefInfo call sites are unchanged.
- AA now provides a BatchAAResults type as a wrapper to AAResults. It keeps the AAResults instance and a QueryInfo instantiated to batch mode. It delegates all work to the AAResults instance with the batched QueryInfo. More API wrappers may be needed in BatchAAResults; only the minimum needed is currently added.
MemorySSA changes:
- All walkers are now templated on the AA used (AliasAnalysis=AAResults or BatchAAResults).
- At build time, we optimize uses; now we create a local walker (lives only as long as OptimizeUses does) using BatchAAResults.
- All Walkers have an internal AA and only use that now, never the AA in MemorySSA. The Walkers receive the AA they will use when built.
- The walker we use for queries after the build is instantiated on AliasAnalysis and is built after building MemorySSA and setting AA.
- All static methods doing walking are now templated on AliasAnalysisType if they are used both during build and after. If used only during build, the method now only takes a BatchAAResults. If used only after build, the method now takes an AliasAnalysis.
Subscribers: sanjoy, arsenm, jvesely, nhaehnle, jlebar, george.burgess.iv, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59315
llvm-svn: 356783
2019-03-22 18:22:19 +01:00
|
|
|
AAQueryInfo &AAQI, bool OrLocal) {
|
2020-05-08 21:53:41 +02:00
|
|
|
unsigned AS = Loc.Ptr->getType()->getPointerAddressSpace();
|
|
|
|
if (AS == AMDGPUAS::CONSTANT_ADDRESS ||
|
|
|
|
AS == AMDGPUAS::CONSTANT_ADDRESS_32BIT)
|
|
|
|
return true;
|
|
|
|
|
2020-07-31 11:09:54 +02:00
|
|
|
const Value *Base = getUnderlyingObject(Loc.Ptr);
|
2020-05-08 21:53:41 +02:00
|
|
|
AS = Base->getType()->getPointerAddressSpace();
|
2018-08-31 07:49:54 +02:00
|
|
|
if (AS == AMDGPUAS::CONSTANT_ADDRESS ||
|
2020-05-08 21:53:41 +02:00
|
|
|
AS == AMDGPUAS::CONSTANT_ADDRESS_32BIT)
|
2017-03-18 00:56:58 +01:00
|
|
|
return true;
|
|
|
|
|
|
|
|
if (const GlobalVariable *GV = dyn_cast<GlobalVariable>(Base)) {
|
|
|
|
if (GV->isConstant())
|
|
|
|
return true;
|
|
|
|
} else if (const Argument *Arg = dyn_cast<Argument>(Base)) {
|
|
|
|
const Function *F = Arg->getParent();
|
|
|
|
|
|
|
|
// Only assume constant memory for arguments on kernels.
|
|
|
|
switch (F->getCallingConv()) {
|
|
|
|
default:
|
[AliasAnalysis] Second prototype to cache BasicAA / anyAA state.
Summary:
Adding contained caching to AliasAnalysis. BasicAA is currently the only one using it.
AA changes:
- This patch is pulling the caches from BasicAAResults to AAResults, meaning the getModRefInfo call benefits from the IsCapturedCache as well when in "batch mode".
- All AAResultBase implementations add the QueryInfo member to all APIs. AAResults APIs maintain wrapper APIs such that all alias()/getModRefInfo call sites are unchanged.
- AA now provides a BatchAAResults type as a wrapper to AAResults. It keeps the AAResults instance and a QueryInfo instantiated to batch mode. It delegates all work to the AAResults instance with the batched QueryInfo. More API wrappers may be needed in BatchAAResults; only the minimum needed is currently added.
MemorySSA changes:
- All walkers are now templated on the AA used (AliasAnalysis=AAResults or BatchAAResults).
- At build time, we optimize uses; now we create a local walker (lives only as long as OptimizeUses does) using BatchAAResults.
- All Walkers have an internal AA and only use that now, never the AA in MemorySSA. The Walkers receive the AA they will use when built.
- The walker we use for queries after the build is instantiated on AliasAnalysis and is built after building MemorySSA and setting AA.
- All static methods doing walking are now templated on AliasAnalysisType if they are used both during build and after. If used only during build, the method now only takes a BatchAAResults. If used only after build, the method now takes an AliasAnalysis.
Subscribers: sanjoy, arsenm, jvesely, nhaehnle, jlebar, george.burgess.iv, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59315
llvm-svn: 356783
2019-03-22 18:22:19 +01:00
|
|
|
return AAResultBase::pointsToConstantMemory(Loc, AAQI, OrLocal);
|
2017-09-29 11:51:22 +02:00
|
|
|
case CallingConv::AMDGPU_LS:
|
|
|
|
case CallingConv::AMDGPU_HS:
|
|
|
|
case CallingConv::AMDGPU_ES:
|
2017-03-18 00:56:58 +01:00
|
|
|
case CallingConv::AMDGPU_GS:
|
2017-09-29 11:51:22 +02:00
|
|
|
case CallingConv::AMDGPU_VS:
|
2017-03-18 00:56:58 +01:00
|
|
|
case CallingConv::AMDGPU_PS:
|
|
|
|
case CallingConv::AMDGPU_CS:
|
|
|
|
case CallingConv::AMDGPU_KERNEL:
|
|
|
|
case CallingConv::SPIR_KERNEL:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned ArgNo = Arg->getArgNo();
|
|
|
|
/* On an argument, ReadOnly attribute indicates that the function does
|
|
|
|
not write through this pointer argument, even though it may write
|
|
|
|
to the memory that the pointer points to.
|
|
|
|
On an argument, ReadNone attribute indicates that the function does
|
|
|
|
not dereference that pointer argument, even though it may read or write
|
|
|
|
the memory that the pointer points to if accessed through other pointers.
|
|
|
|
*/
|
2017-04-14 01:12:13 +02:00
|
|
|
if (F->hasParamAttribute(ArgNo, Attribute::NoAlias) &&
|
|
|
|
(F->hasParamAttribute(ArgNo, Attribute::ReadNone) ||
|
|
|
|
F->hasParamAttribute(ArgNo, Attribute::ReadOnly))) {
|
2017-03-18 00:56:58 +01:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
[AliasAnalysis] Second prototype to cache BasicAA / anyAA state.
Summary:
Adding contained caching to AliasAnalysis. BasicAA is currently the only one using it.
AA changes:
- This patch is pulling the caches from BasicAAResults to AAResults, meaning the getModRefInfo call benefits from the IsCapturedCache as well when in "batch mode".
- All AAResultBase implementations add the QueryInfo member to all APIs. AAResults APIs maintain wrapper APIs such that all alias()/getModRefInfo call sites are unchanged.
- AA now provides a BatchAAResults type as a wrapper to AAResults. It keeps the AAResults instance and a QueryInfo instantiated to batch mode. It delegates all work to the AAResults instance with the batched QueryInfo. More API wrappers may be needed in BatchAAResults; only the minimum needed is currently added.
MemorySSA changes:
- All walkers are now templated on the AA used (AliasAnalysis=AAResults or BatchAAResults).
- At build time, we optimize uses; now we create a local walker (lives only as long as OptimizeUses does) using BatchAAResults.
- All Walkers have an internal AA and only use that now, never the AA in MemorySSA. The Walkers receive the AA they will use when built.
- The walker we use for queries after the build is instantiated on AliasAnalysis and is built after building MemorySSA and setting AA.
- All static methods doing walking are now templated on AliasAnalysisType if they are used both during build and after. If used only during build, the method now only takes a BatchAAResults. If used only after build, the method now takes an AliasAnalysis.
Subscribers: sanjoy, arsenm, jvesely, nhaehnle, jlebar, george.burgess.iv, llvm-commits
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D59315
llvm-svn: 356783
2019-03-22 18:22:19 +01:00
|
|
|
return AAResultBase::pointsToConstantMemory(Loc, AAQI, OrLocal);
|
2017-03-18 00:56:58 +01:00
|
|
|
}
|