27#define DEBUG_TYPE "dxil-data-scalarization"
70 typedef std::tuple<AllocaInst *, Type *, SmallVector<Value *, 4>>
75 VectorToArrayMap VectorAllocaMap;
86 bool MadeChange =
false;
92 VectorAllocaMap.clear();
97DataScalarizerVisitor::lookupReplacementGlobal(
Value *CurrOperand) {
99 auto It = GlobalMap.find(OldGlobal);
100 if (It != GlobalMap.end()) {
122 Type *NewElementType =
138 Builder.CreateAlloca(NewType,
nullptr, AI.
getName() +
".scalarized");
148 if (CE && CE->getOpcode() == Instruction::GetElementPtr) {
159 if (
GlobalVariable *NewGlobal = lookupReplacementGlobal(PtrOperand))
166 Value *PtrOperand =
SI.getPointerOperand();
168 if (CE && CE->getOpcode() == Instruction::GetElementPtr) {
172 StoreInst *NewStore = Builder.CreateStore(
SI.getValueOperand(), OldGEP);
174 SI.replaceAllUsesWith(NewStore);
175 SI.eraseFromParent();
179 if (
GlobalVariable *NewGlobal = lookupReplacementGlobal(PtrOperand))
180 SI.setOperand(
SI.getPointerOperandIndex(), NewGlobal);
185DataScalarizerVisitor::AllocaAndGEPs
186DataScalarizerVisitor::createArrayFromVector(
IRBuilder<> &Builder,
Value *Vec,
187 const Twine &Name =
"") {
190 return VectorAllocaMap[Vec];
195 Builder.SetInsertPointPastAllocas(Builder.GetInsertBlock()->getParent());
205 AllocaInst *ArrAlloca =
214 SmallVector<Value *, 4> GEPs(ArrNumElems);
215 for (
unsigned I = 0;
I < ArrNumElems; ++
I) {
218 EE = Builder.
CreateZExt(EE, ArrElemTy, Name +
".zext");
225 VectorAllocaMap.insert({Vec, {ArrAlloca, ArrTy, GEPs}});
227 return {ArrAlloca, ArrTy, GEPs};
232static std::pair<Value *, Value *>
235 Value *
GEP = Builder.CreateInBoundsGEP(
236 ArrTy, ArrAlloca, {Builder.getInt32(0), Index}, Name +
".index");
239 return std::make_pair(
GEP, Load);
242bool DataScalarizerVisitor::replaceDynamicInsertElementInst(
250 AllocaAndGEPs ArrAllocaAndGEPs =
251 createArrayFromVector(Builder, Vec, IEI.
getName());
252 AllocaInst *ArrAlloca = std::get<0>(ArrAllocaAndGEPs);
253 Type *ArrTy = std::get<1>(ArrAllocaAndGEPs);
254 SmallVector<Value *, 4> &ArrGEPs = std::get<2>(ArrAllocaAndGEPs);
261 bool WidenBool = ArrElemTy != VecElemTy && VecElemTy->
isIntegerTy(1);
268 Value *StoreVal = Val;
297 return replaceDynamicInsertElementInst(IEI);
300bool DataScalarizerVisitor::replaceDynamicExtractElementInst(
304 AllocaAndGEPs ArrAllocaAndGEPs =
306 AllocaInst *ArrAlloca = std::get<0>(ArrAllocaAndGEPs);
307 Type *ArrTy = std::get<1>(ArrAllocaAndGEPs);
311 Value *Load = GEPAndLoad.second;
316 if (Load->getType() != EEI.
getType()) {
318 "Unexpected type mismatch: only i32 -> i1 widening is supported");
319 Load = Builder.CreateTrunc(Load, EEI.
getType(), EEI.
getName() +
".trunc");
332 return replaceDynamicExtractElementInst(EEI);
343 PtrOpGEPCE && PtrOpGEPCE->getOpcode() == Instruction::GetElementPtr) {
354 "Expected newly-created GEP to be an instruction");
365 Value *NewPtrOperand = PtrOperand;
366 if (
GlobalVariable *NewGlobal = lookupReplacementGlobal(PtrOperand))
367 NewPtrOperand = NewGlobal;
369 bool NeedsTransform = NewPtrOperand != PtrOperand || NewGEPType != GEPType;
375 Value *NewGEP = Builder.CreateGEP(NewGEPType, NewPtrOperand, Indices,
381 OldGEPI->eraseFromParent();
404 for (
unsigned I = 0;
I !=
E; ++
I)
409 "Expected fixed length constant aggregate for vector initializer!");
416 assert(ArrayInit &&
"Expected a ConstantArray for array initializer!");
419 for (
unsigned I = 0;
I < ArrayTy->getNumElements(); ++
I) {
422 ArrayInit->getOperand(
I), ArrayTy->getElementType(),
435 bool MadeChange =
false;
440 Type *OrigType =
G.getValueType();
443 if (OrigType != NewType) {
447 M, NewType,
G.isConstant(),
G.getLinkage(),
448 nullptr,
G.getName() +
".scalarized", &
G,
449 G.getThreadLocalMode(),
G.getAddressSpace(),
450 G.isExternallyInitialized());
454 if (
G.getAlignment() > 0) {
458 if (
G.hasInitializer()) {
466 Impl.GlobalMap[&
G] = NewGlobal;
471 if (
F.isDeclaration())
473 MadeChange |= Impl.visit(
F);
477 for (
auto &[Old, New] : Impl.GlobalMap) {
478 Old->eraseFromParent();
500 "DXIL Data Scalarization",
false,
false)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static bool findAndReplaceVectors(Module &M)
static std::pair< Value *, Value * > dynamicallyLoadArray(IRBuilder<> &Builder, AllocaInst *ArrAlloca, Type *ArrTy, Value *Index, const Twine &Name="")
Returns a pair of Value* with the first being a GEP into ArrAlloca using indices {0,...
static bool isVectorOrArrayOfVectors(Type *T)
static Type * equivalentArrayTypeFromVector(Type *T)
static const int MaxVecSize
static Constant * transformInitializer(Constant *Init, Type *OrigType, Type *NewType, LLVMContext &Ctx)
Module.h This file contains the declarations for the Module class.
This header defines various interfaces for pass management in LLVM.
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
bool runOnModule(Module &M) override
runOnModule - Virtual method overriden by subclasses to process the module being operated on.
DXILDataScalarizationLegacy()
bool visitCallInst(CallInst &ICI)
bool visitInstruction(Instruction &I)
bool visitBinaryOperator(BinaryOperator &BO)
bool visitInsertElementInst(InsertElementInst &IEI)
bool visitGetElementPtrInst(GetElementPtrInst &GEPI)
bool visitStoreInst(StoreInst &SI)
bool visitFreezeInst(FreezeInst &FI)
bool visitBitCastInst(BitCastInst &BCI)
bool visitCastInst(CastInst &CI)
bool visitFCmpInst(FCmpInst &FCI)
bool visitLoadInst(LoadInst &LI)
bool visitSelectInst(SelectInst &SI)
bool visitUnaryOperator(UnaryOperator &UO)
bool visitICmpInst(ICmpInst &ICI)
bool visitShuffleVectorInst(ShuffleVectorInst &SVI)
bool visitAllocaInst(AllocaInst &AI)
bool visitPHINode(PHINode &PHI)
bool visitExtractElementInst(ExtractElementInst &EEI)
friend bool findAndReplaceVectors(llvm::Module &M)
an instruction to allocate memory on the stack
Align getAlign() const
Return the alignment of the memory that is being allocated by the instruction.
Type * getAllocatedType() const
Return the type that is being allocated by the instruction.
void setAlignment(Align Align)
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
LLVM Basic Block Representation.
This class represents a no-op cast from one type to another.
This class represents a function call, abstracting a target machine's calling convention.
This is the base class for all instructions that perform data casts.
static LLVM_ABI ConstantAggregateZero * get(Type *Ty)
static LLVM_ABI Constant * get(ArrayType *T, ArrayRef< Constant * > V)
A constant value that is initialized with an expression using other constant values.
This is an important base class in LLVM.
PreservedAnalyses run(Module &M, ModuleAnalysisManager &)
bool contains(const_arg_type_t< KeyT > Val) const
Return true if the specified key is in the map, false otherwise.
This instruction compares its operands according to the predicate given to the constructor.
This class represents a freeze function that returns random concrete value if an operand is either a ...
LLVM_ABI Type * getSourceElementType() const
Value * getPointerOperand()
GEPNoWrapFlags getNoWrapFlags() const
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
iterator_range< op_iterator > indices()
Type * getSourceElementType() const
LLVM_ABI GEPNoWrapFlags getNoWrapFlags() const
Get the nowrap flags for the GEP instruction.
void setUnnamedAddr(UnnamedAddr Val)
LLVM_ABI void setInitializer(Constant *InitVal)
setInitializer - Sets the initializer for this global variable, removing any existing initializer if ...
void setAlignment(Align Align)
Sets the alignment attribute of the GlobalVariable.
This instruction compares its operands according to the predicate given to the constructor.
Value * CreateInsertElement(Type *VecTy, Value *NewElt, Value *Idx, const Twine &Name="")
AllocaInst * CreateAlloca(Type *Ty, unsigned AddrSpace, Value *ArraySize=nullptr, const Twine &Name="")
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
BasicBlock::iterator GetInsertPoint() const
Value * CreateInBoundsGEP(Type *Ty, Value *Ptr, ArrayRef< Value * > IdxList, const Twine &Name="")
ConstantInt * getInt32(uint32_t C)
Get a constant 32-bit value.
LoadInst * CreateLoad(Type *Ty, Value *Ptr, const char *Name)
Provided to resolve 'CreateLoad(Ty, Ptr, "...")' correctly, instead of converting the string to 'bool...
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
StoreInst * CreateStore(Value *Val, Value *Ptr, bool isVolatile=false)
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
This instruction inserts a single (scalar) element into a VectorType value.
Base class for instruction visitors.
void visit(Iterator Start, Iterator End)
LLVM_ABI void insertBefore(InstListType::iterator InsertPos)
Insert an unlinked instruction into a basic block immediately before the specified position.
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
This is an important class for using LLVM in a threaded context.
An instruction for reading from memory.
void setAlignment(Align Align)
Value * getPointerOperand()
static unsigned getPointerOperandIndex()
Align getAlign() const
Return the alignment of the access that is being performed.
ModulePass class - This class is used to implement unstructured interprocedural optimizations and ana...
A Module instance is used to store all the information related to an LLVM module.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
This class represents the LLVM 'select' instruction.
This instruction constructs a fixed permutation of two input vectors.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
void setAlignment(Align Align)
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Type * getArrayElementType() const
LLVM_ABI uint64_t getArrayNumElements() const
bool isIntegerTy() const
True if this is an instance of IntegerType.
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
void setOperand(unsigned i, Value *Val)
Value * getOperand(unsigned i) const
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
self_iterator getIterator()
NodeAddr< InstrNode * > Instr
This is an optimization pass for GlobalISel generic memory operations.
FunctionAddr VTableAddr Value
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
ModulePass * createDXILDataScalarizationLegacyPass()
Pass to scalarize llvm global data into a DXIL legal form.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
IRBuilder(LLVMContext &, FolderTy, InserterTy, MDNode *, ArrayRef< OperandBundleDef >) -> IRBuilder< FolderTy, InserterTy >
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
AnalysisManager< Module > ModuleAnalysisManager
Convenience typedef for the Module analysis manager.