This pass does miscellaneous AMDGPU optimizations on IR before instruction selection. More...

#include "AMDGPU.h"
#include "AMDGPUTargetMachine.h"
#include "SIModeRegisterDefaults.h"
#include "llvm/Analysis/AssumptionCache.h"
#include "llvm/Analysis/ConstantFolding.h"
#include "llvm/Analysis/TargetLibraryInfo.h"
#include "llvm/Analysis/UniformityAnalysis.h"
#include "llvm/Analysis/ValueTracking.h"
#include "llvm/CodeGen/TargetPassConfig.h"
#include "llvm/IR/Dominators.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/InstVisitor.h"
#include "llvm/IR/IntrinsicsAMDGPU.h"
#include "llvm/IR/PatternMatch.h"
#include "llvm/InitializePasses.h"
#include "llvm/Pass.h"
#include "llvm/Support/KnownBits.h"
#include "llvm/Transforms/Utils/IntegerDivision.h"
#include "llvm/Transforms/Utils/Local.h"

Classes
class	VectorSlice
	Helper class for "break large PHIs" (visitPHINode). More...

Macros
#define	DEBUG_TYPE "amdgpu-codegenprepare"

Functions
static bool	promotedOpIsNSW (const Instruction &I)

static bool	promotedOpIsNUW (const Instruction &I)

static void	extractValues (IRBuilder<> &Builder, SmallVectorImpl< Value * > &Values, Value *V)

static Value *	insertValues (IRBuilder<> &Builder, Type *Ty, SmallVectorImpl< Value * > &Values)

static SelectInst *	findSelectThroughCast (Value *V, CastInst *&Cast)

static Value *	emitRsqIEEE1ULP (IRBuilder<> &Builder, Value *Src, bool IsNegative)
	Emit an expansion of 1.0 / sqrt(Src) good for 1ulp that supports denormals.

static std::pair< Value *, Value * >	getMul64 (IRBuilder<> &Builder, Value *LHS, Value *RHS)

static Value *	getMulHu (IRBuilder<> &Builder, Value *LHS, Value *RHS)

static Value *	getSign32 (Value *V, IRBuilder<> &Builder, const DataLayout DL)

static bool	areInSameBB (const Value *A, const Value *B)

static bool	isInterestingPHIIncomingValue (const Value *V)

static void	collectPHINodes (const PHINode &I, SmallPtrSet< const PHINode *, 8 > &SeenPHIs)

static bool	isPtrKnownNeverNull (const Value *V, const DataLayout &DL, const AMDGPUTargetMachine &TM, unsigned AS)

static bool	isOneOrNegOne (const Value *Val)

	INITIALIZE_PASS_BEGIN (AMDGPUCodeGenPrepare, DEBUG_TYPE, "AMDGPU IR optimizations", false, false) INITIALIZE_PASS_END(AMDGPUCodeGenPrepare

Variables
	DEBUG_TYPE

AMDGPU IR	optimizations

AMDGPU IR	false

Detailed Description

This pass does miscellaneous AMDGPU optimizations on IR before instruction selection.

Definition in file AMDGPUCodeGenPrepare.cpp.

Macro Definition Documentation

◆ DEBUG_TYPE

#define DEBUG_TYPE "amdgpu-codegenprepare"

Definition at line 35 of file AMDGPUCodeGenPrepare.cpp.

Function Documentation

◆ areInSameBB()

static bool areInSameBB	(	const Value *	A,
		const Value *	B
	)

static

Definition at line 1751 of file AMDGPUCodeGenPrepare.cpp.

References A, and B.

Referenced by isInterestingPHIIncomingValue().

◆ collectPHINodes()

static void collectPHINodes	(	const PHINode &	I,
		SmallPtrSet< const PHINode *, 8 > &	SeenPHIs
	)

static

Definition at line 1814 of file AMDGPUCodeGenPrepare.cpp.

References collectPHINodes(), I, and llvm::SmallPtrSetImpl< PtrType >::insert().

Referenced by collectPHINodes().

◆ emitRsqIEEE1ULP()

static Value * emitRsqIEEE1ULP	(	IRBuilder<> &	Builder,
		Value *	Src,
		bool	IsNegative
	)

static

Emit an expansion of 1.0 / sqrt(Src) good for 1ulp that supports denormals.

Definition at line 869 of file AMDGPUCodeGenPrepare.cpp.

References llvm::IRBuilderBase::CreateFCmpOLT(), llvm::IRBuilderBase::CreateFMul(), llvm::IRBuilderBase::CreateSelect(), llvm::IRBuilderBase::CreateUnaryIntrinsic(), llvm::Type::getFltSemantics(), and llvm::APFloat::getSmallestNormalized().

◆ extractValues()

static void extractValues	(	IRBuilder<> &	Builder,
		SmallVectorImpl< Value * > &	Values,
		Value *	V
	)

static

Definition at line 608 of file AMDGPUCodeGenPrepare.cpp.

References llvm::IRBuilderBase::CreateExtractElement(), I, and llvm::SmallVectorTemplateBase< T, bool >::push_back().

◆ findSelectThroughCast()

static SelectInst * findSelectThroughCast	(	Value *	V,
		CastInst *&	Cast
	)

static

Definition at line 700 of file AMDGPUCodeGenPrepare.cpp.

References llvm::User::getOperand().

◆ getMul64()

static std::pair< Value *, Value * > getMul64	(	IRBuilder<> &	Builder,
		Value *	LHS,
		Value *	RHS
	)

static

Definition at line 1173 of file AMDGPUCodeGenPrepare.cpp.

References llvm::IRBuilderBase::CreateLShr(), llvm::IRBuilderBase::CreateMul(), llvm::IRBuilderBase::CreateTrunc(), llvm::IRBuilderBase::CreateZExt(), llvm::IRBuilderBase::getInt32Ty(), llvm::IRBuilderBase::getInt64(), llvm::IRBuilderBase::getInt64Ty(), Hi, LHS, Lo, and RHS.

Referenced by getMulHu().

◆ getMulHu()

static Value * getMulHu	(	IRBuilder<> &	Builder,
		Value *	LHS,
		Value *	RHS
	)

static

Definition at line 1187 of file AMDGPUCodeGenPrepare.cpp.

References getMul64(), LHS, and RHS.

◆ getSign32()

static Value * getSign32	(	Value *	V,
		IRBuilder<> &	Builder,
		const DataLayout	DL
	)

static

Definition at line 1382 of file AMDGPUCodeGenPrepare.cpp.

References llvm::computeKnownBits(), llvm::IRBuilderBase::CreateAShr(), DL, llvm::Constant::getAllOnesValue(), llvm::IRBuilderBase::getInt32(), llvm::Constant::getNullValue(), llvm::KnownBits::isNegative(), and llvm::KnownBits::isNonNegative().

◆ INITIALIZE_PASS_BEGIN()

INITIALIZE_PASS_BEGIN	(	AMDGPUCodeGenPrepare	,
		DEBUG_TYPE	,
		"AMDGPU IR optimizations"	,
		false	,
		false
	)

◆ insertValues()

static Value * insertValues	(	IRBuilder<> &	Builder,
		Type *	Ty,
		SmallVectorImpl< Value * > &	Values
	)

static

Definition at line 620 of file AMDGPUCodeGenPrepare.cpp.

References assert(), llvm::IRBuilderBase::CreateInsertElement(), llvm::PoisonValue::get(), I, llvm::Type::isVectorTy(), and llvm::SmallVectorBase< Size_T >::size().

◆ isInterestingPHIIncomingValue()

static bool isInterestingPHIIncomingValue ( const Value * V )

static

Definition at line 1759 of file AMDGPUCodeGenPrepare.cpp.

References llvm::BitVector::all(), areInSameBB(), Idx, and llvm::BitVector::set().

◆ isOneOrNegOne()

static bool isOneOrNegOne ( const Value * Val )

static

Definition at line 2218 of file AMDGPUCodeGenPrepare.cpp.

References llvm::CallingConv::C, llvm::PatternMatch::m_APFloat(), and llvm::PatternMatch::match().

◆ isPtrKnownNeverNull()

static bool isPtrKnownNeverNull	(	const Value *	V,
		const DataLayout &	DL,
		const AMDGPUTargetMachine &	TM,
		unsigned	AS
	)

static

Parameters

V	Value to check
DL	DataLayout
TM	TargetMachine (TODO: remove once DL contains nullptr values)
AS	Target Address Space

Returns: true if V cannot be the null value of AS, false otherwise.

Definition at line 2045 of file AMDGPUCodeGenPrepare.cpp.

References assert(), llvm::computeKnownBits(), and DL.

◆ promotedOpIsNSW()

static bool promotedOpIsNSW ( const Instruction & I )

static

Definition at line 437 of file AMDGPUCodeGenPrepare.cpp.

References I.

◆ promotedOpIsNUW()

static bool promotedOpIsNUW ( const Instruction & I )

static

Definition at line 451 of file AMDGPUCodeGenPrepare.cpp.

References I.

Variable Documentation

◆ DEBUG_TYPE

DEBUG_TYPE

Definition at line 2323 of file AMDGPUCodeGenPrepare.cpp.

◆ false

AMDGPU IR false

Definition at line 2324 of file AMDGPUCodeGenPrepare.cpp.

◆ optimizations

AMDGPU IR optimizations

Definition at line 2323 of file AMDGPUCodeGenPrepare.cpp.

Classes

Macros

Functions

Variables

Detailed Description

Macro Definition Documentation

◆ DEBUG_TYPE

Function Documentation

◆ areInSameBB()

◆ collectPHINodes()

◆ emitRsqIEEE1ULP()

◆ extractValues()

◆ findSelectThroughCast()

◆ getMul64()

◆ getMulHu()

◆ getSign32()

◆ INITIALIZE_PASS_BEGIN()

◆ insertValues()

◆ isInterestingPHIIncomingValue()

◆ isOneOrNegOne()

◆ isPtrKnownNeverNull()

◆ promotedOpIsNSW()

◆ promotedOpIsNUW()

Variable Documentation

◆ DEBUG_TYPE

◆ false

◆ optimizations