LLVM 23.0.0git
MCInstrAnalysis.h
Go to the documentation of this file.
1//===- llvm/MC/MCInstrAnalysis.h - InstrDesc target hooks -------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the MCInstrAnalysis class which the MCTargetDescs can
10// derive from to give additional information to MC.
11//
12//===----------------------------------------------------------------------===//
13
14#ifndef LLVM_MC_MCINSTRANALYSIS_H
15#define LLVM_MC_MCINSTRANALYSIS_H
16
17#include "llvm/ADT/ArrayRef.h"
18#include "llvm/MC/MCInst.h"
19#include "llvm/MC/MCInstrDesc.h"
20#include "llvm/MC/MCInstrInfo.h"
23#include <cstdint>
24#include <vector>
25
26namespace llvm {
27
28class MCRegisterInfo;
29class Triple;
30
32protected:
33 friend class Target;
34
36
37public:
39 virtual ~MCInstrAnalysis() = default;
40
41 /// Clear the internal state. See updateState for more information.
42 virtual void resetState() {}
43
44 /// Update internal state with \p Inst at \p Addr.
45 ///
46 /// For some types of analyses, inspecting a single instruction is not
47 /// sufficient. Some examples are auipc/jalr pairs on RISC-V or adrp/ldr pairs
48 /// on AArch64. To support inspecting multiple instructions, targets may keep
49 /// track of an internal state while analysing instructions. Clients should
50 /// call updateState for every instruction which allows later calls to one of
51 /// the analysis functions to take previous instructions into account.
52 /// Whenever state becomes irrelevant (e.g., when starting to disassemble a
53 /// new function), clients should call resetState to clear it.
54 virtual void updateState(const MCInst &Inst, const MCSubtargetInfo *STI,
55 uint64_t Addr) {}
56
57 virtual bool isBranch(const MCInst &Inst) const {
58 return Info->get(Inst.getOpcode()).isBranch();
59 }
60
61 virtual bool isConditionalBranch(const MCInst &Inst) const {
62 return Info->get(Inst.getOpcode()).isConditionalBranch();
63 }
64
65 virtual bool isUnconditionalBranch(const MCInst &Inst) const {
66 return Info->get(Inst.getOpcode()).isUnconditionalBranch();
67 }
68
69 virtual bool isIndirectBranch(const MCInst &Inst) const {
70 return Info->get(Inst.getOpcode()).isIndirectBranch();
71 }
72
73 virtual bool isCall(const MCInst &Inst) const {
74 return Info->get(Inst.getOpcode()).isCall();
75 }
76
77 virtual bool isReturn(const MCInst &Inst) const {
78 return Info->get(Inst.getOpcode()).isReturn();
79 }
80
81 virtual bool isTerminator(const MCInst &Inst) const {
82 return Info->get(Inst.getOpcode()).isTerminator();
83 }
84
85 virtual bool isBarrier(const MCInst &Inst) const {
86 return Info->get(Inst.getOpcode()).isBarrier();
87 }
88
89 virtual bool mayAffectControlFlow(const MCInst &Inst,
90 const MCRegisterInfo &MCRI) const {
91 if (isBranch(Inst) || isCall(Inst) || isReturn(Inst) ||
92 isIndirectBranch(Inst))
93 return true;
94 MCRegister PC = MCRI.getProgramCounter();
95 if (!PC)
96 return false;
97 return Info->get(Inst.getOpcode()).hasDefOfPhysReg(Inst, PC, MCRI);
98 }
99
100 /// Returns true if at least one of the register writes performed by
101 /// \param Inst implicitly clears the upper portion of all super-registers.
102 ///
103 /// Example: on X86-64, a write to EAX implicitly clears the upper half of
104 /// RAX. Also (still on x86) an XMM write perfomed by an AVX 128-bit
105 /// instruction implicitly clears the upper portion of the correspondent
106 /// YMM register.
107 ///
108 /// This method also updates an APInt which is used as mask of register
109 /// writes. There is one bit for every explicit/implicit write performed by
110 /// the instruction. If a write implicitly clears its super-registers, then
111 /// the corresponding bit is set (vic. the corresponding bit is cleared).
112 ///
113 /// The first bits in the APint are related to explicit writes. The remaining
114 /// bits are related to implicit writes. The sequence of writes follows the
115 /// machine operand sequence. For implicit writes, the sequence is defined by
116 /// the MCInstrDesc.
117 ///
118 /// The assumption is that the bit-width of the APInt is correctly set by
119 /// the caller. The default implementation conservatively assumes that none of
120 /// the writes clears the upper portion of a super-register.
121 virtual bool clearsSuperRegisters(const MCRegisterInfo &MRI,
122 const MCInst &Inst,
123 APInt &Writes) const;
124
125 /// Returns true if MI is a dependency breaking zero-idiom for the given
126 /// subtarget.
127 ///
128 /// Mask is used to identify input operands that have their dependency
129 /// broken. Each bit of the mask is associated with a specific input operand.
130 /// Bits associated with explicit input operands are laid out first in the
131 /// mask; implicit operands come after explicit operands.
132 ///
133 /// Dependencies are broken only for operands that have their corresponding bit
134 /// set. Operands that have their bit cleared, or that don't have a
135 /// corresponding bit in the mask don't have their dependency broken. Note
136 /// that Mask may not be big enough to describe all operands. The assumption
137 /// for operands that don't have a correspondent bit in the mask is that those
138 /// are still data dependent.
139 ///
140 /// The only exception to the rule is for when Mask has all zeroes.
141 /// A zero mask means: dependencies are broken for all explicit register
142 /// operands.
143 virtual bool isZeroIdiom(const MCInst &MI, APInt &Mask,
144 unsigned CPUID) const {
145 return false;
146 }
147
148 /// Returns true if MI is a dependency breaking instruction for the
149 /// subtarget associated with CPUID .
150 ///
151 /// The value computed by a dependency breaking instruction is not dependent
152 /// on the inputs. An example of dependency breaking instruction on X86 is
153 /// `XOR %eax, %eax`.
154 ///
155 /// If MI is a dependency breaking instruction for subtarget CPUID, then Mask
156 /// can be inspected to identify independent operands.
157 ///
158 /// Essentially, each bit of the mask corresponds to an input operand.
159 /// Explicit operands are laid out first in the mask; implicit operands follow
160 /// explicit operands. Bits are set for operands that are independent.
161 ///
162 /// Note that the number of bits in Mask may not be equivalent to the sum of
163 /// explicit and implicit operands in MI. Operands that don't have a
164 /// corresponding bit in Mask are assumed "not independente".
165 ///
166 /// The only exception is for when Mask is all zeroes. That means: explicit
167 /// input operands of MI are independent.
168 virtual bool isDependencyBreaking(const MCInst &MI, APInt &Mask,
169 unsigned CPUID) const {
170 return isZeroIdiom(MI, Mask, CPUID);
171 }
172
173 /// Returns true if MI is a candidate for move elimination.
174 ///
175 /// Different subtargets may apply different constraints to optimizable
176 /// register moves. For example, on most X86 subtargets, a candidate for move
177 /// elimination cannot specify the same register for both source and
178 /// destination.
180 unsigned CPUID) const {
181 return false;
182 }
183
184 /// Given a branch instruction try to get the address the branch
185 /// targets. Return true on success, and the address in Target.
186 virtual bool
187 evaluateBranch(const MCInst &Inst, uint64_t Addr, uint64_t Size,
188 uint64_t &Target) const;
189
190 /// Given an instruction tries to get the address of a memory operand. Returns
191 /// the address on success.
192 virtual std::optional<uint64_t>
193 evaluateMemoryOperandAddress(const MCInst &Inst, const MCSubtargetInfo *STI,
194 uint64_t Addr, uint64_t Size) const;
195
196 /// Given an instruction with a memory operand that could require relocation,
197 /// returns the offset within the instruction of that relocation.
198 virtual std::optional<uint64_t>
199 getMemoryOperandRelocationOffset(const MCInst &Inst, uint64_t Size) const;
200
201 /// Returns (PLT virtual address, GOT virtual address) pairs for PLT entries.
202 virtual std::vector<std::pair<uint64_t, uint64_t>>
203 findPltEntries(uint64_t PltSectionVA, ArrayRef<uint8_t> PltContents,
204 const MCSubtargetInfo &STI) const {
205 return {};
206 }
207};
208
209} // end namespace llvm
210
211#endif // LLVM_MC_MCINSTRANALYSIS_H
#define LLVM_ABI
Definition Compiler.h:213
IRTranslator LLVM IR MI
static bool isBranch(unsigned Opcode)
Class for arbitrary precision integers.
Definition APInt.h:78
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
Instances of this class represent a single low-level machine instruction.
Definition MCInst.h:188
unsigned getOpcode() const
Definition MCInst.h:202
virtual std::vector< std::pair< uint64_t, uint64_t > > findPltEntries(uint64_t PltSectionVA, ArrayRef< uint8_t > PltContents, const MCSubtargetInfo &STI) const
Returns (PLT virtual address, GOT virtual address) pairs for PLT entries.
virtual bool isCall(const MCInst &Inst) const
virtual bool isBranch(const MCInst &Inst) const
virtual bool isOptimizableRegisterMove(const MCInst &MI, unsigned CPUID) const
Returns true if MI is a candidate for move elimination.
virtual bool isDependencyBreaking(const MCInst &MI, APInt &Mask, unsigned CPUID) const
Returns true if MI is a dependency breaking instruction for the subtarget associated with CPUID .
virtual bool isUnconditionalBranch(const MCInst &Inst) const
virtual void updateState(const MCInst &Inst, const MCSubtargetInfo *STI, uint64_t Addr)
Update internal state with Inst at Addr.
virtual bool isZeroIdiom(const MCInst &MI, APInt &Mask, unsigned CPUID) const
Returns true if MI is a dependency breaking zero-idiom for the given subtarget.
virtual bool isTerminator(const MCInst &Inst) const
virtual bool isBarrier(const MCInst &Inst) const
virtual void resetState()
Clear the internal state. See updateState for more information.
virtual bool isConditionalBranch(const MCInst &Inst) const
virtual bool mayAffectControlFlow(const MCInst &Inst, const MCRegisterInfo &MCRI) const
virtual bool isReturn(const MCInst &Inst) const
const MCInstrInfo * Info
MCInstrAnalysis(const MCInstrInfo *Info)
virtual ~MCInstrAnalysis()=default
virtual bool isIndirectBranch(const MCInst &Inst) const
Interface to description of machine instruction set.
Definition MCInstrInfo.h:27
MCRegisterInfo base class - We assume that the target defines a static array of MCRegisterDesc object...
MCRegister getProgramCounter() const
Return the register which is the program counter.
Wrapper class representing physical registers. Should be passed by value.
Definition MCRegister.h:41
Generic base class for all target subtargets.
Target - Wrapper for Target specific information.
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26