-
Notifications
You must be signed in to change notification settings - Fork 50
/
Copy pathcast.hh
205 lines (182 loc) · 10.5 KB
/
cast.hh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/// \file cast.hh
/// \brief API and specific strategies for applying type casts
#ifndef __CAST_HH__
#define __CAST_HH__
#include "type.hh"
namespace ghidra {
class Varnode;
class PcodeOp;
/// \brief A strategy for applying type casts
///
/// A \e cast operation in C or other languages masks a variety of possible low-level conversions,
/// such as extensions, truncations, integer to floating-point, etc. On top of this, languages allow
/// many of these types of operations to be \e implied in the source code, with no explicit token
/// representing the conversion. Conversions happen automatically for things like \e integer \e promotion,
/// between different sizes (of integers), and between signed and unsigned data-type variants.
///
/// This class is the API for making four kinds of decisions:
/// - Do we need a cast operator for a given assignment
/// - Does the given conversion operation need to be represented as a cast
/// - Does the given extension or comparison match with the expected level of integer promotion
/// - What data-type is produced by a particular integer arithmetic operation
class CastStrategy {
public:
/// \brief Types of integer promotion
///
/// For many languages, small integers are automatically \e promoted to a standard size. The decompiler
/// describes how an expression is or will be affected by integer promotion, using these codes
enum IntPromotionCode {
NO_PROMOTION = -1, ///< There is no integer promotion
UNKNOWN_PROMOTION = 0, ///< The type of integer promotion cannot be determined
UNSIGNED_EXTENSION = 1, ///< The value is promoted using unsigned extension
SIGNED_EXTENSION = 2, ///< The value is promoted using signed extension
EITHER_EXTENSION = 3 ///< The value is promoted using either signed or unsigned extension
};
protected:
TypeFactory *tlst; ///< Type factory associated with the Architecture
int4 promoteSize; ///< Size of \b int data-type, (size that integers get promoted to)
public:
CastStrategy(void) {} ///< Constructor
void setTypeFactory(TypeFactory *t); ///< Establish the data-type factory
virtual ~CastStrategy(void) {} ///< Destructor
/// \brief Decide on integer promotion by examining just local properties of the given Varnode
///
/// \param vn is the given Varnode
/// \param op is the PcodeOp reading the Varnode
/// \return an IntPromotionCode (excluding NO_PROMOTION)
virtual int4 localExtensionType(const Varnode *vn,const PcodeOp *op) const=0;
/// \brief Calculate the integer promotion code of a given Varnode
///
/// Recursively examine the expression defining the Varnode as necessary
/// \param vn is the given Varnode
/// \return the IntPromotionCode
virtual int4 intPromotionType(const Varnode *vn) const=0;
/// \brief Check if integer promotion forces a cast for the given comparison op and slot
///
/// Compute to what level the given slot has seen integer promotion and if
/// a cast is required before the comparison operator makes sense.
/// \param op is the given comparison operator
/// \param slot is the input slot being tested
/// \return \b true if a cast is required before comparing
virtual bool checkIntPromotionForCompare(const PcodeOp *op,int4 slot) const=0;
/// \brief Check if integer promotion forces a cast for the input to the given extension.
///
/// Compute to what level the given slot has seen integer promotion and if
/// a cast is required before the extension operator makes sense.
/// \param op is the given extension operator INT_ZEXT or INT_SEXT
/// \return \b true if a cast is required before extending
virtual bool checkIntPromotionForExtension(const PcodeOp *op) const=0;
/// \brief Is the given ZEXT/SEXT cast implied by the expression its in?
///
/// We've already determined that the given ZEXT or SEXT op can be viewed as a natural \e cast operation.
/// Determine if the cast is implied by the expression its and doesn't need to be printed.
/// \param op is the given ZEXT or SEXT PcodeOp
/// \param readOp is the PcodeOp consuming the output of the extensions (or null)
/// \return \b true if the op as a cast does not need to be printed
virtual bool isExtensionCastImplied(const PcodeOp *op,const PcodeOp *readOp) const=0;
/// \brief Does there need to be a visible cast between the given data-types
///
/// The cast is from a \e current data-type to an \e expected data-type. NULL is returned
/// if no cast is required, otherwise the data-type to cast to (usually the expected data-type)
/// is returned.
/// \param reqtype is the \e expected data-type
/// \param curtype is the \e current data-type
/// \param care_uint_int is \b true if we care about a change in signedness
/// \param care_ptr_uint is \b true if we care about conversions between pointers and unsigned values
/// \return NULL to indicate no cast, or the data-type to cast to
virtual Datatype *castStandard(Datatype *reqtype,Datatype *curtype,bool care_uint_int,bool care_ptr_uint) const=0;
/// \brief What is the output data-type produced by the given integer arithmetic operation
///
/// \param op is the given operation
/// \return the output data-type
virtual Datatype *arithmeticOutputStandard(const PcodeOp *op)=0;
/// \brief Is truncating an input data-type, producing an output data-type, considered a cast
///
/// Data-types must be provided from the input and output of a SUBPIECE operation.
/// \param outtype is the output data-type
/// \param intype is the input data-type
/// \param offset is number of bytes truncated by the SUBPIECE
/// \return \b true if the SUBPIECE should be represented as a cast
virtual bool isSubpieceCast(Datatype *outtype,Datatype *intype,uint4 offset) const=0;
/// \brief Is the given data-type truncation considered a cast, given endianness concerns.
///
/// This is equivalent to isSubpieceCast() but where the truncation is accomplished by pulling
/// bytes directly out of memory. We assume the input data-type is layed down in memory, and
/// we pull the output value starting at a given byte offset.
/// \param outtype is the output data-type
/// \param intype is the input data-type
/// \param offset is the given byte offset (into the input memory)
/// \param isbigend is \b true if the address space holding the memory is big endian.
/// \return \b true if the truncation should be represented as a cast
virtual bool isSubpieceCastEndian(Datatype *outtype,Datatype *intype,uint4 offset,bool isbigend) const=0;
/// \brief Is sign-extending an input data-type, producing an output data-type, considered a cast
///
/// Data-types must be provided from the input and output of an INT_SEXT operation.
/// \param outtype is the output data-type
/// \param intype is the input data-type
/// \return \b true if the INT_SEXT should be represented as a cast
virtual bool isSextCast(Datatype *outtype,Datatype *intype) const=0;
/// \brief Is zero-extending an input data-type, producing an output data-type, considered a cast
///
/// Data-types must be provided from the input and output of an INT_ZEXT operation.
/// \param outtype is the output data-type
/// \param intype is the input data-type
/// \return \b true if the INT_ZEXT should be represented as a cast
virtual bool isZextCast(Datatype *outtype,Datatype *intype) const=0;
/// \brief Check if a constant input should be explicitly labeled as an \e unsigned token
bool markExplicitUnsigned(PcodeOp *op,int4 slot) const;
/// \brief Check is a constant input should be explicitly labeled as a \e long integer token
bool markExplicitLongSize(PcodeOp *op,int4 slot) const;
/// \brief For the given PcodeOp, does it matter if a constant operand is presented as a character or integer
///
/// In most languages, character constants are promoted to integers as a matter of course, so it
/// doesn't matter if the constant is represented as an integer (a string of digits) or a character
/// (surrounded by quotes). But its possible that a particular operator does care. If the operator
/// needs an explicit character representation for an operand with a character data-type, return \b true.
/// \param vn is the constant with character data-type
/// \param op is the given PcodeOp which reads the constant (may be null)
/// \return \b true if the constant must be represented as an explicit character
bool caresAboutCharRepresentation(const Varnode *vn,const PcodeOp *op) const { return false; }
};
/// \brief Casting strategies that are specific to the C language
class CastStrategyC : public CastStrategy {
public:
virtual int4 localExtensionType(const Varnode *vn,const PcodeOp *op) const;
virtual int4 intPromotionType(const Varnode *vn) const;
virtual bool checkIntPromotionForCompare(const PcodeOp *op,int4 slot) const;
virtual bool checkIntPromotionForExtension(const PcodeOp *op) const;
virtual bool isExtensionCastImplied(const PcodeOp *op,const PcodeOp *readOp) const;
virtual Datatype *castStandard(Datatype *reqtype,Datatype *curtype,bool care_uint_int,bool care_ptr_uint) const;
virtual Datatype *arithmeticOutputStandard(const PcodeOp *op);
virtual bool isSubpieceCast(Datatype *outtype,Datatype *intype,uint4 offset) const;
virtual bool isSubpieceCastEndian(Datatype *outtype,Datatype *intype,uint4 offset,bool isbigend) const;
virtual bool isSextCast(Datatype *outtype,Datatype *intype) const;
virtual bool isZextCast(Datatype *outtype,Datatype *intype) const;
};
/// \brief Casting strategies that are specific to the Java language
///
/// This is nearly identical to the strategy for C, but there is some change to account
/// for the way object references are encoded as pointer data-types within the
/// decompiler's data-type system.
class CastStrategyJava : public CastStrategyC {
public:
virtual Datatype *castStandard(Datatype *reqtype,Datatype *curtype,bool care_uint_int,bool care_ptr_uint) const;
virtual bool isZextCast(Datatype *outtype,Datatype *intype) const;
};
} // End namespace ghidra
#endif