forked from facebook/hhvm
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathalias-class.h
More file actions
401 lines (349 loc) · 14.1 KB
/
alias-class.h
File metadata and controls
401 lines (349 loc) · 14.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
/*
+----------------------------------------------------------------------+
| HipHop for PHP |
+----------------------------------------------------------------------+
| Copyright (c) 2010-2016 Facebook, Inc. (http://www.facebook.com) |
+----------------------------------------------------------------------+
| This source file is subject to version 3.01 of the PHP license, |
| that is bundled with this package in the file LICENSE, and is |
| available through the world-wide-web at the following url: |
| http://www.php.net/license/3_01.txt |
| If you did not receive a copy of the PHP license and are unable to |
| obtain it through the world-wide-web, please send a note to |
| license@php.net so we can mail you a copy immediately. |
+----------------------------------------------------------------------+
*/
#ifndef incl_HPHP_ALIAS_CLASS_H_
#define incl_HPHP_ALIAS_CLASS_H_
#include "hphp/runtime/vm/minstr-state.h"
#include "hphp/runtime/vm/jit/alias-id-set.h"
#include "hphp/runtime/vm/jit/stack-offsets.h"
#include <folly/Optional.h>
#include <bitset>
#include <string>
#include <cstdint>
namespace HPHP { struct StringData; }
namespace HPHP { namespace jit {
struct SSATmp;
//////////////////////////////////////////////////////////////////////
/*
* AliasClass represents a lattice of abstract memory locations. These support
* type-system-like operations (operator<= for subset, operator| for union, and
* maybe() to test for non-zero intersections).
*
* AUnknown is the top of the lattice (is the class of all possible memory
* locations we care about). AEmpty is the bottom. AUnknownTV is a union of
* all the classes that contain TypedValue-style storage of PHP values. The
* various special location types AFoo all have an AFooAny, which is the
* superset of all AFoos.
*
* Part of the lattice currently looks like this:
*
* Unknown
* |
* |
* +-------+-------+----------+
* | | |
* UnknownTV IterPosAny IterBaseAny
* | | |
* | ... ...
* |
* +---------+---+---------------+-------------------------+
* | | | |
* | | | |
* | | | |
* | | | |
* | | HeapAny* |
* | | | |
* | | +------+------+---------+ |
* | | | | | |
* FrameAny StackAny ElemAny PropAny RefAny MIStateAny
* | | / \ | | |
* ... ... ElemIAny ElemSAny ... ... |
* | | |
* ... ... ----------------+-------------
* | | | |
* MITempBase MITvRef MITvRef2 MIBase
*
*
* (*) AHeapAny contains some things other than ElemAny, PropAny and RefAny
* that don't have explicit nodes in the lattice yet. (Like the
* lvalBlackhole, etc.) It's hard for this to matter to client code for
* now because we don't expose an intersection or difference operation.
*/
struct AliasClass;
//////////////////////////////////////////////////////////////////////
/*
* Special data for locations known to be a set of locals on the frame `fp'.
*/
struct AFrame { SSATmp* fp; AliasIdSet ids; };
/*
* A specific php iterator's position value (m_pos).
*/
struct AIterPos { SSATmp* fp; uint32_t id; };
/*
* A specific php iterator's base and initialization state, for non-mutable
* iterators.
*
* Instances of this AliasClass cover both the memory storing the pointer to
* the object being iterated, and the initialization flags (itype and next
* helper)---the reason for this is that nothing may load/store the
* initialization state if it isn't also going to load/store the base pointer.
*/
struct AIterBase { SSATmp* fp; uint32_t id; };
/*
* A location inside of an object property, with base `obj' and byte offset
* `offset' from the ObjectData*.
*/
struct AProp { SSATmp* obj; uint32_t offset; };
/*
* A integer index inside of an array, with base `arr'. The `arr' tmp is any
* kind of array (not necessarily kPackedKind or whatnot).
*/
struct AElemI { SSATmp* arr; int64_t idx; };
/*
* A location inside of an array, with base `arr', with a string key. The
* `arr' tmp is any kind of array.
*/
struct AElemS { SSATmp* arr; const StringData* key; };
/*
* A range of the stack, starting at `offset' from the outermost frame pointer,
* and extending `size' slots deeper into the stack (toward lower memory
* addresses). The frame pointer is the same for all stack ranges in the IR
* unit, and thus is not stored here. The reason ranges extend downward is
* that it is common to need to refer to the class of all stack locations below
* some depth (this can be done by putting INT32_MAX in the size).
*
* Some notes on how the evaluation stack is treated for alias analysis:
*
* o Since AStack locations are always canonicalized, different AStack
* locations must not alias if there is no overlap in the ranges.
*
* o In situations with inlined calls, we may in fact have AFrame locations
* that refer to the same concrete memory locations (in the evaluation
* stack) as other AStack locations in the same HHIR program. However, the
* portions of the HHIR program that may use that memory location in either
* of those ways may not overlap, based on the HHBC semantics of function
* calls and eval stack usage. (This may seem odd, but it's not really any
* different from knowing that a physical portion of the heap may be
* treated as both an AElemI or AProp, but not at the same time based on
* HHBC-level semantics.)
*/
struct AStack {
// We can create an AStack from either a stack pointer or a frame pointer.
// These constructors canonicalize the offset to be relative to the outermost
// frame pointer.
explicit AStack(SSATmp* fp, FPRelOffset offset, int32_t size);
explicit AStack(SSATmp* sp, IRSPRelOffset offset, int32_t size);
explicit AStack(FPRelOffset o, int32_t s) : offset(o), size(s) {}
FPRelOffset offset;
int32_t size;
};
/*
* A RefData referenced by a BoxedCell.
*/
struct ARef { SSATmp* boxed; };
//////////////////////////////////////////////////////////////////////
struct AliasClass {
enum rep : uint32_t { // bits for various location classes
BEmpty = 0,
// The relative order of the values are used in operator| to decide
// which specialization is more useful.
BFrame = 1 << 0,
BIterPos = 1 << 1,
BIterBase = 1 << 2,
BProp = 1 << 3,
BElemI = 1 << 4,
BElemS = 1 << 5,
BStack = 1 << 6,
BRef = 1 << 7,
// Have no specialization, put them last.
BMITempBase = 1 << 8,
BMITvRef = 1 << 9,
BMITvRef2 = 1 << 10,
BMIBase = 1 << 11,
BElem = BElemI | BElemS,
BHeap = BElem | BProp | BRef,
BMIStateTV = BMITempBase | BMITvRef | BMITvRef2,
BMIState = BMIStateTV | BMIBase,
BUnknownTV = ~(BIterPos | BIterBase | BMIBase),
BUnknown = static_cast<uint32_t>(-1),
};
/*
* A hashing function for alias classes.
*/
struct Hash { size_t operator()(AliasClass) const; };
/*
* Create an alias class from a bit representation. Usually you should use
* one of the other functions to create these.
*/
explicit AliasClass(rep bits) : m_bits{bits} {}
/*
* Create an alias class with more precise specialized information about
* where it is.
*/
/* implicit */ AliasClass(AFrame);
/* implicit */ AliasClass(AIterPos);
/* implicit */ AliasClass(AIterBase);
/* implicit */ AliasClass(AProp);
/* implicit */ AliasClass(AElemI);
/* implicit */ AliasClass(AElemS);
/* implicit */ AliasClass(AStack);
/* implicit */ AliasClass(ARef);
/*
* Exact equality.
*/
bool operator==(AliasClass) const;
bool operator!=(AliasClass o) const { return !(*this == o); }
/*
* Return an AliasClass that is the precise union of this class and another
* class, or folly::none if that precise union cannot be represented.
*
* Guaranteed to be commutative.
*/
folly::Optional<AliasClass> precise_union(AliasClass) const;
/*
* Create an alias class that is at least as big as the true union of this
* alias class and another one.
*
* If this.precise_union(o) is not folly::none, this function is guaranteed
* to return *this.precise_union(o). Otherwise it may return an arbitrary
* AliasClass bigger than the (unrepresentable) true union---callers should
* not rely on specifics about how much bigger it is.
*
* Guaranteed to be commutative.
*/
AliasClass operator|(AliasClass o) const;
AliasClass& operator|=(AliasClass o) { return *this = *this | o; }
/*
* Returns whether this alias class is a non-strict-subset of another one.
*/
bool operator<=(AliasClass) const;
/*
* Returns whether an alias class could possibly refer to the same concrete
* memory location as another one. Basically, do they have a non-empty
* intersection.
*/
bool maybe(AliasClass) const;
/*
* Returns whether the alias class contains a single location.
*/
bool isSingleLocation() const;
/*
* Conditionally access specific known information of various kinds.
*
* Returns folly::none if this alias class has no specialization in that way.
*/
folly::Optional<AFrame> frame() const;
folly::Optional<AIterPos> iterPos() const;
folly::Optional<AIterBase> iterBase() const;
folly::Optional<AProp> prop() const;
folly::Optional<AElemI> elemI() const;
folly::Optional<AElemS> elemS() const;
folly::Optional<AStack> stack() const;
folly::Optional<ARef> ref() const;
/*
* Conditionally access specific known information, but also checking that
* that is the only major category contained in this AliasClass.
*
* I.e., cls.is_foo() is semantically equivalent to:
*
* cls <= AFooAny ? cls.foo() : folly::none
*/
folly::Optional<AFrame> is_frame() const;
folly::Optional<AIterPos> is_iterPos() const;
folly::Optional<AIterBase> is_iterBase() const;
folly::Optional<AProp> is_prop() const;
folly::Optional<AElemI> is_elemI() const;
folly::Optional<AElemS> is_elemS() const;
folly::Optional<AStack> is_stack() const;
folly::Optional<ARef> is_ref() const;
/*
* Like the other foo() and is_foo() methods, but since we don't have an
* AMIState anymore, these return AliasClass instead.
*/
folly::Optional<AliasClass> mis() const;
folly::Optional<AliasClass> is_mis() const;
private:
enum class STag {
None,
Frame,
IterPos,
IterBase,
Prop,
ElemI,
ElemS,
Stack,
Ref,
IterBoth, // A union of base and pos for the same iter.
};
struct UIterBoth { SSATmp* fp; uint32_t id; };
private:
friend std::string show(AliasClass);
friend AliasClass canonicalize(AliasClass);
bool checkInvariants() const;
bool equivData(AliasClass) const;
bool subclassData(AliasClass) const;
bool diffSTagSubclassData(rep relevant_bits, AliasClass) const;
bool maybeData(AliasClass) const;
bool diffSTagMaybeData(rep relevant_bits, AliasClass) const;
folly::Optional<UIterBoth> asUIter() const;
bool refersToSameIterHelper(AliasClass) const;
static folly::Optional<AliasClass>
precise_diffSTag_unionData(rep newBits, AliasClass, AliasClass);
static AliasClass unionData(rep newBits, AliasClass, AliasClass);
static rep stagBits(STag tag);
private:
rep m_bits;
STag m_stag{STag::None};
union {
AFrame m_frame;
AIterPos m_iterPos;
AIterBase m_iterBase;
AProp m_prop;
AElemI m_elemI;
AElemS m_elemS;
AStack m_stack;
ARef m_ref;
UIterBoth m_iterBoth;
};
};
//////////////////////////////////////////////////////////////////////
/* General alias classes. */
auto const AEmpty = AliasClass{AliasClass::BEmpty};
auto const AFrameAny = AliasClass{AliasClass::BFrame};
auto const AIterPosAny = AliasClass{AliasClass::BIterPos};
auto const AIterBaseAny = AliasClass{AliasClass::BIterBase};
auto const APropAny = AliasClass{AliasClass::BProp};
auto const AHeapAny = AliasClass{AliasClass::BHeap};
auto const ARefAny = AliasClass{AliasClass::BRef};
auto const AStackAny = AliasClass{AliasClass::BStack};
auto const AElemIAny = AliasClass{AliasClass::BElemI};
auto const AElemSAny = AliasClass{AliasClass::BElemS};
auto const AElemAny = AliasClass{AliasClass::BElem};
auto const AMIStateTV = AliasClass{AliasClass::BMIStateTV};
auto const AMIStateAny = AliasClass{AliasClass::BMIState};
auto const AUnknownTV = AliasClass{AliasClass::BUnknownTV};
auto const AUnknown = AliasClass{AliasClass::BUnknown};
/* Alias classes for specific MInstrState fields. */
auto const AMIStateTempBase = AliasClass{AliasClass::BMITempBase};
auto const AMIStateTvRef = AliasClass{AliasClass::BMITvRef};
auto const AMIStateTvRef2 = AliasClass{AliasClass::BMITvRef2};
auto const AMIStateBase = AliasClass{AliasClass::BMIBase};
//////////////////////////////////////////////////////////////////////
/*
* Creates an AliasClass given an offset into MInstrState.
*/
AliasClass mis_from_offset(size_t);
/*
* Replace any SSATmps in an AliasClass with their canonical name (chasing
* passthrough instructions as with canonical() from analysis.h.)
*/
AliasClass canonicalize(AliasClass);
/*
* Produce a debug string for an alias class.
*/
std::string show(AliasClass);
//////////////////////////////////////////////////////////////////////
}}
#endif