-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathruntime.c
375 lines (311 loc) · 11.8 KB
/
runtime.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
#include <inttypes.h>
#include <stdlib.h>
#include <stdio.h>
#include <assert.h>
#include "runtime.h"
// Often misunderstood static global variables in C are not
// accessible to code outside of the module.
// No one besides the collector ever needs to know tospace exists.
static int64_t* tospace_begin;
static int64_t* tospace_end;
// initialized it set during initialization of the heap, and can be
// checked in order to ensure that initialization has occurred.
static int initialized = 0;
/*
Object Tag (64 bits)
#b|- 7 bit unused -|- 50 bit field [50, 0] -| 6 bits length -| 1 bit isNotForwarding Pointer
* If the bottom-most bit is zero, the tag is really a forwarding pointer.
* Otherwise, its an object tag. In that case, the next
6 bits give the length of the object (max of 50 64-bit words).
The next 50 bits say where there are pointers.
A '1' is a pointer, a '0' is not a pointer.
*/
static const int TAG_IS_NOT_FORWARD_MASK = 1;
static const int TAG_LENGTH_MASK = 126;
static const int TAG_LENGTH_RSHIFT = 1;
static const int TAG_PTR_BITFIELD_RSHIFT = 7;
// Check to see if a tag is actually a forwarding pointer.
static inline int is_forwarding(int64_t tag) {
return !(tag & TAG_IS_NOT_FORWARD_MASK);
}
// Get the length field out of a tag.
static inline int get_length(int64_t tag){
return (tag & TAG_LENGTH_MASK) >> TAG_LENGTH_RSHIFT;
}
// Get the "is pointer bitfield" out of a tag.
static inline int64_t get_ptr_bitfield(int64_t tag){
return tag >> TAG_PTR_BITFIELD_RSHIFT;
}
// initialize the state of the collector so that allocations can occur
void initialize(uint64_t rootstack_size, uint64_t heap_size)
{
// 1. Check to make sure that our assumptions about the world are correct.
assert(sizeof(int64_t) == sizeof(int64_t*));
assert((heap_size % sizeof(int64_t)) == 0);
assert((rootstack_size % sizeof(int64_t)) == 0);
// 2. Allocate memory (You should always check if malloc gave you memory)
if (!(fromspace_begin = malloc(heap_size))) {
printf("Failed to malloc %" PRIu64 " byte fromspace\n", heap_size);
exit(EXIT_FAILURE);
}
if (!(tospace_begin = malloc(heap_size))) {
printf("Failed to malloc %" PRIu64 " byte tospace\n", heap_size);
exit(EXIT_FAILURE);
}
if (!(rootstack_begin = malloc(rootstack_size))) {
printf("Failed to malloc %" PRIu64 " byte rootstack", rootstack_size);
exit(EXIT_FAILURE);
}
// 2.5 Calculate the ends memory we are using.
// Note: the pointers are for a half open interval [begin, end)
fromspace_end = fromspace_begin + (heap_size / sizeof(int64_t));
tospace_end = tospace_begin + (heap_size / sizeof(int64_t));
rootstack_end = rootstack_begin + (rootstack_size / sizeof(int64_t));
// 3 Initialize the global free pointer
free_ptr = fromspace_begin;
// Useful for debugging
initialized = 1;
}
// cheney implements cheney's copying collection algorithm
// There is a stub and explaination below.
static void cheney(int64_t** rootstack_ptr);
void collect(int64_t** rootstack_ptr, uint64_t bytes_requested)
{
// 1. Check our assumptions about the world
assert(initialized);
assert(rootstack_ptr >= rootstack_begin);
assert(rootstack_ptr < rootstack_end);
#ifndef NDEBUG
// All pointers in the rootstack point to fromspace
for(unsigned int i = 0; rootstack_begin + i < rootstack_ptr; i++){
int64_t* a_root = rootstack_begin[i];
assert(fromspace_begin <= a_root && a_root < fromspace_end);
}
#endif
// 2. Perform collection
cheney(rootstack_ptr);
// 3. Check if collection freed enough space in order to allocate
if (sizeof(int64_t) * (fromspace_end - free_ptr) < bytes_requested){
/*
If there is not enough room left for the bytes_requested,
allocate larger tospace and fromspace.
In order to determine the new size of the heap double the
heap size until it is bigger than the occupied portion of
the heap plus the bytes requested.
This covers the corner case of heaps objects that are
more than half the size of the heap. No a very likely
scenario but slightly more robust.
One corner case that isn't handled is if the heap is size
zero. My thought is that malloc probably wouldn't give
back a pointer if you asked for 0 bytes. Thus initialize
would fail, but our runtime-config.rkt file has a contract
on the heap_size parameter that the code generator uses
to determine initial heap size to this is a non-issue
in reality.
*/
unsigned long occupied_bytes = (free_ptr - fromspace_begin) * sizeof(int64_t);
unsigned long needed_bytes = occupied_bytes + bytes_requested;
unsigned long old_len = fromspace_end - fromspace_begin;
unsigned long old_bytes = old_len * sizeof(int64_t);
unsigned long new_bytes = old_bytes;
while (new_bytes < needed_bytes) new_bytes = 2 * new_bytes;
// Free and allocate a new tospace of size new_bytes
free(tospace_begin);
if (!(tospace_begin = malloc(new_bytes))) {
printf("failed to malloc %ld byte fromspace", new_bytes);
exit(EXIT_FAILURE);
}
tospace_end = tospace_begin + new_bytes / (sizeof(int64_t));
// The pointers on the stack and in the heap must be updated,
// so this cannot be just a memcopy of the heap.
// Performing cheney's algorithm again will have the correct
// effect, and we have already implemented it.
cheney(rootstack_ptr);
// Cheney flips tospace and fromspace. Thus, we allocate another
// tospace not fromspace as we might expect.
free(tospace_begin);
if (!(tospace_begin = malloc(new_bytes))) {
printf("failed to malloc %ld byte tospace", new_bytes);
exit(EXIT_FAILURE);
}
tospace_end = tospace_begin + new_bytes / (sizeof(int64_t));
}
assert(free_ptr < fromspace_end);
assert(free_ptr >= fromspace_begin);
#ifndef NDEBUG
// All pointers in the rootstack point to fromspace
for(unsigned long i = 0; rootstack_begin + i < rootstack_ptr; i++){
int64_t* a_root = rootstack_begin[i];
assert(fromspace_begin <= a_root && a_root < fromspace_end);
}
// All pointers in fromspace point to fromspace
int64_t* scan_ptr = fromspace_begin;
while(scan_ptr != free_ptr){
int64_t tag = *scan_ptr;
unsigned char len = get_length(tag);
int64_t isPtrBits = get_ptr_bitfield(tag);
int64_t* data = scan_ptr + 1;
scan_ptr = scan_ptr + len + 1;
for(unsigned char i = 0; i < len; i++){
if ((isPtrBits >> i) & 1){
int64_t* ptr = (int64_t*) data[i];
assert(ptr < fromspace_end);
assert(ptr >= fromspace_begin);
}
}
}
#endif
}
// copy_vector is responsible for doing a pointer oblivious
// move of vector data and updating the vector pointer with
// the new address of the data.
// There is a stub and explaination for copy_vector below.
static void copy_vector(int64_t** vector_ptr_loc);
/*
The cheney algorithm takes a pointer to the top of the rootstack.
It resets the free pointer to be at the begining of tospace, copies
(or reallocates) the data pointed to by the roots into tospace and
replaces the pointers in the rootset with pointers to the
copies. (See the description of copy_vector below).
While this initial copying of root vectors is occuring the free_ptr
has been maintained to remain at the next free memory location in
tospace. Cheney's algorithm then scans a vector at a time until it
reaches the free_ptr.
At each vector we use the meta information stored in the vector tag
to find the length of the vector and tell which fields inside the
vector are vector pointers. Each new vector pointer must have its
data copied and every vector pointer must be updated to to point to
the copied data. (The description of copy_vector will help keep this
organized.
This process is a breadth first graph traversal. Copying a vector
places its contents at the end of a Fifo queue and scanning a vector
removes it. Eventually the graph traversal will run out of unseen
nodes "catch up" to the free pointer. When this occurs we know that
all live data in the program is contained by tospace, and that
everything left in fromspace is unreachable by the program.
After this point the free pointer will be pointing into what until
now we considered tospace. This means the program will allocate
object here. In order to keep track of the we "flip" fromspace and
tospace by making the fromspace pointers point to tospace and vice
versa.
*/
void cheney(int64_t** rootstack_ptr)
{
}
/*
copy_vector takes a pointer, (`location`) to a vector pointer,
copies the vector data from fromspace into tospace, and updates the
vector pointer so that it points to the the data's new address in
tospace.
Precondition:
* original vector pointer location
|
V
[*] old vector pointer
|
+-> [tag or forwarding pointer | ? | ? | ? | ...] old vector data
Postcondition:
* original vector pointer location
|
V
[*] new vector pointer
|
| [ * forwarding pointer | ? | ? | ? | ...] old vector data
| |
| V
+---->[tag | ? | ? | ? | ...] new vector data
Since multiple pointers to the same vector can exist within the
memory of the program this may or may not be the first time
we called `copy_vector` on a location that contains this old vector
pointer. In order to tell if we have copied the old vector data previously we
check the vector information tag (`tag = old_vector_pointer[0]`).
If the forwarding bit is set, then is_forwarding(tag) will return
false and we know we haven't already copied the data. In order to
figure out how much data to copy we can inspect the tag's length
field. The length field indicates the number of 64-bit words the
array is storing for the user, so we need to copy `length + 1` words
in total, including the tag. After performing the
copy we need to leave a forwarding pointer in old data's tag field
to indicate the new address to subsequent copy_vector calls for this
vector pointer. Furthermore, we need to store the new vector's pointer
at the location where where we found the old vector pointer.
If the tag is a forwarding pointer, the `is_forwarding(tag) will return
true and we need to update the location storing the old vector pointer to
point to the new data instead).
As a side note any time you are allocating new data you must maintain
the invariant that the free_ptr points to the next free memory address.
*/
void copy_vector(int64_t** vector_ptr_loc)
{
}
// Read an integer from stdin
int64_t read_int() {
int64_t i;
scanf("%" SCNd64, &i);
return i;
}
// print an integer to stdout
void print_int(int64_t x) {
printf("%" PRId64, x);
}
// print a bool to stdout
void print_bool(int64_t x) {
if (x){
printf("#t");
} else {
printf("#f");
}
}
void print_void() {
printf("#<void>");
}
void print_vecbegin() {
printf("#(");
}
void print_space() {
printf(" ");
}
void print_vecend() {
printf(")");
}
void print_ellipsis() {
printf("#(...)");
}
#define ANY_TAG_MASK 3
#define ANY_TAG_LEN 2
#define ANY_TAG_INT 0
#define ANY_TAG_BOOL 1
#define ANY_TAG_VEC 2
#define ANY_TAG_FUN 3
int any_tag(int64_t any) {
return any & ANY_TAG_MASK;
}
/* to do: need to cycle detection. -Jeremy */
void print_any(int64_t any) {
switch (any_tag(any)) {
case ANY_TAG_INT:
printf("%" PRId64, any >> ANY_TAG_LEN);
break;
case ANY_TAG_BOOL:
if (any >> ANY_TAG_LEN) {
printf("#t");
} else {
printf("#f");
}
break;
case ANY_TAG_VEC: {
int64_t* vector_ptr = (int64_t*) (any & ~ANY_TAG_MASK);
int64_t tag = vector_ptr[0];
unsigned char len = get_length(tag);
printf("#(");
for (int i = 0; i != len; ++i) {
print_any(vector_ptr[i + 1]);
}
printf(")");
break;
}
case ANY_TAG_FUN:
printf("#<procedure>");
break;
}
}