Import boehm-gc snapshot, taken from
[official-gcc.git] / boehm-gc / include / private / gc_pmark.h
blob def4a91799d00fbad891b868ab0f5c6248b13f32
/*
 * Copyright (c) 1991-1994 by Xerox Corporation.  All rights reserved.
 * Copyright (c) 2001 by Hewlett-Packard Company. All rights reserved.
 *
 * THIS MATERIAL IS PROVIDED AS IS, WITH ABSOLUTELY NO WARRANTY EXPRESSED
 * OR IMPLIED.  ANY USE IS AT YOUR OWN RISK.
 *
 * Permission is hereby granted to use or copy this program
 * for any purpose, provided the above notices are retained on all copies.
 * Permission to modify the code and to distribute modified code is granted,
 * provided the above notices are retained, and a notice that the code was
 * modified is included with the above copyright notice.
 *
 */

/* Private declarations of GC marker data structures and macros */

/*
 * Declarations of mark stack.  Needed by marker and client supplied mark
 * routines.  Transitively include gc_priv.h.
 */
22 #ifndef GC_PMARK_H
23 #define GC_PMARK_H
25 #ifdef HAVE_CONFIG_H
26 # include "config.h"
27 #endif
29 #ifndef GC_BUILD
30 # define GC_BUILD
31 #endif
33 #if defined(KEEP_BACK_PTRS) || defined(PRINT_BLACK_LIST)
34 # include "dbg_mlc.h"
35 #endif
37 #ifndef GC_MARK_H
38 # include "../gc_mark.h"
39 #endif
41 #ifndef GC_PRIVATE_H
42 # include "gc_priv.h"
43 #endif
/* The real declaration of the following is in gc_priv.h, so that      */
/* we can avoid scanning the following table.  It is shown here for    */
/* reference only and must stay commented out: an uncommented copy     */
/* would define the array in every file that includes this header.     */
/*
mark_proc GC_mark_procs[MAX_MARK_PROCS];
*/
/* Defaults to the size of one word unless the build has already       */
/* supplied its own value.                                             */
#ifndef MARK_DESCR_OFFSET
# define MARK_DESCR_OFFSET sizeof(word)
#endif
/*
 * Mark descriptor stuff that should remain private for now, mostly
 * because it's hard to export WORDSZ without including gcconfig.h.
 */

/* Bits of a descriptor word left over after the tag bits.             */
#define BITMAP_BITS (WORDSZ - GC_DS_TAG_BITS)

/* Entry of GC_mark_procs selected by the index field that sits just   */
/* above the tag bits of descr.                                        */
#define PROC(descr) \
      (GC_mark_procs[((descr) >> GC_DS_TAG_BITS) & (GC_MAX_MARK_PROCS-1)])

/* Everything in descr above the tag bits and the procedure index.     */
#define ENV(descr) \
      ((descr) >> (GC_DS_TAG_BITS + GC_LOG_MAX_MARK_PROCS))

/* Largest value that fits in the field extracted by ENV().            */
#define MAX_ENV \
      (((word)1 << (WORDSZ - GC_DS_TAG_BITS - GC_LOG_MAX_MARK_PROCS)) - 1)
67 GC_EXTERN unsigned GC_n_mark_procs;
69 /* Number of mark stack entries to discard on overflow. */
70 #define GC_MARK_STACK_DISCARDS (INITIAL_MARK_STACK_SIZE/8)
72 typedef struct GC_ms_entry {
73 ptr_t mse_start; /* First word of object, word aligned. */
74 union word_ptr_ao_u mse_descr;
75 /* Descriptor; low order two bits are tags, */
76 /* as described in gc_mark.h. */
77 } mse;
79 GC_EXTERN size_t GC_mark_stack_size;
81 GC_EXTERN mse * GC_mark_stack_limit;
83 #ifdef PARALLEL_MARK
84 GC_EXTERN mse * volatile GC_mark_stack_top;
85 /* FIXME: Use union to avoid casts to AO_t */
86 #else
87 GC_EXTERN mse * GC_mark_stack_top;
88 #endif
90 GC_EXTERN mse * GC_mark_stack;
#ifdef PARALLEL_MARK
    /*
     * Allow multiple threads to participate in the marking process.
     * This works roughly as follows:
     *  The main mark stack never shrinks, but it can grow.
     *
     *  The initiating thread holds the GC lock, and sets GC_help_wanted.
     *
     *  Other threads:
     *     1) update helper_count (while holding mark_lock.)
     *     2) allocate a local mark stack
     *     repeatedly:
     *          3) Steal a global mark stack entry by atomically replacing
     *             its descriptor with 0.
     *          4) Copy it to the local stack.
     *          5) Mark on the local stack until it is empty, or
     *             it may be profitable to copy it back.
     *          6) If necessary, copy local stack to global one,
     *             holding mark lock.
     *    7) Stop when the global mark stack is empty.
     *    8) decrement helper_count (holding mark_lock).
     *
     * This is an experiment to see if we can do something along the lines
     * of the University of Tokyo SGC in a less intrusive, though probably
     * also less performant, way.
     */

    /* GC_mark_stack_top is protected by mark lock.     */

    /*
     * GC_notify_all_marker() is used when GC_help_wanted is first set,
     * when the last helper becomes inactive,
     * when something is added to the global mark stack, and just after
     * GC_mark_no is incremented.
     * This could be split into multiple CVs (and probably should be to
     * scale to really large numbers of processors.)
     */
#endif /* PARALLEL_MARK */
131 GC_INNER mse * GC_signal_mark_stack_overflow(mse *msp);
/* Push the object obj with corresponding heap block header hhdr onto  */
/* the mark stack.  Nothing is pushed when the block's descriptor      */
/* (hb_descr) is zero.  mark_stack_top is advanced before the entry is */
/* written; if it reaches mark_stack_limit it is first replaced by the */
/* value returned from GC_signal_mark_stack_overflow().                */
/* mark_stack_top must be a modifiable lvalue.                         */
#define PUSH_OBJ(obj, hhdr, mark_stack_top, mark_stack_limit) \
{ \
    register word _descr = (hhdr) -> hb_descr; \
    GC_ASSERT(!HBLK_IS_FREE(hhdr)); \
    if (_descr != 0) { \
        mark_stack_top++; \
        if ((word)mark_stack_top >= (word)(mark_stack_limit)) { \
          mark_stack_top = GC_signal_mark_stack_overflow(mark_stack_top); \
        } \
        mark_stack_top -> mse_start = (obj); \
        mark_stack_top -> mse_descr.w = _descr; \
    } \
}
/* Push the contents of current onto the mark stack if it is a valid   */
/* ptr to a currently unmarked object.  Mark it.                       */
/* If we assumed a standard-conforming compiler, we could probably     */
/* generate the exit_label transparently.                              */
/* The header is looked up with HC_GET_HDR and the real work is done   */
/* by PUSH_CONTENTS_HDR with offset checking enabled.  exit_label is   */
/* defined inside the expansion, so each use within one function needs */
/* its own label name.                                                 */
#define PUSH_CONTENTS(current, mark_stack_top, mark_stack_limit, \
                      source, exit_label) \
{ \
    hdr * my_hhdr; \
    HC_GET_HDR(current, my_hhdr, source, exit_label); \
    PUSH_CONTENTS_HDR(current, mark_stack_top, mark_stack_limit, \
                  source, exit_label, my_hhdr, TRUE); \
exit_label: ; \
}
/* Set mark bit, exit if it was already set.                           */
/* SET_MARK_BIT_EXIT_IF_SET(hhdr, bit_no, exit_label) sets mark number */
/* bit_no in the header hhdr; if it was already set, control jumps to  */
/* exit_label instead of falling through.                              */
#ifdef USE_MARK_BYTES
  /* There is a race here, and we may set                               */
  /* the bit twice in the concurrent case.  This can result in the      */
  /* object being pushed twice.  But that's only a performance issue.   */
# define SET_MARK_BIT_EXIT_IF_SET(hhdr,bit_no,exit_label) \
    { \
        char * mark_byte_addr = (char *)((hhdr) -> hb_marks) + (bit_no); \
        if (*mark_byte_addr) goto exit_label; \
        *mark_byte_addr = 1; \
    }
#else
# ifdef PARALLEL_MARK
    /* This is used only if we explicitly set USE_MARK_BITS.            */
    /* The following may fail to exit even if the bit was already set.  */
    /* For our uses, that's benign:                                     */
#   define OR_WORD_EXIT_IF_SET(addr, bits, exit_label) \
      { \
        if (!(*(addr) & (bits))) { \
          AO_or((volatile AO_t *)(addr), (AO_t)(bits)); \
        } else { \
          goto exit_label; \
        } \
      }
# else
    /* Single-threaded form: a plain read, test and write back.         */
#   define OR_WORD_EXIT_IF_SET(addr, bits, exit_label) \
      { \
         word old = *(addr); \
         word my_bits = (bits); \
         if (old & my_bits) goto exit_label; \
         *(addr) = (old | my_bits); \
      }
# endif /* !PARALLEL_MARK */
# define SET_MARK_BIT_EXIT_IF_SET(hhdr,bit_no,exit_label) \
    { \
        word * mark_word_addr = (hhdr) -> hb_marks + divWORDSZ(bit_no); \
        OR_WORD_EXIT_IF_SET(mark_word_addr, (word)1 << modWORDSZ(bit_no), \
                            exit_label); \
    }
#endif /* !USE_MARK_BYTES */
/* Add one to the hb_n_marks count of the block header hhdr.           */
/* With PARALLEL_MARK this is a separate AO_load followed by AO_store, */
/* not one atomic read-modify-write.                                   */
#ifdef PARALLEL_MARK
# define INCR_MARKS(hhdr) \
                AO_store(&(hhdr)->hb_n_marks, AO_load(&(hhdr)->hb_n_marks) + 1)
#else
# define INCR_MARKS(hhdr) (void)(++(hhdr)->hb_n_marks)
#endif
/* Debug tracing hooks.  With ENABLE_TRACE, TRACE runs cmd when source */
/* equals the non-zero GC_trace_addr, and TRACE_TARGET runs cmd when   */
/* target equals the pointer stored at GC_trace_addr.  Without         */
/* ENABLE_TRACE both expand to nothing.                                */
/* Both expand to an unbraced "if", so do not use them as the body of  */
/* an if that has an else.                                             */
#ifdef ENABLE_TRACE
# define TRACE(source, cmd) \
        if (GC_trace_addr != 0 && (ptr_t)(source) == GC_trace_addr) cmd
# define TRACE_TARGET(target, cmd) \
        if (GC_trace_addr != 0 && (target) == *(ptr_t *)GC_trace_addr) cmd
#else
# define TRACE(source, cmd)
# define TRACE_TARGET(target, cmd)
#endif
/* Multiply x by y as unsigned values; hprod receives the product      */
/* shifted right by 32 bits and lprod its low 32 bits.  hprod and      */
/* lprod must be assignable lvalues.                                   */
#if defined(I386) && defined(__GNUC__)
  /* One "mull": low half comes back in the "a" register, high half in  */
  /* the "d" register, as the output constraints state.                 */
# define LONG_MULT(hprod, lprod, x, y) { \
    __asm__ __volatile__("mull %2" : "=a"(lprod), "=d"(hprod) \
                         : "g"(y), "0"(x)); \
  }
#else
# define LONG_MULT(hprod, lprod, x, y) { \
    unsigned long long prod = (unsigned long long)(x) \
                              * (unsigned long long)(y); \
    hprod = prod >> 32; \
    lprod = (unsigned32)prod; \
  }
#endif /* !I386 */
/* If the mark bit corresponding to current is not set, set it, and     */
/* push the contents of the object on the mark stack.  Current points   */
/* to the beginning of the object.  We rely on the fact that the        */
/* preceding header calculation will succeed for a pointer past the     */
/* first page of an object, only if it is in fact a valid pointer       */
/* to the object.  Thus we can omit the otherwise necessary tests       */
/* here.  Note in particular that the "displ" value is the displacement */
/* from the beginning of the heap block, which may itself be in the     */
/* interior of a large object.                                          */
/* When do_offset_check is true and the offset of current within its    */
/* object is not listed in GC_valid_offsets, current is black-listed    */
/* and control jumps to exit_label.  Control also jumps to exit_label   */
/* if the object was already marked.                                    */
#ifdef MARK_BIT_PER_GRANULE
# define PUSH_CONTENTS_HDR(current, mark_stack_top, mark_stack_limit, \
                           source, exit_label, hhdr, do_offset_check) \
{ \
    size_t displ = HBLKDISPL(current); /* Displacement in block; in bytes. */\
    /* displ is always within range.  If current doesn't point to       */ \
    /* first block, then we are in the all_interior_pointers case, and  */ \
    /* it is safe to use any displacement value.                        */ \
    size_t gran_displ = BYTES_TO_GRANULES(displ); \
    size_t gran_offset = (hhdr) -> hb_map[gran_displ]; \
    size_t byte_offset = displ & (GRANULE_BYTES - 1); \
    ptr_t base = (current); \
    /* The following always fails for large block references. */ \
    if (EXPECT((gran_offset | byte_offset) != 0, FALSE))  { \
        if ((hhdr) -> hb_large_block) { \
          /* gran_offset is bogus.      */ \
          size_t obj_displ; \
          base = (ptr_t)((hhdr) -> hb_block); \
          obj_displ = (ptr_t)(current) - base; \
          if (obj_displ != displ) { \
            GC_ASSERT(obj_displ < (hhdr) -> hb_sz); \
            /* Must be in all_interior_pointer case, not first block */ \
            /* already did validity check on cache miss.             */ \
          } else { \
            if (do_offset_check && !GC_valid_offsets[obj_displ]) { \
              GC_ADD_TO_BLACK_LIST_NORMAL(current, source); \
              goto exit_label; \
            } \
          } \
          gran_displ = 0; \
          GC_ASSERT((hhdr) -> hb_sz > HBLKSIZE || \
                    (hhdr) -> hb_block == HBLKPTR(current)); \
          GC_ASSERT((word)(hhdr)->hb_block <= (word)(current)); \
        } else { \
          size_t obj_displ = GRANULES_TO_BYTES(gran_offset) \
                             + byte_offset; \
          if (do_offset_check && !GC_valid_offsets[obj_displ]) { \
            GC_ADD_TO_BLACK_LIST_NORMAL(current, source); \
            goto exit_label; \
          } \
          gran_displ -= gran_offset; \
          base -= obj_displ; \
        } \
    } \
    GC_ASSERT((hhdr) == GC_find_header(base)); \
    GC_ASSERT(gran_displ % BYTES_TO_GRANULES((hhdr) -> hb_sz) == 0); \
    TRACE(source, GC_log_printf("GC:%u: passed validity tests\n", \
                                (unsigned)GC_gc_no)); \
    SET_MARK_BIT_EXIT_IF_SET(hhdr, gran_displ, exit_label); \
    TRACE(source, GC_log_printf("GC:%u: previously unmarked\n", \
                                (unsigned)GC_gc_no)); \
    TRACE_TARGET(base, \
        GC_log_printf("GC:%u: marking %p from %p instead\n", \
                      (unsigned)GC_gc_no, base, source)); \
    INCR_MARKS(hhdr); \
    GC_STORE_BACK_PTR((ptr_t)source, base); \
    PUSH_OBJ(base, hhdr, mark_stack_top, mark_stack_limit); \
}
#endif /* MARK_BIT_PER_GRANULE */
/* One-mark-bit-per-object variant of PUSH_CONTENTS_HDR.  The object    */
/* index within the block is obtained by multiplying the byte           */
/* displacement by the block's hb_inv_sz with LONG_MULT: the high half  */
/* of the product is used as the mark bit number and a non-zero upper   */
/* part of the low half signals a pointer into the interior of an       */
/* object.  When do_offset_check is true and the interior offset is     */
/* not listed in GC_valid_offsets, current is black-listed and control  */
/* jumps to exit_label; it also jumps there if the object was already   */
/* marked.                                                              */
#ifdef MARK_BIT_PER_OBJ
# define PUSH_CONTENTS_HDR(current, mark_stack_top, mark_stack_limit, \
                           source, exit_label, hhdr, do_offset_check) \
{ \
    size_t displ = HBLKDISPL(current); /* Displacement in block; in bytes. */\
    unsigned32 low_prod, high_prod; \
    unsigned32 inv_sz = (hhdr) -> hb_inv_sz; \
    ptr_t base = (current); \
    LONG_MULT(high_prod, low_prod, displ, inv_sz); \
    /* product is > and within sz_in_bytes of displ * sz_in_bytes * 2**32 */ \
    if (EXPECT(low_prod >> 16 != 0, FALSE))  { \
      /* FIXME: fails if offset is a multiple of HBLKSIZE which becomes 0 */ \
        if (inv_sz == LARGE_INV_SZ) { \
          size_t obj_displ; \
          base = (ptr_t)((hhdr) -> hb_block); \
          obj_displ = (ptr_t)(current) - base; \
          if (obj_displ != displ) { \
            GC_ASSERT(obj_displ < (hhdr) -> hb_sz); \
            /* Must be in all_interior_pointer case, not first block */ \
            /* already did validity check on cache miss.             */ \
          } else { \
            if (do_offset_check && !GC_valid_offsets[obj_displ]) { \
              GC_ADD_TO_BLACK_LIST_NORMAL(current, source); \
              goto exit_label; \
            } \
          } \
          GC_ASSERT((hhdr) -> hb_sz > HBLKSIZE || \
                    (hhdr) -> hb_block == HBLKPTR(current)); \
          GC_ASSERT((word)(hhdr)->hb_block < (word)(current)); \
        } else { \
          /* Declared ahead of the static assertion so that no          */ \
          /* declaration follows a statement.                           */ \
          size_t obj_displ; \
          /* Accurate enough if HBLKSIZE <= 2**15.      */ \
          GC_STATIC_ASSERT(HBLKSIZE <= (1 << 15)); \
          obj_displ = (((low_prod >> 16) + 1) * ((hhdr)->hb_sz)) >> 16; \
          if (do_offset_check && !GC_valid_offsets[obj_displ]) { \
            GC_ADD_TO_BLACK_LIST_NORMAL(current, source); \
            goto exit_label; \
          } \
          base -= obj_displ; \
        } \
    } \
    /* May get here for pointer to start of block not at        */ \
    /* beginning of object.  If so, it's valid, and we're fine. */ \
    /* high_prod is unsigned, so only the upper bound is checked. */ \
    GC_ASSERT(high_prod <= HBLK_OBJS((hhdr) -> hb_sz)); \
    TRACE(source, GC_log_printf("GC:%u: passed validity tests\n", \
                                (unsigned)GC_gc_no)); \
    SET_MARK_BIT_EXIT_IF_SET(hhdr, high_prod, exit_label); \
    TRACE(source, GC_log_printf("GC:%u: previously unmarked\n", \
                                (unsigned)GC_gc_no)); \
    TRACE_TARGET(base, \
        GC_log_printf("GC:%u: marking %p from %p instead\n", \
                      (unsigned)GC_gc_no, base, source)); \
    INCR_MARKS(hhdr); \
    GC_STORE_BACK_PTR((ptr_t)source, base); \
    PUSH_OBJ(base, hhdr, mark_stack_top, mark_stack_limit); \
}
#endif /* MARK_BIT_PER_OBJ */
/* Hand p to GC_mark_and_push_stack().  The source address is passed   */
/* along only in the PRINT_BLACK_LIST and KEEP_BACK_PTRS builds;       */
/* otherwise it is dropped.                                            */
#if defined(PRINT_BLACK_LIST) || defined(KEEP_BACK_PTRS)
# define PUSH_ONE_CHECKED_STACK(p, source) \
        GC_mark_and_push_stack((ptr_t)(p), (ptr_t)(source))
#else
# define PUSH_ONE_CHECKED_STACK(p, source) \
        GC_mark_and_push_stack((ptr_t)(p))
#endif
/*
 * Push a single value onto mark stack. Mark from the object pointed to by p.
 * Invoke FIXUP_POINTER(p) before any further processing.
 * P is considered valid even if it is an interior pointer.
 * Previously marked objects are not pushed.  Hence we make progress even
 * if the mark stack overflows.
 *
 * p is pushed only when it lies in the half-open range
 * [GC_least_plausible_heap_addr, GC_greatest_plausible_heap_addr).
 * The expansion is one or more unbraced "if" statements, so wrap a use
 * in braces when it is the body of another if/else or loop.
 */

#if NEED_FIXUP_POINTER
    /* Try both the raw version and the fixed up one.   */
#   define GC_PUSH_ONE_STACK(p, source) \
      if ((word)(p) >= (word)GC_least_plausible_heap_addr \
         && (word)(p) < (word)GC_greatest_plausible_heap_addr) { \
         PUSH_ONE_CHECKED_STACK(p, source); \
      } \
      FIXUP_POINTER(p); \
      if ((word)(p) >= (word)GC_least_plausible_heap_addr \
         && (word)(p) < (word)GC_greatest_plausible_heap_addr) { \
         PUSH_ONE_CHECKED_STACK(p, source); \
      }
#else /* !NEED_FIXUP_POINTER */
#   define GC_PUSH_ONE_STACK(p, source) \
      if ((word)(p) >= (word)GC_least_plausible_heap_addr \
         && (word)(p) < (word)GC_greatest_plausible_heap_addr) { \
         PUSH_ONE_CHECKED_STACK(p, source); \
      }
#endif
/* As above, but interior pointer recognition as for normal heap pointers. */
/* FIXUP_POINTER(p) is applied first; if p then lies in the plausible      */
/* heap range, mark_stack_top is replaced by the result of                 */
/* GC_mark_and_push().  mark_stack_top must be a modifiable lvalue.        */
#define GC_PUSH_ONE_HEAP(p,source,mark_stack_top) \
{ \
    FIXUP_POINTER(p); \
    if ((word)(p) >= (word)GC_least_plausible_heap_addr \
         && (word)(p) < (word)GC_greatest_plausible_heap_addr) \
      mark_stack_top = GC_mark_and_push((void *)(p), mark_stack_top, \
                                GC_mark_stack_limit, (void * *)(source)); \
}
407 /* Mark starting at mark stack entry top (incl.) down to */
408 /* mark stack entry bottom (incl.). Stop after performing */
409 /* about one page worth of work. Return the new mark stack */
410 /* top entry. */
411 GC_INNER mse * GC_mark_from(mse * top, mse * bottom, mse *limit);
/* Run GC_mark_from() once over the global mark stack and store the    */
/* returned top back into GC_mark_stack_top.  The expansion already    */
/* ends in a semicolon, which is kept for existing callers.            */
#define MARK_FROM_MARK_STACK() \
        GC_mark_stack_top = GC_mark_from(GC_mark_stack_top, \
                                         GC_mark_stack, \
                                         GC_mark_stack + GC_mark_stack_size);

/* True when the top pointer is below the first mark stack entry.      */
#define GC_mark_stack_empty() ((word)GC_mark_stack_top < (word)GC_mark_stack)
/*
 * Mark from one finalizable object using the specified
 * mark proc. May not mark the object pointed to by
 * real_ptr. That is the job of the caller, if appropriate.
 * Note that this is called with the mutator running, but
 * with us holding the allocation lock.  This is safe only if the
 * mutator needs the allocation lock to reveal hidden pointers.
 * FIXME: Why do we need the GC_mark_state test below?
 *
 * After mark_proc has run, the mark stack is drained.  If the mark
 * state is then anything other than MS_NONE, real_ptr is marked and
 * GC_mark_some() is called repeatedly until it returns non-zero.
 */
#define GC_MARK_FO(real_ptr, mark_proc) \
{ \
    (*(mark_proc))(real_ptr); \
    while (!GC_mark_stack_empty()) MARK_FROM_MARK_STACK(); \
    if (GC_mark_state != MS_NONE) { \
        GC_set_mark_bit(real_ptr); \
        while (!GC_mark_some((ptr_t)0)) {} \
    } \
}
439 GC_EXTERN GC_bool GC_mark_stack_too_small;
440 /* We need a larger mark stack. May be */
441 /* set by client supplied mark routines.*/
typedef int mark_state_t;       /* Current state of marking, as follows:*/
                                /* Used to remember where we are during */
                                /* concurrent marking.                  */

                                /* We say something is dirty if it was  */
                                /* written since the last time we       */
                                /* retrieved dirty bits.  We say it's   */
                                /* grungy if it was marked dirty in the */
                                /* last set of bits we retrieved.       */

                                /* Invariant I: all roots and marked    */
                                /* objects p are either dirty, or point */
                                /* to objects q that are either marked  */
                                /* or a pointer to q appears in a range */
                                /* on the mark stack.                   */

#define MS_NONE 0               /* No marking in progress. I holds.     */
                                /* Mark stack is empty.                 */

#define MS_PUSH_RESCUERS 1      /* Rescuing objects are currently       */
                                /* being pushed.  I holds, except       */
                                /* that grungy roots may point to       */
                                /* unmarked objects, as may marked      */
                                /* grungy objects above scan_ptr.       */

#define MS_PUSH_UNCOLLECTABLE 2 /* I holds, except that marked          */
                                /* uncollectable objects above scan_ptr */
                                /* may point to unmarked objects.       */
                                /* Roots may point to unmarked objects. */

#define MS_ROOTS_PUSHED 3       /* I holds, mark stack may be nonempty. */

#define MS_PARTIALLY_INVALID 4  /* I may not hold, e.g. because of M.S. */
                                /* overflow.  However marked heap       */
                                /* objects below scan_ptr point to      */
                                /* marked or stacked objects.           */

#define MS_INVALID 5            /* I may not hold.                      */
482 GC_EXTERN mark_state_t GC_mark_state;
484 #endif /* GC_PMARK_H */