backgraph.c 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475
  1. /*
  2. * Copyright (c) 2001 by Hewlett-Packard Company. All rights reserved.
  3. *
  4. * THIS MATERIAL IS PROVIDED AS IS, WITH ABSOLUTELY NO WARRANTY EXPRESSED
  5. * OR IMPLIED. ANY USE IS AT YOUR OWN RISK.
  6. *
  7. * Permission is hereby granted to use or copy this program
  8. * for any purpose, provided the above notices are retained on all copies.
  9. * Permission to modify the code and to distribute modified code is granted,
  10. * provided the above notices are retained, and a notice that the code was
  11. * modified is included with the above copyright notice.
  12. *
  13. */
  14. #include "private/dbg_mlc.h"
  15. /*
  16. * This implements a full, though not well-tuned, representation of the
  17. * backwards points-to graph. This is used to test for non-GC-robust
  18. * data structures; the code is not used during normal garbage collection.
  19. *
  20. * One restriction is that we drop all back-edges from nodes with very
  21. * high in-degree, and simply add them to a list of such
  22. * nodes. They are then treated as permanent roots. If this by itself
  23. * doesn't introduce a space leak, then such nodes can't contribute to
  24. * a growing space leak.
  25. */
  26. #ifdef MAKE_BACK_GRAPH
  27. #define MAX_IN 10 /* Maximum in-degree we handle directly */
  28. /* #include <unistd.h> */
  29. #if !defined(DBG_HDRS_ALL) || (ALIGNMENT != CPP_WORDSZ/8) /* || !defined(UNIX_LIKE) */
  30. # error The configuration does not support MAKE_BACK_GRAPH
  31. #endif
  32. /* We store single back pointers directly in the object's oh_bg_ptr field. */
  33. /* If there is more than one ptr to an object, we store q | FLAG_MANY, */
  34. /* where q is a pointer to a back_edges object. */
  35. /* Every once in a while we use a back_edges object even for a single */
  36. /* pointer, since we need the other fields in the back_edges structure to */
  37. /* be present in some fraction of the objects. Otherwise we get serious */
  38. /* performance issues. */
  39. #define FLAG_MANY 2
  40. typedef struct back_edges_struct {
  41. word n_edges; /* Number of edges, including those in continuation */
  42. /* structures. */
  43. unsigned short flags;
  44. # define RETAIN 1 /* Directly points to a reachable object; */
  45. /* retain for next GC. */
  46. unsigned short height_gc_no;
  47. /* If height > 0, then the GC_gc_no value when it */
  48. /* was computed. If it was computed this cycle, then */
  49. /* it is current. If it was computed during the */
  50. /* last cycle, then it represents the old height, */
  51. /* which is only saved for live objects referenced by */
  52. /* dead ones. This may grow due to refs from newly */
  53. /* dead objects. */
  54. signed_word height;
  55. /* Longest path through unreachable nodes to this node */
  56. /* that we found using depth first search. */
  57. # define HEIGHT_UNKNOWN ((signed_word)(-2))
  58. # define HEIGHT_IN_PROGRESS ((signed_word)(-1))
  59. ptr_t edges[MAX_IN];
  60. struct back_edges_struct *cont;
  61. /* Pointer to continuation structure; we use only the */
  62. /* edges field in the continuation. */
  63. /* also used as free list link. */
  64. } back_edges;
  65. /* Allocate a new back edge structure. Should be more sophisticated */
  66. /* if this were production code. */
  67. #define MAX_BACK_EDGE_STRUCTS 100000
  68. static back_edges *back_edge_space = 0;
  69. STATIC int GC_n_back_edge_structs = 0;
  70. /* Serves as pointer to never used */
  71. /* back_edges space. */
  72. static back_edges *avail_back_edges = 0;
  73. /* Pointer to free list of deallocated */
  74. /* back_edges structures. */
  75. static back_edges * new_back_edges(void)
  76. {
  77. if (0 == back_edge_space) {
  78. back_edge_space = (back_edges *)
  79. GET_MEM(MAX_BACK_EDGE_STRUCTS*sizeof(back_edges));
  80. GC_add_to_our_memory((ptr_t)back_edge_space,
  81. MAX_BACK_EDGE_STRUCTS*sizeof(back_edges));
  82. }
  83. if (0 != avail_back_edges) {
  84. back_edges * result = avail_back_edges;
  85. avail_back_edges = result -> cont;
  86. result -> cont = 0;
  87. return result;
  88. }
  89. if (GC_n_back_edge_structs >= MAX_BACK_EDGE_STRUCTS - 1) {
  90. ABORT("Needed too much space for back edges: adjust "
  91. "MAX_BACK_EDGE_STRUCTS");
  92. }
  93. return back_edge_space + (GC_n_back_edge_structs++);
  94. }
  95. /* Deallocate p and its associated continuation structures. */
  96. static void deallocate_back_edges(back_edges *p)
  97. {
  98. back_edges *last = p;
  99. while (0 != last -> cont) last = last -> cont;
  100. last -> cont = avail_back_edges;
  101. avail_back_edges = p;
  102. }
  103. /* Table of objects that are currently on the depth-first search */
  104. /* stack. Only objects with in-degree one are in this table. */
  105. /* Other objects are identified using HEIGHT_IN_PROGRESS. */
  106. /* FIXME: This data structure NEEDS IMPROVEMENT. */
  107. #define INITIAL_IN_PROGRESS 10000
  108. static ptr_t * in_progress_space = 0;
  109. static size_t in_progress_size = 0;
  110. static size_t n_in_progress = 0;
  111. static void push_in_progress(ptr_t p)
  112. {
  113. if (n_in_progress >= in_progress_size) {
  114. if (in_progress_size == 0) {
  115. in_progress_size = INITIAL_IN_PROGRESS;
  116. in_progress_space = (ptr_t *)GET_MEM(in_progress_size * sizeof(ptr_t));
  117. GC_add_to_our_memory((ptr_t)in_progress_space,
  118. in_progress_size * sizeof(ptr_t));
  119. } else {
  120. ptr_t * new_in_progress_space;
  121. in_progress_size *= 2;
  122. new_in_progress_space = (ptr_t *)
  123. GET_MEM(in_progress_size * sizeof(ptr_t));
  124. GC_add_to_our_memory((ptr_t)new_in_progress_space,
  125. in_progress_size * sizeof(ptr_t));
  126. BCOPY(in_progress_space, new_in_progress_space,
  127. n_in_progress * sizeof(ptr_t));
  128. in_progress_space = new_in_progress_space;
  129. /* FIXME: This just drops the old space. */
  130. }
  131. }
  132. if (in_progress_space == 0)
  133. ABORT("MAKE_BACK_GRAPH: Out of in-progress space: "
  134. "Huge linear data structure?");
  135. in_progress_space[n_in_progress++] = p;
  136. }
  137. static GC_bool is_in_progress(ptr_t p)
  138. {
  139. size_t i;
  140. for (i = 0; i < n_in_progress; ++i) {
  141. if (in_progress_space[i] == p) return TRUE;
  142. }
  143. return FALSE;
  144. }
  145. GC_INLINE void pop_in_progress(ptr_t p GC_ATTR_UNUSED)
  146. {
  147. --n_in_progress;
  148. GC_ASSERT(in_progress_space[n_in_progress] == p);
  149. }
  /* Fetch the back pointer kept (in hidden form) in the oh_bg_ptr      */
  /* field of the debug header p.                                       */
  #define GET_OH_BG_PTR(p) \
                  (ptr_t)GC_REVEAL_POINTER(((oh *)(p)) -> oh_bg_ptr)

  /* Store q, in hidden form, into the oh_bg_ptr field of header p.     */
  #define SET_OH_BG_PTR(p,q) (((oh *)(p)) -> oh_bg_ptr = GC_HIDE_POINTER(q))

  /* Execute s once for each predecessor q of p in the points-to graph. */
  /* s should be a bracketed statement.  We declare q.                  */
  /* When the back pointer carries FLAG_MANY, the predecessors are read */
  /* from the back_edges structure and its continuations.  Otherwise    */
  /* the back pointer itself is the only predecessor; it is skipped if  */
  /* it is null or has its low bit set (the latter indicates a          */
  /* misinterpreted free-list link).                                    */
  #define FOR_EACH_PRED(q, p, s) \
    do { \
      ptr_t q = GET_OH_BG_PTR(p); \
      if (((word)q & FLAG_MANY) != 0) { \
        back_edges *chunk_ = (back_edges *)((word)q & ~FLAG_MANY); \
        word remaining_ = chunk_ -> n_edges; \
        int slot_ = 0; \
        for (; remaining_ > 0; --remaining_, ++slot_) { \
          if (slot_ == MAX_IN) { \
            chunk_ = chunk_ -> cont; \
            slot_ = 0; \
          } \
          q = chunk_ -> edges[slot_]; s \
        } \
      } else if (q != 0 && ((word)q & 1) == 0) s \
    } while (0)
  176. /* Ensure that p has a back_edges structure associated with it. */
  177. static void ensure_struct(ptr_t p)
  178. {
  179. ptr_t old_back_ptr = GET_OH_BG_PTR(p);
  180. if (!((word)old_back_ptr & FLAG_MANY)) {
  181. back_edges *be = new_back_edges();
  182. be -> flags = 0;
  183. if (0 == old_back_ptr) {
  184. be -> n_edges = 0;
  185. } else {
  186. be -> n_edges = 1;
  187. be -> edges[0] = old_back_ptr;
  188. }
  189. be -> height = HEIGHT_UNKNOWN;
  190. be -> height_gc_no = (unsigned short)(GC_gc_no - 1);
  191. GC_ASSERT((word)be >= (word)back_edge_space);
  192. SET_OH_BG_PTR(p, (word)be | FLAG_MANY);
  193. }
  194. }
  195. /* Add the (forward) edge from p to q to the backward graph. Both p */
  196. /* q are pointers to the object base, i.e. pointers to an oh. */
  197. static void add_edge(ptr_t p, ptr_t q)
  198. {
  199. ptr_t old_back_ptr = GET_OH_BG_PTR(q);
  200. back_edges * be, *be_cont;
  201. word i;
  202. static unsigned random_number = 13;
  203. # define GOT_LUCKY_NUMBER (((++random_number) & 0x7f) == 0)
  204. /* A not very random number we use to occasionally allocate a */
  205. /* back_edges structure even for a single backward edge. This */
  206. /* prevents us from repeatedly tracing back through very long */
  207. /* chains, since we will have some place to store height and */
  208. /* in_progress flags along the way. */
  209. GC_ASSERT(p == GC_base(p) && q == GC_base(q));
  210. if (!GC_HAS_DEBUG_INFO(q) || !GC_HAS_DEBUG_INFO(p)) {
  211. /* This is really a misinterpreted free list link, since we saw */
  212. /* a pointer to a free list. Don't overwrite it! */
  213. return;
  214. }
  215. if (0 == old_back_ptr) {
  216. SET_OH_BG_PTR(q, p);
  217. if (GOT_LUCKY_NUMBER) ensure_struct(q);
  218. return;
  219. }
  220. /* Check whether it was already in the list of predecessors. */
  221. FOR_EACH_PRED(pred, q, { if (p == pred) return; });
  222. ensure_struct(q);
  223. old_back_ptr = GET_OH_BG_PTR(q);
  224. be = (back_edges *)((word)old_back_ptr & ~FLAG_MANY);
  225. for (i = be -> n_edges, be_cont = be; i > MAX_IN; i -= MAX_IN)
  226. be_cont = be_cont -> cont;
  227. if (i == MAX_IN) {
  228. be_cont -> cont = new_back_edges();
  229. be_cont = be_cont -> cont;
  230. i = 0;
  231. }
  232. be_cont -> edges[i] = p;
  233. be -> n_edges++;
  234. # ifdef DEBUG_PRINT_BIG_N_EDGES
  235. if (GC_print_stats == VERBOSE && be -> n_edges == 100) {
  236. GC_err_printf("The following object has big in-degree:\n");
  237. GC_print_heap_obj(q);
  238. }
  239. # endif
  240. }
  241. typedef void (*per_object_func)(ptr_t p, size_t n_bytes, word gc_descr);
  242. static void per_object_helper(struct hblk *h, word fn)
  243. {
  244. hdr * hhdr = HDR(h);
  245. size_t sz = hhdr -> hb_sz;
  246. word descr = hhdr -> hb_descr;
  247. per_object_func f = (per_object_func)fn;
  248. int i = 0;
  249. do {
  250. f((ptr_t)(h -> hb_body + i), sz, descr);
  251. i += (int)sz;
  252. } while ((word)i + sz <= BYTES_TO_WORDS(HBLKSIZE));
  253. }
  254. GC_INLINE void GC_apply_to_each_object(per_object_func f)
  255. {
  256. GC_apply_to_all_blocks(per_object_helper, (word)f);
  257. }
  258. static void reset_back_edge(ptr_t p, size_t n_bytes GC_ATTR_UNUSED,
  259. word gc_descr GC_ATTR_UNUSED)
  260. {
  261. /* Skip any free list links, or dropped blocks */
  262. if (GC_HAS_DEBUG_INFO(p)) {
  263. ptr_t old_back_ptr = GET_OH_BG_PTR(p);
  264. if ((word)old_back_ptr & FLAG_MANY) {
  265. back_edges *be = (back_edges *)((word)old_back_ptr & ~FLAG_MANY);
  266. if (!(be -> flags & RETAIN)) {
  267. deallocate_back_edges(be);
  268. SET_OH_BG_PTR(p, 0);
  269. } else {
  270. GC_ASSERT(GC_is_marked(p));
  271. /* Back edges may point to objects that will not be retained. */
  272. /* Delete them for now, but remember the height. */
  273. /* Some will be added back at next GC. */
  274. be -> n_edges = 0;
  275. if (0 != be -> cont) {
  276. deallocate_back_edges(be -> cont);
  277. be -> cont = 0;
  278. }
  279. GC_ASSERT(GC_is_marked(p));
  280. /* We only retain things for one GC cycle at a time. */
  281. be -> flags &= ~RETAIN;
  282. }
  283. } else /* Simple back pointer */ {
  284. /* Clear to avoid dangling pointer. */
  285. SET_OH_BG_PTR(p, 0);
  286. }
  287. }
  288. }
  289. static void add_back_edges(ptr_t p, size_t n_bytes, word gc_descr)
  290. {
  291. word *currentp = (word *)(p + sizeof(oh));
  292. /* For now, fix up non-length descriptors conservatively. */
  293. if((gc_descr & GC_DS_TAGS) != GC_DS_LENGTH) {
  294. gc_descr = n_bytes;
  295. }
  296. while ((word)currentp < (word)(p + gc_descr)) {
  297. word current = *currentp++;
  298. FIXUP_POINTER(current);
  299. if (current >= (word)GC_least_plausible_heap_addr &&
  300. current <= (word)GC_greatest_plausible_heap_addr) {
  301. ptr_t target = GC_base((void *)current);
  302. if (0 != target) {
  303. add_edge(p, target);
  304. }
  305. }
  306. }
  307. }
  308. /* Rebuild the representation of the backward reachability graph. */
  309. /* Does not examine mark bits. Can be called before GC. */
  310. GC_INNER void GC_build_back_graph(void)
  311. {
  312. GC_apply_to_each_object(add_back_edges);
  313. }
  314. /* Return an approximation to the length of the longest simple path */
  315. /* through unreachable objects to p. We refer to this as the height */
  316. /* of p. */
  317. static word backwards_height(ptr_t p)
  318. {
  319. word result;
  320. ptr_t back_ptr = GET_OH_BG_PTR(p);
  321. back_edges *be;
  322. if (0 == back_ptr) return 1;
  323. if (!((word)back_ptr & FLAG_MANY)) {
  324. if (is_in_progress(p)) return 0; /* DFS back edge, i.e. we followed */
  325. /* an edge to an object already */
  326. /* on our stack: ignore */
  327. push_in_progress(p);
  328. result = backwards_height(back_ptr)+1;
  329. pop_in_progress(p);
  330. return result;
  331. }
  332. be = (back_edges *)((word)back_ptr & ~FLAG_MANY);
  333. if (be -> height >= 0 && be -> height_gc_no == (unsigned short)GC_gc_no)
  334. return be -> height;
  335. /* Ignore back edges in DFS */
  336. if (be -> height == HEIGHT_IN_PROGRESS) return 0;
  337. result = (be -> height > 0? be -> height : 1);
  338. be -> height = HEIGHT_IN_PROGRESS;
  339. FOR_EACH_PRED(q, p, {
  340. word this_height;
  341. if (GC_is_marked(q) && !(FLAG_MANY & (word)GET_OH_BG_PTR(p))) {
  342. GC_COND_LOG_PRINTF("Found bogus pointer from %p to %p\n", q, p);
  343. /* Reachable object "points to" unreachable one. */
  344. /* Could be caused by our lax treatment of GC descriptors. */
  345. this_height = 1;
  346. } else {
  347. this_height = backwards_height(q);
  348. }
  349. if (this_height >= result) result = this_height + 1;
  350. });
  351. be -> height = result;
  352. be -> height_gc_no = (unsigned short)GC_gc_no;
  353. return result;
  354. }
  355. STATIC word GC_max_height = 0;
  356. STATIC ptr_t GC_deepest_obj = NULL;
  357. /* Compute the maximum height of every unreachable predecessor p of a */
  358. /* reachable object. Arrange to save the heights of all such objects p */
  359. /* so that they can be used in calculating the height of objects in the */
  360. /* next GC. */
  361. /* Set GC_max_height to be the maximum height we encounter, and */
  362. /* GC_deepest_obj to be the corresponding object. */
  363. static void update_max_height(ptr_t p, size_t n_bytes GC_ATTR_UNUSED,
  364. word gc_descr GC_ATTR_UNUSED)
  365. {
  366. if (GC_is_marked(p) && GC_HAS_DEBUG_INFO(p)) {
  367. word p_height = 0;
  368. ptr_t p_deepest_obj = 0;
  369. ptr_t back_ptr;
  370. back_edges *be = 0;
  371. /* If we remembered a height last time, use it as a minimum. */
  372. /* It may have increased due to newly unreachable chains pointing */
  373. /* to p, but it can't have decreased. */
  374. back_ptr = GET_OH_BG_PTR(p);
  375. if (0 != back_ptr && ((word)back_ptr & FLAG_MANY)) {
  376. be = (back_edges *)((word)back_ptr & ~FLAG_MANY);
  377. if (be -> height != HEIGHT_UNKNOWN) p_height = be -> height;
  378. }
  379. FOR_EACH_PRED(q, p, {
  380. if (!GC_is_marked(q) && GC_HAS_DEBUG_INFO(q)) {
  381. word q_height;
  382. q_height = backwards_height(q);
  383. if (q_height > p_height) {
  384. p_height = q_height;
  385. p_deepest_obj = q;
  386. }
  387. }
  388. });
  389. if (p_height > 0) {
  390. /* Remember the height for next time. */
  391. if (be == 0) {
  392. ensure_struct(p);
  393. back_ptr = GET_OH_BG_PTR(p);
  394. be = (back_edges *)((word)back_ptr & ~FLAG_MANY);
  395. }
  396. be -> flags |= RETAIN;
  397. be -> height = p_height;
  398. be -> height_gc_no = (unsigned short)GC_gc_no;
  399. }
  400. if (p_height > GC_max_height) {
  401. GC_max_height = p_height;
  402. GC_deepest_obj = p_deepest_obj;
  403. }
  404. }
  405. }
  406. STATIC word GC_max_max_height = 0;
  407. GC_INNER void GC_traverse_back_graph(void)
  408. {
  409. GC_max_height = 0;
  410. GC_apply_to_each_object(update_max_height);
  411. if (0 != GC_deepest_obj)
  412. GC_set_mark_bit(GC_deepest_obj); /* Keep it until we can print it. */
  413. }
  414. void GC_print_back_graph_stats(void)
  415. {
  416. GC_printf("Maximum backwards height of reachable objects at GC %lu is %lu\n",
  417. (unsigned long) GC_gc_no, (unsigned long)GC_max_height);
  418. if (GC_max_height > GC_max_max_height) {
  419. GC_max_max_height = GC_max_height;
  420. GC_err_printf(
  421. "The following unreachable object is last in a longest chain "
  422. "of unreachable objects:\n");
  423. GC_print_heap_obj(GC_deepest_obj);
  424. }
  425. GC_COND_LOG_PRINTF("Needed max total of %d back-edge structs\n",
  426. GC_n_back_edge_structs);
  427. GC_apply_to_each_object(reset_back_edge);
  428. GC_deepest_obj = 0;
  429. }
  430. #endif /* MAKE_BACK_GRAPH */