ginblock.h 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346
  /*--------------------------------------------------------------------------
   * ginblock.h
   *    details of structures stored in GIN index blocks
   *
   *  Copyright (c) 2006-2022, PostgreSQL Global Development Group
   *
   *  src/include/access/ginblock.h
   *--------------------------------------------------------------------------
   */
  10. #ifndef GINBLOCK_H
  11. #define GINBLOCK_H
  12. #include "access/transam.h"
  13. #include "storage/block.h"
  14. #include "storage/bufpage.h"
  15. #include "storage/itemptr.h"
  16. #include "storage/off.h"
  17. /*
  18. * Page opaque data in an inverted index page.
  19. *
  20. * Note: GIN does not include a page ID word as do the other index types.
  21. * This is OK because the opaque data is only 8 bytes and so can be reliably
  22. * distinguished by size. Revisit this if the size ever increases.
  23. * Further note: as of 9.2, SP-GiST also uses 8-byte special space, as does
  24. * BRIN as of 9.5. This is still OK, as long as GIN isn't using all of the
  25. * high-order bits in its flags word, because that way the flags word cannot
  26. * match the page IDs used by SP-GiST and BRIN.
  27. */
  28. typedef struct GinPageOpaqueData
  29. {
  30. BlockNumber rightlink; /* next page if any */
  31. OffsetNumber maxoff; /* number of PostingItems on GIN_DATA &
  32. * ~GIN_LEAF page. On GIN_LIST page, number of
  33. * heap tuples. */
  34. uint16 flags; /* see bit definitions below */
  35. } GinPageOpaqueData;
  36. typedef GinPageOpaqueData *GinPageOpaque;
  /*
   * Bit values for GinPageOpaqueData.flags.  Each flag occupies one bit of
   * the low-order byte.
   */
  #define GIN_DATA              0x0001
  #define GIN_LEAF              0x0002
  #define GIN_DELETED           0x0004
  #define GIN_META              0x0008
  #define GIN_LIST              0x0010
  /* makes sense only on a GIN_LIST page */
  #define GIN_LIST_FULLROW      0x0020
  /* page was split, but parent not updated */
  #define GIN_INCOMPLETE_SPLIT  0x0040
  #define GIN_COMPRESSED        0x0080
  /*
   * Block numbers of the pages that sit at fixed locations in the index.
   */
  #define GIN_METAPAGE_BLKNO  0
  #define GIN_ROOT_BLKNO      1
  49. typedef struct GinMetaPageData
  50. {
  51. /*
  52. * Pointers to head and tail of pending list, which consists of GIN_LIST
  53. * pages. These store fast-inserted entries that haven't yet been moved
  54. * into the regular GIN structure.
  55. */
  56. BlockNumber head;
  57. BlockNumber tail;
  58. /*
  59. * Free space in bytes in the pending list's tail page.
  60. */
  61. uint32 tailFreeSize;
  62. /*
  63. * We store both number of pages and number of heap tuples that are in the
  64. * pending list.
  65. */
  66. BlockNumber nPendingPages;
  67. int64 nPendingHeapTuples;
  68. /*
  69. * Statistics for planner use (accurate as of last VACUUM)
  70. */
  71. BlockNumber nTotalPages;
  72. BlockNumber nEntryPages;
  73. BlockNumber nDataPages;
  74. int64 nEntries;
  75. /*
  76. * GIN version number (ideally this should have been at the front, but too
  77. * late now. Don't move it!)
  78. *
  79. * Currently 2 (for indexes initialized in 9.4 or later)
  80. *
  81. * Version 1 (indexes initialized in version 9.1, 9.2 or 9.3), is
  82. * compatible, but may contain uncompressed posting tree (leaf) pages and
  83. * posting lists. They will be converted to compressed format when
  84. * modified.
  85. *
  86. * Version 0 (indexes initialized in 9.0 or before) is compatible but may
  87. * be missing null entries, including both null keys and placeholders.
  88. * Reject full-index-scan attempts on such indexes.
  89. */
  90. int32 ginVersion;
  91. } GinMetaPageData;
  92. #define GIN_CURRENT_VERSION 2
  93. #define GinPageGetMeta(p) \
  94. ((GinMetaPageData *) PageGetContents(p))
  /*
   * Accessors for the opaque data of a GIN index page.
   *
   * GinPageGetOpaque() yields a pointer to the GinPageOpaqueData in the
   * page's special space.  The Is/Has macros test one flag bit and evaluate
   * to 0 or 1; the Set macros turn a flag bit on and the SetNon macros turn
   * it off, modifying the page in place.
   */
  #define GinPageGetOpaque(page) \
      ((GinPageOpaque) PageGetSpecialPointer(page))

  /* GIN_LEAF */
  #define GinPageIsLeaf(page) \
      ((GinPageGetOpaque(page)->flags & GIN_LEAF) != 0)
  #define GinPageSetLeaf(page) \
      (GinPageGetOpaque(page)->flags |= GIN_LEAF)
  #define GinPageSetNonLeaf(page) \
      (GinPageGetOpaque(page)->flags &= ~GIN_LEAF)

  /* GIN_DATA */
  #define GinPageIsData(page) \
      ((GinPageGetOpaque(page)->flags & GIN_DATA) != 0)
  #define GinPageSetData(page) \
      (GinPageGetOpaque(page)->flags |= GIN_DATA)

  /* GIN_LIST */
  #define GinPageIsList(page) \
      ((GinPageGetOpaque(page)->flags & GIN_LIST) != 0)
  #define GinPageSetList(page) \
      (GinPageGetOpaque(page)->flags |= GIN_LIST)

  /* GIN_LIST_FULLROW */
  #define GinPageHasFullRow(page) \
      ((GinPageGetOpaque(page)->flags & GIN_LIST_FULLROW) != 0)
  #define GinPageSetFullRow(page) \
      (GinPageGetOpaque(page)->flags |= GIN_LIST_FULLROW)

  /* GIN_COMPRESSED */
  #define GinPageIsCompressed(page) \
      ((GinPageGetOpaque(page)->flags & GIN_COMPRESSED) != 0)
  #define GinPageSetCompressed(page) \
      (GinPageGetOpaque(page)->flags |= GIN_COMPRESSED)

  /* GIN_DELETED */
  #define GinPageIsDeleted(page) \
      ((GinPageGetOpaque(page)->flags & GIN_DELETED) != 0)
  #define GinPageSetDeleted(page) \
      (GinPageGetOpaque(page)->flags |= GIN_DELETED)
  #define GinPageSetNonDeleted(page) \
      (GinPageGetOpaque(page)->flags &= ~GIN_DELETED)

  /* GIN_INCOMPLETE_SPLIT */
  #define GinPageIsIncompleteSplit(page) \
      ((GinPageGetOpaque(page)->flags & GIN_INCOMPLETE_SPLIT) != 0)

  /* True when the page's rightlink is InvalidBlockNumber. */
  #define GinPageRightMost(page) \
      (GinPageGetOpaque(page)->rightlink == InvalidBlockNumber)
  115. /*
  116. * We should reclaim deleted page only once every transaction started before
  117. * its deletion is over.
  118. */
  119. #define GinPageGetDeleteXid(page) ( ((PageHeader) (page))->pd_prune_xid )
  120. #define GinPageSetDeleteXid(page, xid) ( ((PageHeader) (page))->pd_prune_xid = xid)
  121. extern bool GinPageIsRecyclable(Page page);
  /*
   * GIN's own ItemPointerGet(BlockNumber|OffsetNumber).
   *
   * The getters go through the NoCheck variants to avoid Asserts, because
   * sometimes the ip_posid isn't "valid".  The setters simply forward to the
   * generic ItemPointerSet* routines.
   */
  #define GinItemPointerGetBlockNumber(pointer) \
      (ItemPointerGetBlockNumberNoCheck(pointer))

  #define GinItemPointerGetOffsetNumber(pointer) \
      (ItemPointerGetOffsetNumberNoCheck(pointer))

  #define GinItemPointerSetBlockNumber(pointer, blkno) \
      (ItemPointerSetBlockNumber((pointer), (blkno)))

  #define GinItemPointerSetOffsetNumber(pointer, offnum) \
      (ItemPointerSetOffsetNumber((pointer), (offnum)))
  /*
   * Special-case item pointer values needed by the GIN search logic:
   *
   *  MIN         block 0, offset 0; sorts less than any valid item pointer
   *  MAX         InvalidBlockNumber, offset 0xffff; sorts greater than any
   *              valid item pointer
   *  LOSSY PAGE  a real block number, offset 0xffff; indicates a whole heap
   *              page and sorts after normal item pointers for that page
   *
   * All of these are distinguishable from an "invalid" item pointer (which
   * is InvalidBlockNumber/0) as well as from all normal item pointers (which
   * have item numbers in the range 1..MaxHeapTuplesPerPage).
   */
  #define ItemPointerSetMin(p) \
      ItemPointerSet((p), (BlockNumber) 0, (OffsetNumber) 0)

  #define ItemPointerIsMin(p) \
      (GinItemPointerGetOffsetNumber(p) == (OffsetNumber) 0 && \
       GinItemPointerGetBlockNumber(p) == (BlockNumber) 0)

  #define ItemPointerSetMax(p) \
      ItemPointerSet((p), InvalidBlockNumber, (OffsetNumber) 0xffff)

  #define ItemPointerSetLossyPage(p, b) \
      ItemPointerSet((p), (b), (OffsetNumber) 0xffff)

  #define ItemPointerIsLossyPage(p) \
      (GinItemPointerGetOffsetNumber(p) == (OffsetNumber) 0xffff && \
       GinItemPointerGetBlockNumber(p) != InvalidBlockNumber)
  156. /*
  157. * Posting item in a non-leaf posting-tree page
  158. */
  159. typedef struct
  160. {
  161. /* We use BlockIdData not BlockNumber to avoid padding space wastage */
  162. BlockIdData child_blkno;
  163. ItemPointerData key;
  164. } PostingItem;
  165. #define PostingItemGetBlockNumber(pointer) \
  166. BlockIdGetBlockNumber(&(pointer)->child_blkno)
  167. #define PostingItemSetBlockNumber(pointer, blockNumber) \
  168. BlockIdSet(&((pointer)->child_blkno), (blockNumber))
  /*
   * Category codes to distinguish placeholder nulls from ordinary NULL keys.
   *
   * The values 0 and 1 were chosen to be compatible with the usual usage of
   * bool isNull flags.  Casting between bool and GinNullCategory is risky,
   * however, because of the possibility of different bit patterns and type
   * sizes, so it is no longer done.
   *
   * GIN_CAT_EMPTY_QUERY is never stored in the index; notice that it is
   * chosen to sort before, not after, regular key values.
   */
  typedef signed char GinNullCategory;

  /* normal, non-null key value */
  #define GIN_CAT_NORM_KEY     0
  /* null key value */
  #define GIN_CAT_NULL_KEY     1
  /* placeholder for zero-key item */
  #define GIN_CAT_EMPTY_ITEM   2
  /* placeholder for null item */
  #define GIN_CAT_NULL_ITEM    3
  /* placeholder for full-scan query */
  #define GIN_CAT_EMPTY_QUERY  (-1)
  /*
   * Access macros for the null category byte in entry tuples.
   *
   * GinCategoryOffset() is the byte offset of the category within the
   * tuple: the offset reported by IndexInfoFindDataOffset() for the tuple's
   * t_info, plus sizeof(int16) unless ginstate->oneCol is set.
   * GinGetNullCategory() and GinSetNullCategory() read and write the
   * GinNullCategory stored at that offset.
   */
  #define GinCategoryOffset(itup, ginstate) \
      (IndexInfoFindDataOffset((itup)->t_info) + \
       ((ginstate)->oneCol ? 0 : sizeof(int16)))

  #define GinGetNullCategory(itup, ginstate) \
      (*((GinNullCategory *) \
         ((char *) (itup) + GinCategoryOffset(itup, ginstate))))

  #define GinSetNullCategory(itup, ginstate, c) \
      (*((GinNullCategory *) \
         ((char *) (itup) + GinCategoryOffset(itup, ginstate))) = (c))
  /*
   * Access macros for leaf-page entry tuples (see discussion in README).
   *
   * Both halves of the tuple's t_tid are reused:
   *
   *  - the offset-number half holds the posting count (GinGetNPosting), or
   *    the marker GIN_TREE_POSTING when the tuple refers to a posting tree;
   *  - the block-number half holds either the posting tree's block number
   *    (GinGetPostingTree) or the byte offset of the posting data within
   *    the tuple (GinGetPostingOffset).  In the latter case
   *    GinSetPostingOffset also sets the top bit, GIN_ITUP_COMPRESSED,
   *    which GinItupIsCompressed tests and GinGetPostingOffset masks off.
   */
  #define GIN_TREE_POSTING    ((OffsetNumber) 0xffff)
  #define GIN_ITUP_COMPRESSED (1U << 31)

  /* posting count */
  #define GinGetNPosting(itup) \
      GinItemPointerGetOffsetNumber(&(itup)->t_tid)
  #define GinSetNPosting(itup, n) \
      ItemPointerSetOffsetNumber(&(itup)->t_tid, (n))

  /* posting tree reference */
  #define GinIsPostingTree(itup) \
      (GinGetNPosting(itup) == GIN_TREE_POSTING)
  #define GinSetPostingTree(itup, blkno) \
      (GinSetNPosting((itup), GIN_TREE_POSTING), \
       ItemPointerSetBlockNumber(&(itup)->t_tid, (blkno)))
  #define GinGetPostingTree(itup) \
      GinItemPointerGetBlockNumber(&(itup)->t_tid)

  /* posting data stored inside the tuple */
  #define GinGetPostingOffset(itup) \
      (GinItemPointerGetBlockNumber(&(itup)->t_tid) & (~GIN_ITUP_COMPRESSED))
  #define GinSetPostingOffset(itup, n) \
      ItemPointerSetBlockNumber(&(itup)->t_tid, (n) | GIN_ITUP_COMPRESSED)
  #define GinGetPosting(itup) \
      ((Pointer) ((char *) (itup) + GinGetPostingOffset(itup)))
  #define GinItupIsCompressed(itup) \
      ((GinItemPointerGetBlockNumber(&(itup)->t_tid) & GIN_ITUP_COMPRESSED) != 0)
  /*
   * Maximum size of an item on an entry tree page.
   *
   * The limit is the smaller of INDEX_SIZE_MASK and one third of the block
   * (after the page header, three line pointers and the opaque data have
   * been subtracted), rounded down to a MAXALIGN boundary.  This makes sure
   * at least three items fit on each page.
   *
   * On regular B-tree indexes three items must fit: two data items and the
   * "high key".  The GIN entry tree does not currently store the high key
   * explicitly; it just uses the rightmost item on the page, so it would
   * actually be enough to fit two items.
   */
  #define GinMaxItemSize \
      Min(INDEX_SIZE_MASK, \
          MAXALIGN_DOWN( \
              ((BLCKSZ - \
                MAXALIGN(SizeOfPageHeaderData + 3 * sizeof(ItemIdData)) - \
                MAXALIGN(sizeof(GinPageOpaqueData))) / 3)))
  /*
   * Access macros for non-leaf entry tuples.
   *
   * The downlink is kept in the block-number half of the tuple's t_tid;
   * setting it also resets the offset half to InvalidOffsetNumber.
   */
  #define GinGetDownlink(itup) \
      GinItemPointerGetBlockNumber(&(itup)->t_tid)

  #define GinSetDownlink(itup, blkno) \
      ItemPointerSet(&(itup)->t_tid, (blkno), InvalidOffsetNumber)
  /*
   * Data (posting tree) pages
   *
   * Posting tree pages don't store regular tuples.  Non-leaf pages contain
   * PostingItems, which are pairs of ItemPointers and child block numbers.
   * Leaf pages contain GinPostingLists and an uncompressed array of item
   * pointers.
   *
   * In a leaf page, the compressed posting lists are stored after the
   * regular page header, one after each other.  Although we don't store
   * regular tuples, pd_lower is used to indicate the end of the posting
   * lists.  After that, free space follows.  This layout is compatible with
   * the "standard" heap and index page layout described in bufpage.h, so
   * that we can e.g. set buffer_std when writing WAL records.
   *
   * In the special space is the GinPageOpaque struct.
   */

  /*
   * First posting list of a leaf page.  It starts one MAXALIGN'd
   * ItemPointerData past the beginning of the page contents.
   *
   * The whole expansion is parenthesized so that the result can be used
   * directly with postfix operators, as in
   * GinDataLeafPageGetPostingList(page)->nbytes.
   */
  #define GinDataLeafPageGetPostingList(page) \
      ((GinPostingList *) \
       (PageGetContents(page) + MAXALIGN(sizeof(ItemPointerData))))

  /*
   * Number of bytes of posting lists on a leaf page: pd_lower minus the
   * MAXALIGN'd page header and the MAXALIGN'd ItemPointerData that precede
   * the first posting list.
   */
  #define GinDataLeafPageGetPostingListSize(page) \
      (((PageHeader) (page))->pd_lower - \
       MAXALIGN(SizeOfPageHeaderData) - \
       MAXALIGN(sizeof(ItemPointerData)))

  /*
   * Is the leaf page empty?  A compressed page is empty when its posting
   * lists occupy zero bytes; otherwise the page is empty when maxoff is
   * below FirstOffsetNumber.
   */
  #define GinDataLeafPageIsEmpty(page) \
      (GinPageIsCompressed(page) ? \
       (GinDataLeafPageGetPostingListSize(page) == 0) : \
       (GinPageGetOpaque(page)->maxoff < FirstOffsetNumber))

  /* Free space on a leaf page, as reported by PageGetExactFreeSpace(). */
  #define GinDataLeafPageGetFreeSpace(page) PageGetExactFreeSpace(page)

  /* The ItemPointer stored at the very start of the page contents. */
  #define GinDataPageGetRightBound(page) ((ItemPointer) PageGetContents(page))
  /*
   * Pointer to the data portion of a posting tree page, i.e. the page
   * contents past one MAXALIGN'd ItemPointerData.  What lives there depends
   * on the kind of page:
   *
   *  - internal pages: the beginning of the array of PostingItems;
   *  - compressed leaf pages: the first compressed posting list;
   *  - uncompressed (pre-9.4) leaf pages: the beginning of the ItemPointer
   *    array.
   */
  #define GinDataPageGetData(page) \
      (PageGetContents(page) + MAXALIGN(sizeof(ItemPointerData)))

  /*
   * Non-leaf pages contain PostingItems.  "i" is 1-based: i == 1 addresses
   * the first PostingItem of the array.
   */
  #define GinDataPageGetPostingItem(page, i) \
      ((PostingItem *) \
       (GinDataPageGetData(page) + ((i) - 1) * sizeof(PostingItem)))
  /*
   * Note: there is no GinDataPageGetDataSize macro, because before version
   * 9.4, we didn't set pd_lower on data pages.  There can be pages in the
   * index that were binary-upgraded from earlier versions and still have an
   * invalid pd_lower, so we cannot trust it in general.  Compressed posting
   * tree leaf pages are new in 9.4, however, so we can trust them; see
   * GinDataLeafPageGetPostingListSize.
   */

  /*
   * GinDataPageSetDataSize -- record that the data portion of "page" holds
   * "size" bytes, by pointing pd_lower just past it.
   *
   * "size" must not exceed GinDataPageMaxDataSize; this is checked with
   * Assert().  Both arguments may be evaluated more than once, so they must
   * be free of side effects.
   *
   * The body is wrapped in do { ... } while (0) so that the macro behaves
   * as a single statement, including as the unbraced body of an if that is
   * followed by an else.  Invoke it with a trailing semicolon.
   */
  #define GinDataPageSetDataSize(page, size) \
      do { \
          Assert((size) <= GinDataPageMaxDataSize); \
          ((PageHeader) (page))->pd_lower = (size) + \
              MAXALIGN(SizeOfPageHeaderData) + \
              MAXALIGN(sizeof(ItemPointerData)); \
      } while (0)
  /*
   * Largest possible data portion of a posting tree page: the block size
   * less the MAXALIGN'd page header, the MAXALIGN'd ItemPointerData at the
   * start of the contents, and the MAXALIGN'd opaque data.
   */
  #define GinDataPageMaxDataSize \
      (BLCKSZ - \
       MAXALIGN(SizeOfPageHeaderData) - \
       MAXALIGN(sizeof(ItemPointerData)) - \
       MAXALIGN(sizeof(GinPageOpaqueData)))

  /*
   * Free space on a non-leaf data page: the maximum data size less the
   * space taken by the page's maxoff PostingItems.
   */
  #define GinNonLeafDataPageGetFreeSpace(page) \
      (GinDataPageMaxDataSize - \
       GinPageGetOpaque(page)->maxoff * sizeof(PostingItem))
  /*
   * List pages
   *
   * GinListPageSize is the block size less the page header and the
   * MAXALIGN'd opaque data.
   */
  #define GinListPageSize \
      (BLCKSZ - SizeOfPageHeaderData - MAXALIGN(sizeof(GinPageOpaqueData)))
  288. /*
  289. * A compressed posting list.
  290. *
  291. * Note: This requires 2-byte alignment.
  292. */
  293. typedef struct
  294. {
  295. ItemPointerData first; /* first item in this posting list (unpacked) */
  296. uint16 nbytes; /* number of bytes that follow */
  297. unsigned char bytes[FLEXIBLE_ARRAY_MEMBER]; /* varbyte encoded items */
  298. } GinPostingList;
  299. #define SizeOfGinPostingList(plist) (offsetof(GinPostingList, bytes) + SHORTALIGN((plist)->nbytes) )
  300. #define GinNextPostingListSegment(cur) ((GinPostingList *) (((char *) (cur)) + SizeOfGinPostingList((cur))))
  301. #endif /* GINBLOCK_H */