snappy-internal.h 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222
  1. // Copyright 2008 Google Inc. All Rights Reserved.
  2. //
  3. // Redistribution and use in source and binary forms, with or without
  4. // modification, are permitted provided that the following conditions are
  5. // met:
  6. //
  7. // * Redistributions of source code must retain the above copyright
  8. // notice, this list of conditions and the following disclaimer.
  9. // * Redistributions in binary form must reproduce the above
  10. // copyright notice, this list of conditions and the following disclaimer
  11. // in the documentation and/or other materials provided with the
  12. // distribution.
  13. // * Neither the name of Google Inc. nor the names of its
  14. // contributors may be used to endorse or promote products derived from
  15. // this software without specific prior written permission.
  16. //
  17. // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  18. // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  19. // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  20. // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  21. // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  22. // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  23. // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  24. // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  25. // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  26. // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  27. // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  28. //
  29. // Internals shared between the Snappy implementation and its unittest.
  30. #ifndef THIRD_PARTY_SNAPPY_SNAPPY_INTERNAL_H_
  31. #define THIRD_PARTY_SNAPPY_SNAPPY_INTERNAL_H_
  32. #include "snappy-stubs-internal.h"
  33. namespace snappy {
  34. namespace internal {
  35. class WorkingMemory {
  36. public:
  37. WorkingMemory() : large_table_(NULL) { }
  38. ~WorkingMemory() { delete[] large_table_; }
  39. // Allocates and clears a hash table using memory in "*this",
  40. // stores the number of buckets in "*table_size" and returns a pointer to
  41. // the base of the hash table.
  42. uint16* GetHashTable(size_t input_size, int* table_size);
  43. private:
  44. uint16 small_table_[1<<10]; // 2KB
  45. uint16* large_table_; // Allocated only when needed
  46. DISALLOW_COPY_AND_ASSIGN(WorkingMemory);
  47. };
  48. // Flat array compression that does not emit the "uncompressed length"
  49. // prefix. Compresses "input" string to the "*op" buffer.
  50. //
  51. // REQUIRES: "input_length <= kBlockSize"
  52. // REQUIRES: "op" points to an array of memory that is at least
  53. // "MaxCompressedLength(input_length)" in size.
  54. // REQUIRES: All elements in "table[0..table_size-1]" are initialized to zero.
  55. // REQUIRES: "table_size" is a power of two
  56. //
  57. // Returns an "end" pointer into "op" buffer.
  58. // "end - op" is the compressed size of "input".
  59. char* CompressFragment(const char* input,
  60. size_t input_length,
  61. char* op,
  62. uint16* table,
  63. const int table_size);
  64. // Find the largest n such that
  65. //
  66. // s1[0,n-1] == s2[0,n-1]
  67. // and n <= (s2_limit - s2).
  68. //
  69. // Return make_pair(n, n < 8).
  70. // Does not read *s2_limit or beyond.
  71. // Does not read *(s1 + (s2_limit - s2)) or beyond.
  72. // Requires that s2_limit >= s2.
  73. //
  74. // Separate implementation for x86_64, for speed. Uses the fact that
  75. // x86_64 is little endian.
  76. #if defined(ARCH_K8)
  77. static inline std::pair<size_t, bool> FindMatchLength(const char* s1,
  78. const char* s2,
  79. const char* s2_limit) {
  80. assert(s2_limit >= s2);
  81. size_t matched = 0;
  82. // This block isn't necessary for correctness; we could just start looping
  83. // immediately. As an optimization though, it is useful. It creates some not
  84. // uncommon code paths that determine, without extra effort, whether the match
  85. // length is less than 8. In short, we are hoping to avoid a conditional
  86. // branch, and perhaps get better code layout from the C++ compiler.
  87. if (PREDICT_TRUE(s2 <= s2_limit - 8)) {
  88. uint64 a1 = UNALIGNED_LOAD64(s1);
  89. uint64 a2 = UNALIGNED_LOAD64(s2);
  90. if (a1 != a2) {
  91. return std::pair<size_t, bool>(Bits::FindLSBSetNonZero64(a1 ^ a2) >> 3,
  92. true);
  93. } else {
  94. matched = 8;
  95. s2 += 8;
  96. }
  97. }
  98. // Find out how long the match is. We loop over the data 64 bits at a
  99. // time until we find a 64-bit block that doesn't match; then we find
  100. // the first non-matching bit and use that to calculate the total
  101. // length of the match.
  102. while (PREDICT_TRUE(s2 <= s2_limit - 8)) {
  103. if (UNALIGNED_LOAD64(s2) == UNALIGNED_LOAD64(s1 + matched)) {
  104. s2 += 8;
  105. matched += 8;
  106. } else {
  107. uint64 x = UNALIGNED_LOAD64(s2) ^ UNALIGNED_LOAD64(s1 + matched);
  108. int matching_bits = Bits::FindLSBSetNonZero64(x);
  109. matched += matching_bits >> 3;
  110. assert(matched >= 8);
  111. return std::pair<size_t, bool>(matched, false);
  112. }
  113. }
  114. while (PREDICT_TRUE(s2 < s2_limit)) {
  115. if (s1[matched] == *s2) {
  116. ++s2;
  117. ++matched;
  118. } else {
  119. return std::pair<size_t, bool>(matched, matched < 8);
  120. }
  121. }
  122. return std::pair<size_t, bool>(matched, matched < 8);
  123. }
  124. #else
  125. static inline std::pair<size_t, bool> FindMatchLength(const char* s1,
  126. const char* s2,
  127. const char* s2_limit) {
  128. // Implementation based on the x86-64 version, above.
  129. assert(s2_limit >= s2);
  130. int matched = 0;
  131. while (s2 <= s2_limit - 4 &&
  132. UNALIGNED_LOAD32(s2) == UNALIGNED_LOAD32(s1 + matched)) {
  133. s2 += 4;
  134. matched += 4;
  135. }
  136. if (LittleEndian::IsLittleEndian() && s2 <= s2_limit - 4) {
  137. uint32 x = UNALIGNED_LOAD32(s2) ^ UNALIGNED_LOAD32(s1 + matched);
  138. int matching_bits = Bits::FindLSBSetNonZero(x);
  139. matched += matching_bits >> 3;
  140. } else {
  141. while ((s2 < s2_limit) && (s1[matched] == *s2)) {
  142. ++s2;
  143. ++matched;
  144. }
  145. }
  146. return std::pair<size_t, bool>(matched, matched < 8);
  147. }
  148. #endif
  149. // Lookup tables for decompression code. Give --snappy_dump_decompression_table
  150. // to the unit test to recompute char_table.
  151. enum {
  152. LITERAL = 0,
  153. COPY_1_BYTE_OFFSET = 1, // 3 bit length + 3 bits of offset in opcode
  154. COPY_2_BYTE_OFFSET = 2,
  155. COPY_4_BYTE_OFFSET = 3
  156. };
  157. static const int kMaximumTagLength = 5; // COPY_4_BYTE_OFFSET plus the actual offset.
  158. // Data stored per entry in lookup table:
  159. // Range Bits-used Description
  160. // ------------------------------------
  161. // 1..64 0..7 Literal/copy length encoded in opcode byte
  162. // 0..7 8..10 Copy offset encoded in opcode byte / 256
  163. // 0..4 11..13 Extra bytes after opcode
  164. //
  165. // We use eight bits for the length even though 7 would have sufficed
  166. // because of efficiency reasons:
  167. // (1) Extracting a byte is faster than a bit-field
  168. // (2) It properly aligns copy offset so we do not need a <<8
  169. static const uint16 char_table[256] = {
  170. 0x0001, 0x0804, 0x1001, 0x2001, 0x0002, 0x0805, 0x1002, 0x2002,
  171. 0x0003, 0x0806, 0x1003, 0x2003, 0x0004, 0x0807, 0x1004, 0x2004,
  172. 0x0005, 0x0808, 0x1005, 0x2005, 0x0006, 0x0809, 0x1006, 0x2006,
  173. 0x0007, 0x080a, 0x1007, 0x2007, 0x0008, 0x080b, 0x1008, 0x2008,
  174. 0x0009, 0x0904, 0x1009, 0x2009, 0x000a, 0x0905, 0x100a, 0x200a,
  175. 0x000b, 0x0906, 0x100b, 0x200b, 0x000c, 0x0907, 0x100c, 0x200c,
  176. 0x000d, 0x0908, 0x100d, 0x200d, 0x000e, 0x0909, 0x100e, 0x200e,
  177. 0x000f, 0x090a, 0x100f, 0x200f, 0x0010, 0x090b, 0x1010, 0x2010,
  178. 0x0011, 0x0a04, 0x1011, 0x2011, 0x0012, 0x0a05, 0x1012, 0x2012,
  179. 0x0013, 0x0a06, 0x1013, 0x2013, 0x0014, 0x0a07, 0x1014, 0x2014,
  180. 0x0015, 0x0a08, 0x1015, 0x2015, 0x0016, 0x0a09, 0x1016, 0x2016,
  181. 0x0017, 0x0a0a, 0x1017, 0x2017, 0x0018, 0x0a0b, 0x1018, 0x2018,
  182. 0x0019, 0x0b04, 0x1019, 0x2019, 0x001a, 0x0b05, 0x101a, 0x201a,
  183. 0x001b, 0x0b06, 0x101b, 0x201b, 0x001c, 0x0b07, 0x101c, 0x201c,
  184. 0x001d, 0x0b08, 0x101d, 0x201d, 0x001e, 0x0b09, 0x101e, 0x201e,
  185. 0x001f, 0x0b0a, 0x101f, 0x201f, 0x0020, 0x0b0b, 0x1020, 0x2020,
  186. 0x0021, 0x0c04, 0x1021, 0x2021, 0x0022, 0x0c05, 0x1022, 0x2022,
  187. 0x0023, 0x0c06, 0x1023, 0x2023, 0x0024, 0x0c07, 0x1024, 0x2024,
  188. 0x0025, 0x0c08, 0x1025, 0x2025, 0x0026, 0x0c09, 0x1026, 0x2026,
  189. 0x0027, 0x0c0a, 0x1027, 0x2027, 0x0028, 0x0c0b, 0x1028, 0x2028,
  190. 0x0029, 0x0d04, 0x1029, 0x2029, 0x002a, 0x0d05, 0x102a, 0x202a,
  191. 0x002b, 0x0d06, 0x102b, 0x202b, 0x002c, 0x0d07, 0x102c, 0x202c,
  192. 0x002d, 0x0d08, 0x102d, 0x202d, 0x002e, 0x0d09, 0x102e, 0x202e,
  193. 0x002f, 0x0d0a, 0x102f, 0x202f, 0x0030, 0x0d0b, 0x1030, 0x2030,
  194. 0x0031, 0x0e04, 0x1031, 0x2031, 0x0032, 0x0e05, 0x1032, 0x2032,
  195. 0x0033, 0x0e06, 0x1033, 0x2033, 0x0034, 0x0e07, 0x1034, 0x2034,
  196. 0x0035, 0x0e08, 0x1035, 0x2035, 0x0036, 0x0e09, 0x1036, 0x2036,
  197. 0x0037, 0x0e0a, 0x1037, 0x2037, 0x0038, 0x0e0b, 0x1038, 0x2038,
  198. 0x0039, 0x0f04, 0x1039, 0x2039, 0x003a, 0x0f05, 0x103a, 0x203a,
  199. 0x003b, 0x0f06, 0x103b, 0x203b, 0x003c, 0x0f07, 0x103c, 0x203c,
  200. 0x0801, 0x0f08, 0x103d, 0x203d, 0x1001, 0x0f09, 0x103e, 0x203e,
  201. 0x1801, 0x0f0a, 0x103f, 0x203f, 0x2001, 0x0f0b, 0x1040, 0x2040
  202. };
  203. } // end namespace internal
  204. } // end namespace snappy
  205. #endif // THIRD_PARTY_SNAPPY_SNAPPY_INTERNAL_H_