snappy-internal.h source code [DuckDB/third_party/miniparquet/snappy/snappy-internal.h]

1	// Copyright 2008 Google Inc. All Rights Reserved.
2	//
3	// Redistribution and use in source and binary forms, with or without
4	// modification, are permitted provided that the following conditions are
5	// met:
6	//
7	// Redistributions of source code must retain the above copyright*
8	// notice, this list of conditions and the following disclaimer.
9	// Redistributions in binary form must reproduce the above*
10	// copyright notice, this list of conditions and the following disclaimer
11	// in the documentation and/or other materials provided with the
12	// distribution.
13	// Neither the name of Google Inc. nor the names of its*
14	// contributors may be used to endorse or promote products derived from
15	// this software without specific prior written permission.
16	//
17	// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18	// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19	// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20	// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21	// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22	// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23	// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24	// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25	// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26	// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27	// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28	//
29	// Internals shared between the Snappy implementation and its unittest.
30
31	#ifndef THIRD_PARTY_SNAPPY_SNAPPY_INTERNAL_H_
32	#define THIRD_PARTY_SNAPPY_SNAPPY_INTERNAL_H_
33
34	#include "snappy-stubs-internal.h"
35
36	namespace snappy {
37	namespace internal {
38
39	// Working memory performs a single allocation to hold all scratch space
40	// required for compression.
41	class WorkingMemory {
42	public:
43	explicit WorkingMemory(size_t input_size);
44	~WorkingMemory();
45
46	// Allocates and clears a hash table using memory in "this",*
47	// stores the number of buckets in "table_size" and returns a pointer to*
48	// the base of the hash table.
49	uint16* GetHashTable(size_t fragment_size, int* table_size) const;
50	char* GetScratchInput() const { return input_; }
51	char* GetScratchOutput() const { return output_; }
52
53	private:
54	char* mem_; // the allocated memory, never nullptr
55	size_t size_; // the size of the allocated memory, never 0
56	uint16* table_; // the pointer to the hashtable
57	char* input_; // the pointer to the input scratch buffer
58	char* output_; // the pointer to the output scratch buffer
59
60	// No copying
61	WorkingMemory(const WorkingMemory&);
62	void operator=(const WorkingMemory&);
63	};
64
65	// Flat array compression that does not emit the "uncompressed length"
66	// prefix. Compresses "input" string to the "op" buffer.*
67	//
68	// REQUIRES: "input_length <= kBlockSize"
69	// REQUIRES: "op" points to an array of memory that is at least
70	// "MaxCompressedLength(input_length)" in size.
71	// REQUIRES: All elements in "table[0..table_size-1]" are initialized to zero.
72	// REQUIRES: "table_size" is a power of two
73	//
74	// Returns an "end" pointer into "op" buffer.
75	// "end - op" is the compressed size of "input".
76	char* CompressFragment(const char* input,
77	size_t input_length,
78	char* op,
79	uint16* table,
80	const int table_size);
81
82	// Find the largest n such that
83	//
84	// s1[0,n-1] == s2[0,n-1]
85	// and n <= (s2_limit - s2).
86	//
87	// Return make_pair(n, n < 8).
88	// Does not read s2_limit or beyond.*
89	// Does not read (s1 + (s2_limit - s2)) or beyond.*
90	// Requires that s2_limit >= s2.
91	//
92	// Separate implementation for 64-bit, little-endian cpus.
93	#if !defined(SNAPPY_IS_BIG_ENDIAN) && \
94	(defined(ARCH_K8) \|\| defined(ARCH_PPC) \|\| defined(ARCH_ARM))
95	static inline std::pair<size_t, bool> FindMatchLength(const char* s1,
96	const char* s2,
97	const char* s2_limit) {
98	assert(s2_limit >= s2);
99	size_t matched = `0`;
100
101	// This block isn't necessary for correctness; we could just start looping
102	// immediately. As an optimization though, it is useful. It creates some not
103	// uncommon code paths that determine, without extra effort, whether the match
104	// length is less than 8. In short, we are hoping to avoid a conditional
105	// branch, and perhaps get better code layout from the C++ compiler.
106	if (SNAPPY_PREDICT_TRUE(s2 <= s2_limit - `8`)) {
107	uint64 a1 = UNALIGNED_LOAD64(s1);
108	uint64 a2 = UNALIGNED_LOAD64(s2);
109	if (a1 != a2) {
110	return std::pair<size_t, bool>(Bits::FindLSBSetNonZero64(a1 ^ a2) >> `3`,
111	true);
112	} else {
113	matched = `8`;
114	s2 += `8`;
115	}
116	}
117
118	// Find out how long the match is. We loop over the data 64 bits at a
119	// time until we find a 64-bit block that doesn't match; then we find
120	// the first non-matching bit and use that to calculate the total
121	// length of the match.
122	while (SNAPPY_PREDICT_TRUE(s2 <= s2_limit - `8`)) {
123	if (UNALIGNED_LOAD64(s2) == UNALIGNED_LOAD64(s1 + matched)) {
124	s2 += `8`;
125	matched += `8`;
126	} else {
127	uint64 x = UNALIGNED_LOAD64(s2) ^ UNALIGNED_LOAD64(s1 + matched);
128	int matching_bits = Bits::FindLSBSetNonZero64(x);
129	matched += matching_bits >> `3`;
130	assert(matched >= `8`);
131	return std::pair<size_t, bool>(matched, false);
132	}
133	}
134	while (SNAPPY_PREDICT_TRUE(s2 < s2_limit)) {
135	if (s1[matched] == *s2) {
136	++s2;
137	++matched;
138	} else {
139	return std::pair<size_t, bool>(matched, matched < `8`);
140	}
141	}
142	return std::pair<size_t, bool>(matched, matched < `8`);
143	}
144	#else
145	static inline std::pair<size_t, bool> FindMatchLength(const char* s1,
146	const char* s2,
147	const char* s2_limit) {
148	// Implementation based on the x86-64 version, above.
149	assert(s2_limit >= s2);
150	int matched = `0`;
151
152	while (s2 <= s2_limit - `4` &&
153	UNALIGNED_LOAD32(s2) == UNALIGNED_LOAD32(s1 + matched)) {
154	s2 += `4`;
155	matched += `4`;
156	}
157	if (LittleEndian::IsLittleEndian() && s2 <= s2_limit - `4`) {
158	uint32 x = UNALIGNED_LOAD32(s2) ^ UNALIGNED_LOAD32(s1 + matched);
159	int matching_bits = Bits::FindLSBSetNonZero(x);
160	matched += matching_bits >> `3`;
161	} else {
162	while ((s2 < s2_limit) && (s1[matched] == *s2)) {
163	++s2;
164	++matched;
165	}
166	}
167	return std::pair<size_t, bool>(matched, matched < `8`);
168	}
169	#endif
170
171	// Lookup tables for decompression code. Give --snappy_dump_decompression_table
172	// to the unit test to recompute char_table.
173
174	enum {
175	LITERAL = `0`,
176	COPY_1_BYTE_OFFSET = `1`, // 3 bit length + 3 bits of offset in opcode
177	COPY_2_BYTE_OFFSET = `2`,
178	COPY_4_BYTE_OFFSET = `3`
179	};
180	static const int kMaximumTagLength = `5`; // COPY_4_BYTE_OFFSET plus the actual offset.
181
182	// Data stored per entry in lookup table:
183	// Range Bits-used Description
184	// ------------------------------------
185	// 1..64 0..7 Literal/copy length encoded in opcode byte
186	// 0..7 8..10 Copy offset encoded in opcode byte / 256
187	// 0..4 11..13 Extra bytes after opcode
188	//
189	// We use eight bits for the length even though 7 would have sufficed
190	// because of efficiency reasons:
191	// (1) Extracting a byte is faster than a bit-field
192	// (2) It properly aligns copy offset so we do not need a <<8
193	static const uint16 char_table[`256`] = {
194	`0x0001`, `0x0804`, `0x1001`, `0x2001`, `0x0002`, `0x0805`, `0x1002`, `0x2002`,
195	`0x0003`, `0x0806`, `0x1003`, `0x2003`, `0x0004`, `0x0807`, `0x1004`, `0x2004`,
196	`0x0005`, `0x0808`, `0x1005`, `0x2005`, `0x0006`, `0x0809`, `0x1006`, `0x2006`,
197	`0x0007`, `0x080a`, `0x1007`, `0x2007`, `0x0008`, `0x080b`, `0x1008`, `0x2008`,
198	`0x0009`, `0x0904`, `0x1009`, `0x2009`, `0x000a`, `0x0905`, `0x100a`, `0x200a`,
199	`0x000b`, `0x0906`, `0x100b`, `0x200b`, `0x000c`, `0x0907`, `0x100c`, `0x200c`,
200	`0x000d`, `0x0908`, `0x100d`, `0x200d`, `0x000e`, `0x0909`, `0x100e`, `0x200e`,
201	`0x000f`, `0x090a`, `0x100f`, `0x200f`, `0x0010`, `0x090b`, `0x1010`, `0x2010`,
202	`0x0011`, `0x0a04`, `0x1011`, `0x2011`, `0x0012`, `0x0a05`, `0x1012`, `0x2012`,
203	`0x0013`, `0x0a06`, `0x1013`, `0x2013`, `0x0014`, `0x0a07`, `0x1014`, `0x2014`,
204	`0x0015`, `0x0a08`, `0x1015`, `0x2015`, `0x0016`, `0x0a09`, `0x1016`, `0x2016`,
205	`0x0017`, `0x0a0a`, `0x1017`, `0x2017`, `0x0018`, `0x0a0b`, `0x1018`, `0x2018`,
206	`0x0019`, `0x0b04`, `0x1019`, `0x2019`, `0x001a`, `0x0b05`, `0x101a`, `0x201a`,
207	`0x001b`, `0x0b06`, `0x101b`, `0x201b`, `0x001c`, `0x0b07`, `0x101c`, `0x201c`,
208	`0x001d`, `0x0b08`, `0x101d`, `0x201d`, `0x001e`, `0x0b09`, `0x101e`, `0x201e`,
209	`0x001f`, `0x0b0a`, `0x101f`, `0x201f`, `0x0020`, `0x0b0b`, `0x1020`, `0x2020`,
210	`0x0021`, `0x0c04`, `0x1021`, `0x2021`, `0x0022`, `0x0c05`, `0x1022`, `0x2022`,
211	`0x0023`, `0x0c06`, `0x1023`, `0x2023`, `0x0024`, `0x0c07`, `0x1024`, `0x2024`,
212	`0x0025`, `0x0c08`, `0x1025`, `0x2025`, `0x0026`, `0x0c09`, `0x1026`, `0x2026`,
213	`0x0027`, `0x0c0a`, `0x1027`, `0x2027`, `0x0028`, `0x0c0b`, `0x1028`, `0x2028`,
214	`0x0029`, `0x0d04`, `0x1029`, `0x2029`, `0x002a`, `0x0d05`, `0x102a`, `0x202a`,
215	`0x002b`, `0x0d06`, `0x102b`, `0x202b`, `0x002c`, `0x0d07`, `0x102c`, `0x202c`,
216	`0x002d`, `0x0d08`, `0x102d`, `0x202d`, `0x002e`, `0x0d09`, `0x102e`, `0x202e`,
217	`0x002f`, `0x0d0a`, `0x102f`, `0x202f`, `0x0030`, `0x0d0b`, `0x1030`, `0x2030`,
218	`0x0031`, `0x0e04`, `0x1031`, `0x2031`, `0x0032`, `0x0e05`, `0x1032`, `0x2032`,
219	`0x0033`, `0x0e06`, `0x1033`, `0x2033`, `0x0034`, `0x0e07`, `0x1034`, `0x2034`,
220	`0x0035`, `0x0e08`, `0x1035`, `0x2035`, `0x0036`, `0x0e09`, `0x1036`, `0x2036`,
221	`0x0037`, `0x0e0a`, `0x1037`, `0x2037`, `0x0038`, `0x0e0b`, `0x1038`, `0x2038`,
222	`0x0039`, `0x0f04`, `0x1039`, `0x2039`, `0x003a`, `0x0f05`, `0x103a`, `0x203a`,
223	`0x003b`, `0x0f06`, `0x103b`, `0x203b`, `0x003c`, `0x0f07`, `0x103c`, `0x203c`,
224	`0x0801`, `0x0f08`, `0x103d`, `0x203d`, `0x1001`, `0x0f09`, `0x103e`, `0x203e`,
225	`0x1801`, `0x0f0a`, `0x103f`, `0x203f`, `0x2001`, `0x0f0b`, `0x1040`, `0x2040`
226	};
227
228	} // end namespace internal
229
230
231	// The size of a compression block. Note that many parts of the compression
232	// code assumes that kBlockSize <= 65536; in particular, the hash table
233	// can only store 16-bit offsets, and EmitCopy() also assumes the offset
234	// is 65535 bytes or less. Note also that if you change this, it will
235	// affect the framing format (see framing_format.txt).
236	//
237	// Note that there might be older data around that is compressed with larger
238	// block sizes, so the decompression code should not rely on the
239	// non-existence of long backreferences.
240	static const int kBlockLog = `16`;
241	static const size_t kBlockSize = `1` << kBlockLog;
242
243	static const int kMaxHashTableBits = `14`;
244	static const size_t kMaxHashTableSize = `1` << kMaxHashTableBits;
245
246
247	} // end namespace snappy
248
249	#endif // THIRD_PARTY_SNAPPY_SNAPPY_INTERNAL_H_
250

Browse the source code of DuckDB/third_party/miniparquet/snappy/snappy-internal.h