imageDecompressor.cpp source code [OpenJDK/src/java.base/share/native/libjimage/imageDecompressor.cpp]

1	/*
2	* Copyright (c) 2015, 2018, Oracle and/or its affiliates. All rights reserved.
3	*
4	* Redistribution and use in source and binary forms, with or without
5	* modification, are permitted provided that the following conditions
6	* are met:
7	*
8	* - Redistributions of source code must retain the above copyright
9	* notice, this list of conditions and the following disclaimer.
10	*
11	* - Redistributions in binary form must reproduce the above copyright
12	* notice, this list of conditions and the following disclaimer in the
13	* documentation and/or other materials provided with the distribution.
14	*
15	* - Neither the name of Oracle nor the names of its
16	* contributors may be used to endorse or promote products derived
17	* from this software without specific prior written permission.
18	*
19	* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
20	* IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
21	* THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22	* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
23	* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
24	* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
25	* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
26	* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
27	* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
28	* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
29	* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30	*/
31
32	#include "jni.h"
33	#include "imageDecompressor.hpp"
34	#include "endian.hpp"
35	#ifdef WIN32
36	#include <windows.h>
37	#else
38	#include <dlfcn.h>
39	#endif
40
41	typedef jboolean (ZipInflateFully_t)(void* *inBuf, jlong inLen,
42	void outBuf, jlong outLen, char* **pmsg);
43	static ZipInflateFully_t ZipInflateFully = NULL;
44
45	#ifndef WIN32
46	#define JNI_LIB_PREFIX "lib"
47	#ifdef __APPLE__
48	#define JNI_LIB_SUFFIX ".dylib"
49	#else
50	#define JNI_LIB_SUFFIX ".so"
51	#endif
52	#endif
53
54	/**
55	* Return the address of the entry point named in the zip shared library.
56	* @param name - the name of the entry point
57	* @return the address of the entry point or NULL
58	*/
59	static void* findEntry(const char* name) {
60	void *addr = NULL;
61	#ifdef WIN32
62	HMODULE handle = GetModuleHandle("zip.dll");
63	if (handle == NULL) {
64	return NULL;
65	}
66	addr = (void*) GetProcAddress(handle, name);
67	return addr;
68	#else
69	addr = dlopen(JNI_LIB_PREFIX "zip" JNI_LIB_SUFFIX, RTLD_GLOBAL\|RTLD_LAZY);
70	if (addr == NULL) {
71	return NULL;
72	}
73	addr = dlsym(addr, name);
74	return addr;
75	#endif
76	}
77
78	/*
79	* Initialize the array of decompressors.
80	*/
81	int ImageDecompressor::_decompressors_num = `0`;
82	ImageDecompressor** ImageDecompressor::_decompressors = NULL;
83	void ImageDecompressor::image_decompressor_init() {
84	if (_decompressors == NULL) {
85	ZipInflateFully = (ZipInflateFully_t) findEntry("ZIP_InflateFully");
86	assert(ZipInflateFully != NULL && "ZIP decompressor not found.");
87	_decompressors_num = `2`;
88	_decompressors = new ImageDecompressor*[_decompressors_num];
89	_decompressors[`0`] = new ZipDecompressor ("zip");
90	_decompressors[`1`] = new SharedStringDecompressor ("compact-cp");
91	}
92	}
93
94	void ImageDecompressor::image_decompressor_close() {
95	delete[] _decompressors;
96	}
97
98	/*
99	* Locate decompressor.
100	*/
101	ImageDecompressor* ImageDecompressor::get_decompressor(const char * decompressor_name) {
102	image_decompressor_init();
103	for (int i = `0`; i < _decompressors_num; i++) {
104	ImageDecompressor* decompressor = _decompressors[i];
105	assert(decompressor != NULL && "Decompressors not initialized.");
106	if (strcmp(decompressor->get_name(), decompressor_name) == `0`) {
107	return decompressor;
108	}
109	}
110	assert(false && "No decompressor found.");
111	return NULL;
112	}
113
114	// Sparc to read unaligned content
115	// u8 l = ((u8) ptr);
116	// If ptr is not aligned, sparc will fail.
117	u8 ImageDecompressor::getU8(u1* ptr, Endian *endian) {
118	u8 ret;
119	if (endian->is_big_endian()) {
120	ret = (u8)ptr[`0`] << `56` \| (u8)ptr[`1`] << `48` \| (u8)ptr[`2`]<<`40` \| (u8)ptr[`3`]<<`32` \|
121	ptr[`4`]<<`24` \| ptr[`5`]<<`16` \| ptr[`6`]<<`8` \| ptr[`7`];
122	} else {
123	ret = ptr[`0`] \| ptr[`1`]<<`8` \| ptr[`2`]<<`16` \| ptr[`3`]<<`24` \| (u8)ptr[`4`]<<`32` \|
124	(u8)ptr[`5`]<<`40` \| (u8)ptr[`6`]<<`48` \| (u8)ptr[`7`]<<`56`;
125	}
126	return ret;
127	}
128
129	u4 ImageDecompressor::getU4(u1* ptr, Endian *endian) {
130	u4 ret;
131	if (endian->is_big_endian()) {
132	ret = ptr[`0`] << `24` \| ptr[`1`]<<`16` \| (ptr[`2`]<<`8`) \| ptr[`3`];
133	} else {
134	ret = ptr[`0`] \| ptr[`1`]<<`8` \| (ptr[`2`]<<`16`) \| ptr[`3`]<<`24`;
135	}
136	return ret;
137	}
138
139	/*
140	* Decompression entry point. Called from ImageFileReader::get_resource.
141	*/
142	void ImageDecompressor::decompress_resource(u1* compressed, u1* uncompressed,
143	u8 uncompressed_size, const ImageStrings* strings, Endian *endian) {
144	bool has_header = false;
145	u1* decompressed_resource = compressed;
146	u1* compressed_resource = compressed;
147	// Resource could have been transformed by a stack of decompressors.
148	// Iterate and decompress resources until there is no more header.
149	do {
150	ResourceHeader _header;
151	u1* compressed_resource_base = compressed_resource;
152	_header._magic = getU4(compressed_resource, endian);
153	compressed_resource += `4`;
154	_header._size = getU8(compressed_resource, endian);
155	compressed_resource += `8`;
156	_header._uncompressed_size = getU8(compressed_resource, endian);
157	compressed_resource += `8`;
158	_header._decompressor_name_offset = getU4(compressed_resource, endian);
159	compressed_resource += `4`;
160	_header._decompressor_config_offset = getU4(compressed_resource, endian);
161	compressed_resource += `4`;
162	_header._is_terminal = *compressed_resource;
163	compressed_resource += `1`;
164	has_header = _header._magic == ResourceHeader::resource_header_magic;
165	if (has_header) {
166	// decompressed_resource array contains the result of decompression
167	decompressed_resource = new u1[(size_t) _header._uncompressed_size];
168	// Retrieve the decompressor name
169	const char* decompressor_name = strings->get(_header._decompressor_name_offset);
170	assert(decompressor_name && "image decompressor not found");
171	// Retrieve the decompressor instance
172	ImageDecompressor* decompressor = get_decompressor(decompressor_name);
173	assert(decompressor && "image decompressor not found");
174	// Ask the decompressor to decompress the compressed content
175	decompressor->decompress_resource(compressed_resource, decompressed_resource,
176	&_header, strings);
177	if (compressed_resource_base != compressed) {
178	delete[] compressed_resource_base;
179	}
180	compressed_resource = decompressed_resource;
181	}
182	} while (has_header);
183	memcpy(uncompressed, decompressed_resource, (size_t) uncompressed_size);
184	delete[] decompressed_resource;
185	}
186
187	// Zip decompressor
188
189	void ZipDecompressor::decompress_resource(u1* data, u1* uncompressed,
190	ResourceHeader* header, const ImageStrings* strings) {
191	char* msg = NULL;
192	jboolean res = ZipDecompressor::decompress(data, header->_size, uncompressed,
193	header->_uncompressed_size, &msg);
194	assert(res && "decompression failed");
195	}
196
197	jboolean ZipDecompressor::decompress(void in, u8 inSize, void* out, u8 outSize, char* **pmsg) {
198	return (*ZipInflateFully)(in, inSize, out, outSize, pmsg);
199	}
200
201	// END Zip Decompressor
202
203	// Shared String decompressor
204
205	// array index is the constant pool tag. value is size.
206	// eg: array[5] = 8; means size of long is 8 bytes.
207	const u1 SharedStringDecompressor::sizes[] = {
208	`0`, `0`, `0`, `4`, `4`, `8`, `8`, `2`, `2`, `4`, `4`, `4`, `4`, `0`, `0`, `3`, `2`, `0`, `4`
209	};
210	/**
211	* Recreate the class by reconstructing the constant pool.
212	*/
213	void SharedStringDecompressor::decompress_resource(u1* data,
214	u1* uncompressed_resource,
215	ResourceHeader* header, const ImageStrings* strings) {
216	u1* uncompressed_base = uncompressed_resource;
217	u1* data_base = data;
218	int header_size = `8`; // magic + major + minor
219	memcpy(uncompressed_resource, data, header_size + `2`); //+ cp count
220	uncompressed_resource += header_size + `2`;
221	data += header_size;
222	u2 cp_count = Endian::get_java(data);
223	data += `2`;
224	for (int i = `1`; i < cp_count; i++) {
225	u1 tag = *data;
226	data += `1`;
227	switch (tag) {
228
229	case externalized_string:
230	{ // String in Strings table
231	*uncompressed_resource = `1`;
232	uncompressed_resource += `1`;
233	int k = decompress_int(data);
234	const char * string = strings->get(k);
235	int str_length = (int) strlen(string);
236	Endian::set_java(uncompressed_resource, str_length);
237	uncompressed_resource += `2`;
238	memcpy(uncompressed_resource, string, str_length);
239	uncompressed_resource += str_length;
240	break;
241	}
242	// Descriptor String has been split and types added to Strings table
243	case externalized_string_descriptor:
244	{
245	*uncompressed_resource = `1`;
246	uncompressed_resource += `1`;
247	int descriptor_index = decompress_int(data);
248	int indexes_length = decompress_int(data);
249	u1* length_address = uncompressed_resource;
250	uncompressed_resource += `2`;
251	int desc_length = `0`;
252	const char * desc_string = strings->get(descriptor_index);
253	if (indexes_length > `0`) {
254	u1* indexes_base = data;
255	data += indexes_length;
256	char c = *desc_string;
257	do {
258	*uncompressed_resource = c;
259	uncompressed_resource++;
260	desc_length += `1`;
261	/*
262	* Every L character is the marker we are looking at in order
263	* to reconstruct the descriptor. Each time an L is found, then
264	* we retrieve the couple token/token at the current index and
265	* add it to the descriptor.
266	* "(L;I)V" and "java/lang","String" couple of tokens,
267	* this becomes "(Ljava/lang/String;I)V"
268	*/
269	if (c == `'L'`) {
270	int index = decompress_int(indexes_base);
271	const char * pkg = strings->get(index);
272	int str_length = (int) strlen(pkg);
273	// the case where we have a package.
274	// reconstruct the type full name
275	if (str_length > `0`) {
276	int len = str_length + `1`;
277	char* fullpkg = new char[len];
278	char* pkg_base = fullpkg;
279	memcpy(fullpkg, pkg, str_length);
280	fullpkg += str_length;
281	*fullpkg = `'/'`;
282	memcpy(uncompressed_resource, pkg_base, len);
283	uncompressed_resource += len;
284	delete[] pkg_base;
285	desc_length += len;
286	} else { // Empty package
287	// Nothing to do.
288	}
289	int classIndex = decompress_int(indexes_base);
290	const char * clazz = strings->get(classIndex);
291	int clazz_length = (int) strlen(clazz);
292	memcpy(uncompressed_resource, clazz, clazz_length);
293	uncompressed_resource += clazz_length;
294	desc_length += clazz_length;
295	}
296	desc_string += `1`;
297	c = *desc_string;
298	} while (c != `'\0'`);
299	} else {
300	desc_length = (int) strlen(desc_string);
301	memcpy(uncompressed_resource, desc_string, desc_length);
302	uncompressed_resource += desc_length;
303	}
304	Endian::set_java(length_address, desc_length);
305	break;
306	}
307
308	case constant_utf8:
309	{ // UTF-8
310	*uncompressed_resource = tag;
311	uncompressed_resource += `1`;
312	u2 str_length = Endian::get_java(data);
313	int len = str_length + `2`;
314	memcpy(uncompressed_resource, data, len);
315	uncompressed_resource += len;
316	data += len;
317	break;
318	}
319
320	case constant_long:
321	case constant_double:
322	{
323	i++;
324	}
325	/ fall through /
326	default:
327	{
328	*uncompressed_resource = tag;
329	uncompressed_resource += `1`;
330	int size = sizes[tag];
331	memcpy(uncompressed_resource, data, size);
332	uncompressed_resource += size;
333	data += size;
334	}
335	}
336	}
337	u8 remain = header->_size - (int)(data - data_base);
338	u8 computed = (u8)(uncompressed_resource - uncompressed_base) + remain;
339	if (header->_uncompressed_size != computed)
340	printf("Failure, expecting %llu but getting %llu\n", header->_uncompressed_size,
341	computed);
342	assert(header->_uncompressed_size == computed &&
343	"Constant Pool reconstruction failed");
344	memcpy(uncompressed_resource, data, (size_t) remain);
345	}
346
347	/*
348	* Decompress integers. Compressed integers are negative.
349	* If positive, the integer is not decompressed.
350	* If negative, length extracted from the first byte, then reconstruct the integer
351	* from the following bytes.
352	* Example of compression: 1 is compressed on 1 byte: 10100001
353	*/
354	int SharedStringDecompressor::decompress_int(unsigned char*& value) {
355	int len = `4`;
356	int res = `0`;
357	char b1 = *value;
358	if (is_compressed((signed char)b1)) { // compressed
359	len = get_compressed_length(b1);
360	char clearedValue = b1 &= `0x1F`;
361	if (len == `1`) {
362	res = clearedValue;
363	} else {
364	res = (clearedValue & `0xFF`) << `8` * (len - `1`);
365	for (int i = `1`; i < len; i++) {
366	res \|= (value[i]&`0xFF`) << `8` * (len - i - `1`);
367	}
368	}
369	} else {
370	res = (value[`0`] & `0xFF`) << `24` \| (value[`1`]&`0xFF`) << `16` \|
371	(value[`2`]&`0xFF`) << `8` \| (value[`3`]&`0xFF`);
372	}
373	value += len;
374	return res;
375	}
376	// END Shared String decompressor
377

Browse the source code of OpenJDK/src/java.base/share/native/libjimage/imageDecompressor.cpp