| 1 | /* |
| 2 | * Copyright (c) 2015, 2016, Oracle and/or its affiliates. All rights reserved. |
| 3 | * |
| 4 | * Redistribution and use in source and binary forms, with or without |
| 5 | * modification, are permitted provided that the following conditions |
| 6 | * are met: |
| 7 | * |
| 8 | * - Redistributions of source code must retain the above copyright |
| 9 | * notice, this list of conditions and the following disclaimer. |
| 10 | * |
| 11 | * - Redistributions in binary form must reproduce the above copyright |
| 12 | * notice, this list of conditions and the following disclaimer in the |
| 13 | * documentation and/or other materials provided with the distribution. |
| 14 | * |
| 15 | * - Neither the name of Oracle nor the names of its |
| 16 | * contributors may be used to endorse or promote products derived |
| 17 | * from this software without specific prior written permission. |
| 18 | * |
| 19 | * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS |
| 20 | * IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, |
| 21 | * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
| 22 | * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR |
| 23 | * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
| 24 | * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| 25 | * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| 26 | * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF |
| 27 | * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING |
| 28 | * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
| 29 | * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| 30 | */ |
| 31 | |
| 32 | #ifndef LIBJIMAGE_IMAGEDECOMPRESSOR_HPP |
| 33 | #define LIBJIMAGE_IMAGEDECOMPRESSOR_HPP |
| 34 | |
| 35 | #include <assert.h> |
| 36 | #include <string.h> |
| 37 | |
| 38 | #include "imageFile.hpp" |
| 39 | #include "inttypes.hpp" |
| 40 | #include "jni.h" |
| 41 | |
| 42 | /* |
| 43 | * Compressed resources located in image have an header. |
| 44 | * This header contains: |
| 45 | * - _magic: A magic u4, required to retrieved the header in the compressed content |
| 46 | * - _size: The size of the compressed resource. |
| 47 | * - _uncompressed_size: The uncompressed size of the compressed resource. |
| 48 | * - _decompressor_name_offset: The ImageDecompressor instance name StringsTable offset. |
| 49 | * - _decompressor_config_offset: StringsTable offset of configuration that could be needed by |
| 50 | * the decompressor in order to decompress. |
| 51 | * - _is_terminal: 1: the compressed content is terminal. Uncompressing it would |
| 52 | * create the actual resource. 0: the compressed content is not terminal. Uncompressing it |
| 53 | * will result in a compressed content to be decompressed (This occurs when a stack of compressors |
| 54 | * have been used to compress the resource. |
| 55 | */ |
| 56 | struct { |
| 57 | /* magic bytes that identifies a compressed resource header*/ |
| 58 | static const u4 = 0xCAFEFAFA; |
| 59 | u4 ; // Resource header |
| 60 | u8 ; // Resource size |
| 61 | u8 ; // Expected uncompressed size |
| 62 | u4 ; // Strings table decompressor offset |
| 63 | u4 ; // Strings table config offset |
| 64 | u1 ; // Last decompressor 1, otherwise 0. |
| 65 | }; |
| 66 | |
| 67 | /* |
| 68 | * Resources located in jimage file can be compressed. Compression occurs at |
| 69 | * jimage file creation time. When compressed a resource is added an header that |
| 70 | * contains the name of the compressor that compressed it. |
| 71 | * Various compression strategies can be applied to compress a resource. |
| 72 | * The same resource can even be compressed multiple time by a stack of compressors. |
| 73 | * At runtime, a resource is decompressed in a loop until there is no more header |
| 74 | * meaning that the resource is equivalent to the not compressed resource. |
| 75 | * In each iteration, the name of the compressor located in the current header |
| 76 | * is used to retrieve the associated instance of ImageDecompressor. |
| 77 | * For example "zip" is the name of the compressor that compresses resources |
| 78 | * using the zip algorithm. The ZipDecompressor class name is also "zip". |
| 79 | * ImageDecompressor instances are retrieved from a static array in which |
| 80 | * they are registered. |
| 81 | */ |
| 82 | class ImageDecompressor { |
| 83 | |
| 84 | private: |
| 85 | const char* _name; |
| 86 | |
| 87 | /* |
| 88 | * Array of concrete decompressors. This array is used to retrieve the decompressor |
| 89 | * that can handle resource decompression. |
| 90 | */ |
| 91 | static ImageDecompressor** _decompressors; |
| 92 | /** |
| 93 | * Num of decompressors |
| 94 | */ |
| 95 | static int _decompressors_num; |
| 96 | /* |
| 97 | * Identifier of a decompressor. This name is the identification key to retrieve |
| 98 | * decompressor from a resource header. |
| 99 | */ |
| 100 | inline const char* get_name() const { return _name; } |
| 101 | |
| 102 | static u8 getU8(u1* ptr, Endian *endian); |
| 103 | static u4 getU4(u1* ptr, Endian *endian); |
| 104 | |
| 105 | protected: |
| 106 | ImageDecompressor(const char* name) : _name(name) { |
| 107 | } |
| 108 | virtual void (u1* data, u1* uncompressed, |
| 109 | ResourceHeader* , const ImageStrings* strings) = 0; |
| 110 | |
| 111 | public: |
| 112 | static void image_decompressor_init(); |
| 113 | static void image_decompressor_close(); |
| 114 | static ImageDecompressor* get_decompressor(const char * decompressor_name) ; |
| 115 | static void decompress_resource(u1* compressed, u1* uncompressed, |
| 116 | u8 uncompressed_size, const ImageStrings* strings, Endian* _endian); |
| 117 | }; |
| 118 | |
| 119 | /** |
| 120 | * Zip decompressor. |
| 121 | */ |
| 122 | class ZipDecompressor : public ImageDecompressor { |
| 123 | public: |
| 124 | ZipDecompressor(const char* sym) : ImageDecompressor(sym) { } |
| 125 | void (u1* data, u1* uncompressed, ResourceHeader* , |
| 126 | const ImageStrings* strings); |
| 127 | static jboolean decompress(void *in, u8 inSize, void *out, u8 outSize, char **pmsg); |
| 128 | }; |
| 129 | |
| 130 | /* |
| 131 | * Shared Strings decompressor. This decompressor reconstruct the class |
| 132 | * constant pool UTF_U entries by retrieving strings stored in jimage strings table. |
| 133 | * In addition, if the UTF_8 entry is a descriptor, the descriptor has to be rebuilt, |
| 134 | * all java type having been removed from the descriptor and added to the sting table. |
| 135 | * eg: "(Ljava/lang/String;I)V" ==> "(L;I)V" and "java/lang", "String" |
| 136 | * stored in string table. offsets to the 2 strings are compressed and stored in the |
| 137 | * constantpool entry. |
| 138 | */ |
| 139 | class SharedStringDecompressor : public ImageDecompressor { |
| 140 | private: |
| 141 | // the constant pool tag for UTF8 string located in strings table |
| 142 | static const int externalized_string = 23; |
| 143 | // the constant pool tag for UTF8 descriptors string located in strings table |
| 144 | static const int externalized_string_descriptor = 25; |
| 145 | // the constant pool tag for UTF8 |
| 146 | static const int constant_utf8 = 1; |
| 147 | // the constant pool tag for long |
| 148 | static const int constant_long = 5; |
| 149 | // the constant pool tag for double |
| 150 | static const int constant_double = 6; |
| 151 | // array index is the constant pool tag. value is size. |
| 152 | // eg: array[5] = 8; means size of long is 8 bytes. |
| 153 | static const u1 sizes[]; |
| 154 | // bit 5 and 6 are used to store the length of the compressed integer. |
| 155 | // size can be 1 (01), 2 (10), 3 (11). |
| 156 | // 0x60 ==> 0110000 |
| 157 | static const int compressed_index_size_mask = 0x60; |
| 158 | /* |
| 159 | * mask the length bits (5 and 6) and move to the right 5 bits. |
| 160 | */ |
| 161 | inline static int get_compressed_length(char c) { |
| 162 | return ((char) (c & compressed_index_size_mask) >> 5); |
| 163 | } |
| 164 | inline static bool is_compressed(signed char b1) { return b1 < 0; } |
| 165 | static int decompress_int(unsigned char*& value); |
| 166 | public: |
| 167 | SharedStringDecompressor(const char* sym) : ImageDecompressor(sym){} |
| 168 | void (u1* data, u1* uncompressed, ResourceHeader* , |
| 169 | const ImageStrings* strings); |
| 170 | }; |
| 171 | #endif // LIBJIMAGE_IMAGEDECOMPRESSOR_HPP |
| 172 | |