|
1 /* |
|
2 * Copyright (c) 2015, 2016, Oracle and/or its affiliates. All rights reserved. |
|
3 * |
|
4 * Redistribution and use in source and binary forms, with or without |
|
5 * modification, are permitted provided that the following conditions |
|
6 * are met: |
|
7 * |
|
8 * - Redistributions of source code must retain the above copyright |
|
9 * notice, this list of conditions and the following disclaimer. |
|
10 * |
|
11 * - Redistributions in binary form must reproduce the above copyright |
|
12 * notice, this list of conditions and the following disclaimer in the |
|
13 * documentation and/or other materials provided with the distribution. |
|
14 * |
|
15 * - Neither the name of Oracle nor the names of its |
|
16 * contributors may be used to endorse or promote products derived |
|
17 * from this software without specific prior written permission. |
|
18 * |
|
19 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS |
|
20 * IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, |
|
21 * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
|
22 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR |
|
23 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
|
24 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
|
25 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
|
26 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF |
|
27 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING |
|
28 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
|
29 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
30 */ |
|
31 |
|
32 #ifndef LIBJIMAGE_IMAGEDECOMPRESSOR_HPP |
|
33 #define LIBJIMAGE_IMAGEDECOMPRESSOR_HPP |
|
34 |
|
35 #include <assert.h> |
|
36 #include <string.h> |
|
37 |
|
38 #include "imageFile.hpp" |
|
39 #include "inttypes.hpp" |
|
40 #include "jni.h" |
|
41 |
|
42 /* |
|
43 * Compressed resources located in image have an header. |
|
44 * This header contains: |
|
45 * - _magic: A magic u4, required to retrieved the header in the compressed content |
|
46 * - _size: The size of the compressed resource. |
|
47 * - _uncompressed_size: The uncompressed size of the compressed resource. |
|
48 * - _decompressor_name_offset: The ImageDecompressor instance name StringsTable offset. |
|
49 * - _decompressor_config_offset: StringsTable offset of configuration that could be needed by |
|
50 * the decompressor in order to decompress. |
|
51 * - _is_terminal: 1: the compressed content is terminal. Uncompressing it would |
|
52 * create the actual resource. 0: the compressed content is not terminal. Uncompressing it |
|
53 * will result in a compressed content to be decompressed (This occurs when a stack of compressors |
|
54 * have been used to compress the resource. |
|
55 */ |
|
56 struct ResourceHeader { |
|
57 /* magic bytes that identifies a compressed resource header*/ |
|
58 static const u4 resource_header_magic = 0xCAFEFAFA; |
|
59 u4 _magic; // Resource header |
|
60 u8 _size; // Resource size |
|
61 u8 _uncompressed_size; // Expected uncompressed size |
|
62 u4 _decompressor_name_offset; // Strings table decompressor offset |
|
63 u4 _decompressor_config_offset; // Strings table config offset |
|
64 u1 _is_terminal; // Last decompressor 1, otherwise 0. |
|
65 }; |
|
66 |
|
67 /* |
|
68 * Resources located in jimage file can be compressed. Compression occurs at |
|
69 * jimage file creation time. When compressed a resource is added an header that |
|
70 * contains the name of the compressor that compressed it. |
|
71 * Various compression strategies can be applied to compress a resource. |
|
72 * The same resource can even be compressed multiple time by a stack of compressors. |
|
73 * At runtime, a resource is decompressed in a loop until there is no more header |
|
74 * meaning that the resource is equivalent to the not compressed resource. |
|
75 * In each iteration, the name of the compressor located in the current header |
|
76 * is used to retrieve the associated instance of ImageDecompressor. |
|
77 * For example "zip" is the name of the compressor that compresses resources |
|
78 * using the zip algorithm. The ZipDecompressor class name is also "zip". |
|
79 * ImageDecompressor instances are retrieved from a static array in which |
|
80 * they are registered. |
|
81 */ |
|
82 class ImageDecompressor { |
|
83 |
|
84 private: |
|
85 const char* _name; |
|
86 |
|
87 /* |
|
88 * Array of concrete decompressors. This array is used to retrieve the decompressor |
|
89 * that can handle resource decompression. |
|
90 */ |
|
91 static ImageDecompressor** _decompressors; |
|
92 /** |
|
93 * Num of decompressors |
|
94 */ |
|
95 static int _decompressors_num; |
|
96 /* |
|
97 * Identifier of a decompressor. This name is the identification key to retrieve |
|
98 * decompressor from a resource header. |
|
99 */ |
|
100 inline const char* get_name() const { return _name; } |
|
101 |
|
102 static u8 getU8(u1* ptr, Endian *endian); |
|
103 static u4 getU4(u1* ptr, Endian *endian); |
|
104 |
|
105 protected: |
|
106 ImageDecompressor(const char* name) : _name(name) { |
|
107 } |
|
108 virtual void decompress_resource(u1* data, u1* uncompressed, |
|
109 ResourceHeader* header, const ImageStrings* strings) = 0; |
|
110 |
|
111 public: |
|
112 static void image_decompressor_init(); |
|
113 static void image_decompressor_close(); |
|
114 static ImageDecompressor* get_decompressor(const char * decompressor_name) ; |
|
115 static void decompress_resource(u1* compressed, u1* uncompressed, |
|
116 u8 uncompressed_size, const ImageStrings* strings, Endian* _endian); |
|
117 }; |
|
118 |
|
119 /** |
|
120 * Zip decompressor. |
|
121 */ |
|
122 class ZipDecompressor : public ImageDecompressor { |
|
123 public: |
|
124 ZipDecompressor(const char* sym) : ImageDecompressor(sym) { } |
|
125 void decompress_resource(u1* data, u1* uncompressed, ResourceHeader* header, |
|
126 const ImageStrings* strings); |
|
127 static jboolean decompress(void *in, u8 inSize, void *out, u8 outSize, char **pmsg); |
|
128 }; |
|
129 |
|
130 /* |
|
131 * Shared Strings decompressor. This decompressor reconstruct the class |
|
132 * constant pool UTF_U entries by retrieving strings stored in jimage strings table. |
|
133 * In addition, if the UTF_8 entry is a descriptor, the descriptor has to be rebuilt, |
|
134 * all java type having been removed from the descriptor and added to the sting table. |
|
135 * eg: "(Ljava/lang/String;I)V" ==> "(L;I)V" and "java/lang", "String" |
|
136 * stored in string table. offsets to the 2 strings are compressed and stored in the |
|
137 * constantpool entry. |
|
138 */ |
|
139 class SharedStringDecompressor : public ImageDecompressor { |
|
140 private: |
|
141 // the constant pool tag for UTF8 string located in strings table |
|
142 static const int externalized_string = 23; |
|
143 // the constant pool tag for UTF8 descriptors string located in strings table |
|
144 static const int externalized_string_descriptor = 25; |
|
145 // the constant pool tag for UTF8 |
|
146 static const int constant_utf8 = 1; |
|
147 // the constant pool tag for long |
|
148 static const int constant_long = 5; |
|
149 // the constant pool tag for double |
|
150 static const int constant_double = 6; |
|
151 // array index is the constant pool tag. value is size. |
|
152 // eg: array[5] = 8; means size of long is 8 bytes. |
|
153 static const u1 sizes[]; |
|
154 // bit 5 and 6 are used to store the length of the compressed integer. |
|
155 // size can be 1 (01), 2 (10), 3 (11). |
|
156 // 0x60 ==> 0110000 |
|
157 static const int compressed_index_size_mask = 0x60; |
|
158 /* |
|
159 * mask the length bits (5 and 6) and move to the right 5 bits. |
|
160 */ |
|
161 inline static int get_compressed_length(char c) { |
|
162 return ((char) (c & compressed_index_size_mask) >> 5); |
|
163 } |
|
164 inline static bool is_compressed(signed char b1) { return b1 < 0; } |
|
165 static int decompress_int(unsigned char*& value); |
|
166 public: |
|
167 SharedStringDecompressor(const char* sym) : ImageDecompressor(sym){} |
|
168 void decompress_resource(u1* data, u1* uncompressed, ResourceHeader* header, |
|
169 const ImageStrings* strings); |
|
170 }; |
|
171 #endif // LIBJIMAGE_IMAGEDECOMPRESSOR_HPP |