1 | // jpgd.h - C++ class for JPEG decompression. |
2 | // Public domain, Rich Geldreich <richgel99@gmail.com> |
3 | #ifndef JPEG_DECODER_H |
4 | #define JPEG_DECODER_H |
5 | |
6 | #include <stdlib.h> |
7 | #include <stdio.h> |
8 | #include <setjmp.h> |
9 | #include <assert.h> |
10 | #include <stdint.h> |
11 | |
12 | #ifdef _MSC_VER |
13 | #define JPGD_NORETURN __declspec(noreturn) |
14 | #elif defined(__GNUC__) |
15 | #define JPGD_NORETURN __attribute__ ((noreturn)) |
16 | #else |
17 | #define JPGD_NORETURN |
18 | #endif |
19 | |
20 | #define JPGD_HUFF_TREE_MAX_LENGTH 512 |
21 | #define JPGD_HUFF_CODE_SIZE_MAX_LENGTH 256 |
22 | |
23 | namespace jpgd |
24 | { |
25 | typedef unsigned char uint8; |
26 | typedef signed short int16; |
27 | typedef unsigned short uint16; |
28 | typedef unsigned int uint; |
29 | typedef signed int int32; |
30 | |
31 | // Loads a JPEG image from a memory buffer or a file. |
32 | // req_comps can be 1 (grayscale), 3 (RGB), or 4 (RGBA). |
33 | // On return, width/height will be set to the image's dimensions, and actual_comps will be set to the either 1 (grayscale) or 3 (RGB). |
34 | // Notes: For more control over where and how the source data is read, see the decompress_jpeg_image_from_stream() function below, or call the jpeg_decoder class directly. |
35 | // Requesting a 8 or 32bpp image is currently a little faster than 24bpp because the jpeg_decoder class itself currently always unpacks to either 8 or 32bpp. |
36 | unsigned char* decompress_jpeg_image_from_memory(const unsigned char* pSrc_data, int src_data_size, int* width, int* height, int* actual_comps, int req_comps, uint32_t flags = 0); |
37 | unsigned char* decompress_jpeg_image_from_file(const char* pSrc_filename, int* width, int* height, int* actual_comps, int req_comps, uint32_t flags = 0); |
38 | |
39 | // Success/failure error codes. |
40 | enum jpgd_status |
41 | { |
42 | JPGD_SUCCESS = 0, JPGD_FAILED = -1, JPGD_DONE = 1, |
43 | JPGD_BAD_DHT_COUNTS = -256, JPGD_BAD_DHT_INDEX, JPGD_BAD_DHT_MARKER, JPGD_BAD_DQT_MARKER, JPGD_BAD_DQT_TABLE, |
44 | JPGD_BAD_PRECISION, JPGD_BAD_HEIGHT, JPGD_BAD_WIDTH, JPGD_TOO_MANY_COMPONENTS, |
45 | JPGD_BAD_SOF_LENGTH, JPGD_BAD_VARIABLE_MARKER, JPGD_BAD_DRI_LENGTH, JPGD_BAD_SOS_LENGTH, |
46 | JPGD_BAD_SOS_COMP_ID, , JPGD_NO_ARITHMITIC_SUPPORT, JPGD_UNEXPECTED_MARKER, |
47 | JPGD_NOT_JPEG, JPGD_UNSUPPORTED_MARKER, JPGD_BAD_DQT_LENGTH, JPGD_TOO_MANY_BLOCKS, |
48 | JPGD_UNDEFINED_QUANT_TABLE, JPGD_UNDEFINED_HUFF_TABLE, JPGD_NOT_SINGLE_SCAN, JPGD_UNSUPPORTED_COLORSPACE, |
49 | JPGD_UNSUPPORTED_SAMP_FACTORS, JPGD_DECODE_ERROR, JPGD_BAD_RESTART_MARKER, |
50 | JPGD_BAD_SOS_SPECTRAL, JPGD_BAD_SOS_SUCCESSIVE, JPGD_STREAM_READ, JPGD_NOTENOUGHMEM, JPGD_TOO_MANY_SCANS |
51 | }; |
52 | |
53 | // Input stream interface. |
54 | // Derive from this class to read input data from sources other than files or memory. Set m_eof_flag to true when no more data is available. |
55 | // The decoder is rather greedy: it will keep on calling this method until its internal input buffer is full, or until the EOF flag is set. |
56 | // It the input stream contains data after the JPEG stream's EOI (end of image) marker it will probably be pulled into the internal buffer. |
57 | // Call the get_total_bytes_read() method to determine the actual size of the JPEG stream after successful decoding. |
58 | class jpeg_decoder_stream |
59 | { |
60 | public: |
61 | jpeg_decoder_stream() { } |
62 | virtual ~jpeg_decoder_stream() { } |
63 | |
64 | // The read() method is called when the internal input buffer is empty. |
65 | // Parameters: |
66 | // pBuf - input buffer |
67 | // max_bytes_to_read - maximum bytes that can be written to pBuf |
68 | // pEOF_flag - set this to true if at end of stream (no more bytes remaining) |
69 | // Returns -1 on error, otherwise return the number of bytes actually written to the buffer (which may be 0). |
70 | // Notes: This method will be called in a loop until you set *pEOF_flag to true or the internal buffer is full. |
71 | virtual int read(uint8* pBuf, int max_bytes_to_read, bool* pEOF_flag) = 0; |
72 | }; |
73 | |
74 | // stdio FILE stream class. |
75 | class jpeg_decoder_file_stream : public jpeg_decoder_stream |
76 | { |
77 | jpeg_decoder_file_stream(const jpeg_decoder_file_stream&); |
78 | jpeg_decoder_file_stream& operator =(const jpeg_decoder_file_stream&); |
79 | |
80 | FILE* m_pFile; |
81 | bool m_eof_flag, m_error_flag; |
82 | |
83 | public: |
84 | jpeg_decoder_file_stream(); |
85 | virtual ~jpeg_decoder_file_stream(); |
86 | |
87 | bool open(const char* Pfilename); |
88 | void close(); |
89 | |
90 | virtual int read(uint8* pBuf, int max_bytes_to_read, bool* pEOF_flag); |
91 | }; |
92 | |
93 | // Memory stream class. |
94 | class jpeg_decoder_mem_stream : public jpeg_decoder_stream |
95 | { |
96 | const uint8* m_pSrc_data; |
97 | uint m_ofs, m_size; |
98 | |
99 | public: |
100 | jpeg_decoder_mem_stream() : m_pSrc_data(NULL), m_ofs(0), m_size(0) { } |
101 | jpeg_decoder_mem_stream(const uint8* pSrc_data, uint size) : m_pSrc_data(pSrc_data), m_ofs(0), m_size(size) { } |
102 | |
103 | virtual ~jpeg_decoder_mem_stream() { } |
104 | |
105 | bool open(const uint8* pSrc_data, uint size); |
106 | void close() { m_pSrc_data = NULL; m_ofs = 0; m_size = 0; } |
107 | |
108 | virtual int read(uint8* pBuf, int max_bytes_to_read, bool* pEOF_flag); |
109 | }; |
110 | |
111 | // Loads JPEG file from a jpeg_decoder_stream. |
112 | unsigned char* decompress_jpeg_image_from_stream(jpeg_decoder_stream* pStream, int* width, int* height, int* actual_comps, int req_comps, uint32_t flags = 0); |
113 | |
114 | enum |
115 | { |
116 | JPGD_IN_BUF_SIZE = 8192, JPGD_MAX_BLOCKS_PER_MCU = 10, JPGD_MAX_HUFF_TABLES = 8, JPGD_MAX_QUANT_TABLES = 4, |
117 | JPGD_MAX_COMPONENTS = 4, JPGD_MAX_COMPS_IN_SCAN = 4, JPGD_MAX_BLOCKS_PER_ROW = 16384, JPGD_MAX_HEIGHT = 32768, JPGD_MAX_WIDTH = 32768 |
118 | }; |
119 | |
120 | typedef int16 jpgd_quant_t; |
121 | typedef int16 jpgd_block_t; |
122 | |
123 | class jpeg_decoder |
124 | { |
125 | public: |
126 | enum |
127 | { |
128 | cFlagLinearChromaFiltering = 1 |
129 | }; |
130 | |
131 | // Call get_error_code() after constructing to determine if the stream is valid or not. You may call the get_width(), get_height(), etc. |
132 | // methods after the constructor is called. You may then either destruct the object, or begin decoding the image by calling begin_decoding(), then decode() on each scanline. |
133 | jpeg_decoder(jpeg_decoder_stream* pStream, uint32_t flags = cFlagLinearChromaFiltering); |
134 | |
135 | ~jpeg_decoder(); |
136 | |
137 | // Call this method after constructing the object to begin decompression. |
138 | // If JPGD_SUCCESS is returned you may then call decode() on each scanline. |
139 | |
140 | int begin_decoding(); |
141 | |
142 | // Returns the next scan line. |
143 | // For grayscale images, pScan_line will point to a buffer containing 8-bit pixels (get_bytes_per_pixel() will return 1). |
144 | // Otherwise, it will always point to a buffer containing 32-bit RGBA pixels (A will always be 255, and get_bytes_per_pixel() will return 4). |
145 | // Returns JPGD_SUCCESS if a scan line has been returned. |
146 | // Returns JPGD_DONE if all scan lines have been returned. |
147 | // Returns JPGD_FAILED if an error occurred. Call get_error_code() for a more info. |
148 | int decode(const void** pScan_line, uint* pScan_line_len); |
149 | |
150 | inline jpgd_status get_error_code() const { return m_error_code; } |
151 | |
152 | inline int get_width() const { return m_image_x_size; } |
153 | inline int get_height() const { return m_image_y_size; } |
154 | |
155 | inline int get_num_components() const { return m_comps_in_frame; } |
156 | |
157 | inline int get_bytes_per_pixel() const { return m_dest_bytes_per_pixel; } |
158 | inline int get_bytes_per_scan_line() const { return m_image_x_size * get_bytes_per_pixel(); } |
159 | |
160 | // Returns the total number of bytes actually consumed by the decoder (which should equal the actual size of the JPEG file). |
161 | inline int get_total_bytes_read() const { return m_total_bytes_read; } |
162 | |
163 | private: |
164 | jpeg_decoder(const jpeg_decoder&); |
165 | jpeg_decoder& operator =(const jpeg_decoder&); |
166 | |
167 | typedef void (*pDecode_block_func)(jpeg_decoder*, int, int, int); |
168 | |
169 | struct huff_tables |
170 | { |
171 | bool ac_table; |
172 | uint look_up[256]; |
173 | uint look_up2[256]; |
174 | uint8 code_size[JPGD_HUFF_CODE_SIZE_MAX_LENGTH]; |
175 | uint tree[JPGD_HUFF_TREE_MAX_LENGTH]; |
176 | }; |
177 | |
178 | struct coeff_buf |
179 | { |
180 | uint8* pData; |
181 | int block_num_x, block_num_y; |
182 | int block_len_x, block_len_y; |
183 | int block_size; |
184 | }; |
185 | |
186 | struct mem_block |
187 | { |
188 | mem_block* m_pNext; |
189 | size_t m_used_count; |
190 | size_t m_size; |
191 | char m_data[1]; |
192 | }; |
193 | |
194 | jmp_buf m_jmp_state; |
195 | uint32_t m_flags; |
196 | mem_block* m_pMem_blocks; |
197 | int m_image_x_size; |
198 | int m_image_y_size; |
199 | jpeg_decoder_stream* m_pStream; |
200 | |
201 | int m_progressive_flag; |
202 | |
203 | uint8 m_huff_ac[JPGD_MAX_HUFF_TABLES]; |
204 | uint8* m_huff_num[JPGD_MAX_HUFF_TABLES]; // pointer to number of Huffman codes per bit size |
205 | uint8* m_huff_val[JPGD_MAX_HUFF_TABLES]; // pointer to Huffman codes per bit size |
206 | jpgd_quant_t* m_quant[JPGD_MAX_QUANT_TABLES]; // pointer to quantization tables |
207 | int m_scan_type; // Gray, Yh1v1, Yh1v2, Yh2v1, Yh2v2 (CMYK111, CMYK4114 no longer supported) |
208 | int m_comps_in_frame; // # of components in frame |
209 | int m_comp_h_samp[JPGD_MAX_COMPONENTS]; // component's horizontal sampling factor |
210 | int m_comp_v_samp[JPGD_MAX_COMPONENTS]; // component's vertical sampling factor |
211 | int m_comp_quant[JPGD_MAX_COMPONENTS]; // component's quantization table selector |
212 | int m_comp_ident[JPGD_MAX_COMPONENTS]; // component's ID |
213 | int m_comp_h_blocks[JPGD_MAX_COMPONENTS]; |
214 | int m_comp_v_blocks[JPGD_MAX_COMPONENTS]; |
215 | int m_comps_in_scan; // # of components in scan |
216 | int m_comp_list[JPGD_MAX_COMPS_IN_SCAN]; // components in this scan |
217 | int m_comp_dc_tab[JPGD_MAX_COMPONENTS]; // component's DC Huffman coding table selector |
218 | int m_comp_ac_tab[JPGD_MAX_COMPONENTS]; // component's AC Huffman coding table selector |
219 | int m_spectral_start; // spectral selection start |
220 | int m_spectral_end; // spectral selection end |
221 | int m_successive_low; // successive approximation low |
222 | int m_successive_high; // successive approximation high |
223 | int m_max_mcu_x_size; // MCU's max. X size in pixels |
224 | int m_max_mcu_y_size; // MCU's max. Y size in pixels |
225 | int m_blocks_per_mcu; |
226 | int m_max_blocks_per_row; |
227 | int m_mcus_per_row, m_mcus_per_col; |
228 | int m_mcu_org[JPGD_MAX_BLOCKS_PER_MCU]; |
229 | int m_total_lines_left; // total # lines left in image |
230 | int m_mcu_lines_left; // total # lines left in this MCU |
231 | int m_num_buffered_scanlines; |
232 | int m_real_dest_bytes_per_scan_line; |
233 | int m_dest_bytes_per_scan_line; // rounded up |
234 | int m_dest_bytes_per_pixel; // 4 (RGB) or 1 (Y) |
235 | huff_tables* m_pHuff_tabs[JPGD_MAX_HUFF_TABLES]; |
236 | coeff_buf* m_dc_coeffs[JPGD_MAX_COMPONENTS]; |
237 | coeff_buf* m_ac_coeffs[JPGD_MAX_COMPONENTS]; |
238 | int m_eob_run; |
239 | int m_block_y_mcu[JPGD_MAX_COMPONENTS]; |
240 | uint8* m_pIn_buf_ofs; |
241 | int m_in_buf_left; |
242 | int m_tem_flag; |
243 | |
244 | uint8 m_in_buf_pad_start[64]; |
245 | uint8 m_in_buf[JPGD_IN_BUF_SIZE + 128]; |
246 | uint8 m_in_buf_pad_end[64]; |
247 | |
248 | int m_bits_left; |
249 | uint m_bit_buf; |
250 | int m_restart_interval; |
251 | int m_restarts_left; |
252 | int m_next_restart_num; |
253 | int m_max_mcus_per_row; |
254 | int m_max_blocks_per_mcu; |
255 | |
256 | int m_max_mcus_per_col; |
257 | uint m_last_dc_val[JPGD_MAX_COMPONENTS]; |
258 | jpgd_block_t* m_pMCU_coefficients; |
259 | int m_mcu_block_max_zag[JPGD_MAX_BLOCKS_PER_MCU]; |
260 | uint8* m_pSample_buf; |
261 | uint8* m_pSample_buf_prev; |
262 | int m_crr[256]; |
263 | int m_cbb[256]; |
264 | int m_crg[256]; |
265 | int m_cbg[256]; |
266 | uint8* m_pScan_line_0; |
267 | uint8* m_pScan_line_1; |
268 | jpgd_status m_error_code; |
269 | int m_total_bytes_read; |
270 | |
271 | bool m_ready_flag; |
272 | bool m_eof_flag; |
273 | bool m_sample_buf_prev_valid; |
274 | |
275 | inline int check_sample_buf_ofs(int ofs) const { assert(ofs >= 0); assert(ofs < m_max_blocks_per_row * 64); return ofs; } |
276 | void free_all_blocks(); |
277 | JPGD_NORETURN void stop_decoding(jpgd_status status); |
278 | void* alloc(size_t n, bool zero = false); |
279 | void word_clear(void* p, uint16 c, uint n); |
280 | void prep_in_buffer(); |
281 | void read_dht_marker(); |
282 | void read_dqt_marker(); |
283 | void read_sof_marker(); |
284 | void skip_variable_marker(); |
285 | void read_dri_marker(); |
286 | void read_sos_marker(); |
287 | int next_marker(); |
288 | int process_markers(); |
289 | void locate_soi_marker(); |
290 | void locate_sof_marker(); |
291 | int locate_sos_marker(); |
292 | void init(jpeg_decoder_stream* pStream, uint32_t flags); |
293 | void create_look_ups(); |
294 | void fix_in_buffer(); |
295 | void transform_mcu(int mcu_row); |
296 | coeff_buf* coeff_buf_open(int block_num_x, int block_num_y, int block_len_x, int block_len_y); |
297 | inline jpgd_block_t* coeff_buf_getp(coeff_buf* cb, int block_x, int block_y); |
298 | void load_next_row(); |
299 | void decode_next_row(); |
300 | void make_huff_table(int index, huff_tables* pH); |
301 | void check_quant_tables(); |
302 | void check_huff_tables(); |
303 | bool calc_mcu_block_order(); |
304 | int init_scan(); |
305 | void init_frame(); |
306 | void process_restart(); |
307 | void decode_scan(pDecode_block_func decode_block_func); |
308 | void init_progressive(); |
309 | void init_sequential(); |
310 | void decode_start(); |
311 | void decode_init(jpeg_decoder_stream* pStream, uint32_t flags); |
312 | void H2V2Convert(); |
313 | uint32_t H2V2ConvertFiltered(); |
314 | void H2V1Convert(); |
315 | void H2V1ConvertFiltered(); |
316 | void H1V2Convert(); |
317 | void H1V2ConvertFiltered(); |
318 | void H1V1Convert(); |
319 | void gray_convert(); |
320 | void find_eoi(); |
321 | inline uint get_char(); |
322 | inline uint get_char(bool* pPadding_flag); |
323 | inline void stuff_char(uint8 q); |
324 | inline uint8 get_octet(); |
325 | inline uint get_bits(int num_bits); |
326 | inline uint get_bits_no_markers(int numbits); |
327 | inline int huff_decode(huff_tables* pH); |
328 | inline int huff_decode(huff_tables* pH, int& ); |
329 | |
330 | // Clamps a value between 0-255. |
331 | static inline uint8 clamp(int i) |
332 | { |
333 | if (static_cast<uint>(i) > 255) |
334 | i = (((~i) >> 31) & 0xFF); |
335 | return static_cast<uint8>(i); |
336 | } |
337 | int decode_next_mcu_row(); |
338 | |
339 | static void decode_block_dc_first(jpeg_decoder* pD, int component_id, int block_x, int block_y); |
340 | static void decode_block_dc_refine(jpeg_decoder* pD, int component_id, int block_x, int block_y); |
341 | static void decode_block_ac_first(jpeg_decoder* pD, int component_id, int block_x, int block_y); |
342 | static void decode_block_ac_refine(jpeg_decoder* pD, int component_id, int block_x, int block_y); |
343 | }; |
344 | |
345 | } // namespace jpgd |
346 | |
347 | #endif // JPEG_DECODER_H |
348 | |