1 | /******************************************************************** |
2 | * * |
3 | * THIS FILE IS PART OF THE OggTheora SOFTWARE CODEC SOURCE CODE. * |
4 | * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS * |
5 | * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE * |
6 | * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING. * |
7 | * * |
8 | * THE Theora SOURCE CODE IS COPYRIGHT (C) 2002-2009 * |
9 | * by the Xiph.Org Foundation and contributors http://www.xiph.org/ * |
10 | * * |
11 | ******************************************************************** |
12 | |
13 | function: |
14 | last mod: $Id$ |
15 | |
16 | ********************************************************************/ |
17 | |
18 | #include <limits.h> |
19 | #if !defined(_decint_H) |
20 | # define _decint_H (1) |
21 | # include "theora/theoradec.h" |
22 | # include "state.h" |
23 | # include "bitpack.h" |
24 | # include "huffdec.h" |
25 | # include "dequant.h" |
26 | |
27 | typedef struct th_setup_info oc_setup_info; |
28 | typedef struct oc_dec_opt_vtable oc_dec_opt_vtable; |
29 | typedef struct oc_dec_pipeline_state oc_dec_pipeline_state; |
30 | typedef struct th_dec_ctx oc_dec_ctx; |
31 | |
32 | |
33 | |
34 | /*Decoder-specific accelerated functions.*/ |
35 | # if defined(OC_C64X_ASM) |
36 | # include "c64x/c64xdec.h" |
37 | # endif |
38 | |
39 | # if !defined(oc_dec_accel_init) |
40 | # define oc_dec_accel_init oc_dec_accel_init_c |
41 | # endif |
42 | # if defined(OC_DEC_USE_VTABLE) |
43 | # if !defined(oc_dec_dc_unpredict_mcu_plane) |
44 | # define oc_dec_dc_unpredict_mcu_plane(_dec,_pipe,_pli) \ |
45 | ((*(_dec)->opt_vtable.dc_unpredict_mcu_plane)(_dec,_pipe,_pli)) |
46 | # endif |
47 | # else |
48 | # if !defined(oc_dec_dc_unpredict_mcu_plane) |
49 | # define oc_dec_dc_unpredict_mcu_plane oc_dec_dc_unpredict_mcu_plane_c |
50 | # endif |
51 | # endif |
52 | |
53 | |
54 | |
55 | /*Constants for the packet-in state machine specific to the decoder.*/ |
56 | |
57 | /*Next packet to read: Data packet.*/ |
58 | #define OC_PACKET_DATA (0) |
59 | |
60 | |
61 | |
62 | struct th_setup_info{ |
63 | /*The Huffman codes.*/ |
64 | ogg_int16_t *huff_tables[TH_NHUFFMAN_TABLES]; |
65 | /*The quantization parameters.*/ |
66 | th_quant_info qinfo; |
67 | }; |
68 | |
69 | |
70 | |
71 | /*Decoder specific functions with accelerated variants.*/ |
72 | struct oc_dec_opt_vtable{ |
73 | void (*dc_unpredict_mcu_plane)(oc_dec_ctx *_dec, |
74 | oc_dec_pipeline_state *_pipe,int _pli); |
75 | }; |
76 | |
77 | |
78 | |
79 | struct oc_dec_pipeline_state{ |
80 | /*Decoded DCT coefficients. |
81 | These are placed here instead of on the stack so that they can persist |
82 | between blocks, which makes clearing them back to zero much faster when |
83 | only a few non-zero coefficients were decoded. |
84 | It requires at least 65 elements because the zig-zag index array uses the |
85 | 65th element as a dumping ground for out-of-range indices to protect us |
86 | from buffer overflow. |
87 | We make it fully twice as large so that the second half can serve as the |
88 | reconstruction buffer, which saves passing another parameter to all the |
89 | acceleration functios. |
90 | It also solves problems with 16-byte alignment for NEON on ARM. |
91 | gcc (as of 4.2.1) only seems to be able to give stack variables 8-byte |
92 | alignment, and silently produces incorrect results if you ask for 16. |
93 | Finally, keeping it off the stack means there's less likely to be a data |
94 | hazard beween the NEON co-processor and the regular ARM core, which avoids |
95 | unnecessary stalls.*/ |
96 | OC_ALIGN16(ogg_int16_t dct_coeffs[128]); |
97 | OC_ALIGN16(signed char bounding_values[256]); |
98 | ptrdiff_t ti[3][64]; |
99 | ptrdiff_t ebi[3][64]; |
100 | ptrdiff_t eob_runs[3][64]; |
101 | const ptrdiff_t *coded_fragis[3]; |
102 | const ptrdiff_t *uncoded_fragis[3]; |
103 | ptrdiff_t ncoded_fragis[3]; |
104 | ptrdiff_t nuncoded_fragis[3]; |
105 | const ogg_uint16_t *dequant[3][3][2]; |
106 | int fragy0[3]; |
107 | int fragy_end[3]; |
108 | int pred_last[3][4]; |
109 | int mcu_nvfrags; |
110 | int loop_filter; |
111 | int pp_level; |
112 | }; |
113 | |
114 | |
115 | struct th_dec_ctx{ |
116 | /*Shared encoder/decoder state.*/ |
117 | oc_theora_state state; |
118 | /*Whether or not packets are ready to be emitted. |
119 | This takes on negative values while there are remaining header packets to |
120 | be emitted, reaches 0 when the codec is ready for input, and goes to 1 |
121 | when a frame has been processed and a data packet is ready.*/ |
122 | int packet_state; |
123 | /*Buffer in which to assemble packets.*/ |
124 | oc_pack_buf opb; |
125 | /*Huffman decode trees.*/ |
126 | ogg_int16_t *huff_tables[TH_NHUFFMAN_TABLES]; |
127 | /*The index of the first token in each plane for each coefficient.*/ |
128 | ptrdiff_t ti0[3][64]; |
129 | /*The number of outstanding EOB runs at the start of each coefficient in each |
130 | plane.*/ |
131 | ptrdiff_t eob_runs[3][64]; |
132 | /*The DCT token lists.*/ |
133 | unsigned char *dct_tokens; |
134 | /*The extra bits associated with DCT tokens.*/ |
135 | unsigned char *; |
136 | /*The number of dct tokens unpacked so far.*/ |
137 | int dct_tokens_count; |
138 | /*The out-of-loop post-processing level.*/ |
139 | int pp_level; |
140 | /*The DC scale used for out-of-loop deblocking.*/ |
141 | int pp_dc_scale[64]; |
142 | /*The sharpen modifier used for out-of-loop deringing.*/ |
143 | int pp_sharp_mod[64]; |
144 | /*The DC quantization index of each block.*/ |
145 | unsigned char *dc_qis; |
146 | /*The variance of each block.*/ |
147 | int *variances; |
148 | /*The storage for the post-processed frame buffer.*/ |
149 | unsigned char *pp_frame_data; |
150 | /*Whether or not the post-processsed frame buffer has space for chroma.*/ |
151 | int pp_frame_state; |
152 | /*The buffer used for the post-processed frame. |
153 | Note that this is _not_ guaranteed to have the same strides and offsets as |
154 | the reference frame buffers.*/ |
155 | th_ycbcr_buffer pp_frame_buf; |
156 | /*The striped decode callback function.*/ |
157 | th_stripe_callback stripe_cb; |
158 | oc_dec_pipeline_state pipe; |
159 | # if defined(OC_DEC_USE_VTABLE) |
160 | /*Table for decoder acceleration functions.*/ |
161 | oc_dec_opt_vtable opt_vtable; |
162 | # endif |
163 | # if defined(HAVE_CAIRO) |
164 | /*Output metrics for debugging.*/ |
165 | int telemetry_mbmode; |
166 | int telemetry_mv; |
167 | int telemetry_qi; |
168 | int telemetry_bits; |
169 | int telemetry_frame_bytes; |
170 | int telemetry_coding_bytes; |
171 | int telemetry_mode_bytes; |
172 | int telemetry_mv_bytes; |
173 | int telemetry_qi_bytes; |
174 | int telemetry_dc_bytes; |
175 | unsigned char *telemetry_frame_data; |
176 | # endif |
177 | }; |
178 | |
179 | /*Default pure-C implementations of decoder-specific accelerated functions.*/ |
180 | void oc_dec_accel_init_c(oc_dec_ctx *_dec); |
181 | |
182 | void oc_dec_dc_unpredict_mcu_plane_c(oc_dec_ctx *_dec, |
183 | oc_dec_pipeline_state *_pipe,int _pli); |
184 | |
185 | #endif |
186 | |