| 1 | //============================================================================ |
| 2 | // |
| 3 | // SSSS tt lll lll |
| 4 | // SS SS tt ll ll |
| 5 | // SS tttttt eeee ll ll aaaa |
| 6 | // SSSS tt ee ee ll ll aa |
| 7 | // SS tt eeeeee ll ll aaaaa -- "An Atari 2600 VCS Emulator" |
| 8 | // SS SS tt ee ll ll aa aa |
| 9 | // SSSS ttt eeeee llll llll aaaaa |
| 10 | // |
| 11 | // Copyright (c) 1995-2019 by Bradford W. Mott, Stephen Anthony |
| 12 | // and the Stella Team |
| 13 | // |
| 14 | // See the file "License.txt" for information on usage and redistribution of |
| 15 | // this file, and for a DISCLAIMER OF ALL WARRANTIES. |
| 16 | //============================================================================ |
| 17 | |
| 18 | /* |
| 19 | * Atari TIA NTSC video filter |
| 20 | * Based on nes_ntsc 0.2.2. http://www.slack.net/~ant |
| 21 | * |
| 22 | * Copyright (C) 2006-2009 Shay Green. This module is free software; you |
| 23 | * can redistribute it and/or modify it under the terms of the GNU Lesser |
| 24 | * General Public License as published by the Free Software Foundation; either |
| 25 | * version 2.1 of the License, or (at your option) any later version. This |
| 26 | * module is distributed in the hope that it will be useful, but WITHOUT ANY |
| 27 | * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| 28 | * FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more |
| 29 | * details. You should have received a copy of the GNU Lesser General Public |
| 30 | * License along with this module; if not, write to the Free Software Foundation, |
| 31 | * Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| 32 | */ |
| 33 | |
| 34 | /** |
| 35 | The class is basically a thin wrapper around atari_ntsc_xxx structs |
| 36 | and methods, so that the rest of the codebase isn't affected by |
| 37 | updated versions of Blargg code. |
| 38 | */ |
| 39 | |
| 40 | #ifndef ATARI_NTSC_HXX |
| 41 | #define ATARI_NTSC_HXX |
| 42 | |
| 43 | #include <cmath> |
| 44 | #include <thread> |
| 45 | |
| 46 | #include "bspf.hxx" |
| 47 | |
| 48 | class AtariNTSC |
| 49 | { |
| 50 | public: |
| 51 | static constexpr uInt32 palette_size = 256, entry_size = 2 * 14; |
| 52 | |
| 53 | // By default, threading is turned off |
| 54 | AtariNTSC() { enableThreading(false); } |
| 55 | |
| 56 | // Image parameters, ranging from -1.0 to 1.0. Actual internal values shown |
| 57 | // in parenthesis and should remain fairly stable in future versions. |
| 58 | struct Setup |
| 59 | { |
| 60 | // Basic parameters |
| 61 | float hue; // -1 = -180 degrees +1 = +180 degrees |
| 62 | float saturation; // -1 = grayscale (0.0) +1 = oversaturated colors (2.0) |
| 63 | float contrast; // -1 = dark (0.5) +1 = light (1.5) |
| 64 | float brightness; // -1 = dark (0.5) +1 = light (1.5) |
| 65 | float sharpness; // edge contrast enhancement/blurring |
| 66 | |
| 67 | // Advanced parameters |
| 68 | float gamma; // -1 = dark (1.5) +1 = light (0.5) |
| 69 | float resolution; // image resolution |
| 70 | float artifacts; // artifacts caused by color changes |
| 71 | float fringing; // color artifacts caused by brightness changes |
| 72 | float bleed; // color bleed (color resolution reduction) |
| 73 | }; |
| 74 | |
| 75 | // Video format presets |
| 76 | static const Setup TV_Composite; // color bleeding + artifacts |
| 77 | static const Setup TV_SVideo; // color bleeding only |
| 78 | static const Setup TV_RGB; // crisp image |
| 79 | static const Setup TV_Bad; // badly adjusted TV |
| 80 | |
| 81 | // Initializes and adjusts parameters. |
| 82 | void initialize(const Setup& setup, const uInt8* palette); |
| 83 | void initializePalette(const uInt8* palette); |
| 84 | |
| 85 | // Set up threading |
| 86 | void enableThreading(bool enable); |
| 87 | |
| 88 | // Set phosphor palette, for use in Blargg + phosphor mode |
| 89 | void setPhosphorPalette(uInt8 palette[256][256]) { |
| 90 | memcpy(myPhosphorPalette, palette, 256 * 256); |
| 91 | } |
| 92 | |
| 93 | // Filters one or more rows of pixels. Input pixels are 8-bit Atari |
| 94 | // palette colors. |
| 95 | // In_row_width is the number of pixels to get to the next input row. |
| 96 | // Out_pitch is the number of *bytes* to get to the next output row. |
| 97 | void render(const uInt8* atari_in, const uInt32 in_width, const uInt32 in_height, |
| 98 | void* rgb_out, const uInt32 out_pitch, uInt32* rgb_in = nullptr); |
| 99 | |
| 100 | // Number of input pixels that will fit within given output width. |
| 101 | // Might be rounded down slightly; use outWidth() on result to find |
| 102 | // rounded value. |
| 103 | /*static constexpr uInt32 inWidth( uInt32 out_width ) { |
| 104 | return (((out_width - 8) / PIXEL_out_chunk - 1) * PIXEL_in_chunk + 1); |
| 105 | }*/ |
| 106 | |
| 107 | // Number of output pixels written by blitter for given input width. |
| 108 | // Width might be rounded down slightly; use inWidth() on result to |
| 109 | // find rounded value. Guaranteed not to round 160 down at all. |
| 110 | static constexpr uInt32 outWidth(uInt32 in_width) { |
| 111 | return ((((in_width) - 1) / PIXEL_in_chunk + 1)* PIXEL_out_chunk) + 8; |
| 112 | } |
| 113 | |
| 114 | private: |
| 115 | // Threaded rendering |
| 116 | void renderThread(const uInt8* atari_in, const uInt32 in_width, |
| 117 | const uInt32 in_height, const uInt32 numThreads, const uInt32 threadNum, void* rgb_out, const uInt32 out_pitch); |
| 118 | void renderWithPhosphorThread(const uInt8* atari_in, const uInt32 in_width, |
| 119 | const uInt32 in_height, const uInt32 numThreads, const uInt32 threadNum, uInt32* rgb_in, void* rgb_out, const uInt32 out_pitch); |
| 120 | |
| 121 | /** |
| 122 | Used to calculate an averaged color for the 'phosphor' effect. |
| 123 | |
| 124 | @param c RGB Color 1 (current frame) |
| 125 | @param cp RGB Color 2 (previous frame) |
| 126 | |
| 127 | @return Averaged value of the two RGB colors |
| 128 | */ |
| 129 | uInt32 getRGBPhosphor(const uInt32 c, const uInt32 cp) const; |
| 130 | |
| 131 | private: |
| 132 | static constexpr Int32 |
| 133 | PIXEL_in_chunk = 2, // number of input pixels read per chunk |
| 134 | PIXEL_out_chunk = 7, // number of output pixels generated per chunk |
| 135 | NTSC_black = 0, // palette index for black |
| 136 | |
| 137 | alignment_count = 2, |
| 138 | burst_count = 1, |
| 139 | rescale_in = 8, |
| 140 | rescale_out = 7, |
| 141 | |
| 142 | burst_size = entry_size / burst_count, |
| 143 | kernel_half = 16, |
| 144 | kernel_size = kernel_half * 2 + 1, |
| 145 | gamma_size = 256, |
| 146 | |
| 147 | rgb_builder = ((1 << 21) | (1 << 11) | (1 << 1)), |
| 148 | rgb_kernel_size = burst_size / alignment_count, |
| 149 | rgb_bits = 8, |
| 150 | rgb_unit = (1 << rgb_bits), |
| 151 | rgb_bias = rgb_unit * 2 * rgb_builder, |
| 152 | |
| 153 | std_decoder_hue = 0, |
| 154 | ext_decoder_hue = std_decoder_hue + 15 |
| 155 | ; |
| 156 | |
| 157 | #define artifacts_mid 1.5f |
| 158 | #define artifacts_max 2.5f |
| 159 | #define fringing_mid 1.0f |
| 160 | #define fringing_max 2.0f |
| 161 | #define rgb_offset (rgb_unit * 2 + 0.5f) |
| 162 | |
| 163 | #define LUMA_CUTOFF 0.20f |
| 164 | |
| 165 | uInt32 myColorTable[palette_size][entry_size]; |
| 166 | uInt8 myPhosphorPalette[256][256]; |
| 167 | |
| 168 | // Rendering threads |
| 169 | unique_ptr<std::thread[]> myThreads; |
| 170 | // Number of rendering and total threads |
| 171 | uInt32 myWorkerThreads, myTotalThreads; |
| 172 | |
| 173 | struct init_t |
| 174 | { |
| 175 | float to_rgb [burst_count * 6]; |
| 176 | float to_float [gamma_size]; |
| 177 | float contrast; |
| 178 | float brightness; |
| 179 | float artifacts; |
| 180 | float fringing; |
| 181 | float kernel [rescale_out * kernel_size * 2]; |
| 182 | |
| 183 | init_t() : contrast(0.0), brightness(0.0), artifacts(0.0), fringing(0.0) { |
| 184 | std::fill(to_rgb, to_rgb + burst_count * 6, 0.0); |
| 185 | std::fill(to_float, to_float + gamma_size, 0.0); |
| 186 | std::fill(kernel, kernel + rescale_out * kernel_size * 2, 0.0); |
| 187 | } |
| 188 | }; |
| 189 | init_t myImpl; |
| 190 | |
| 191 | struct pixel_info_t |
| 192 | { |
| 193 | int offset; |
| 194 | float negate; |
| 195 | float kernel [4]; |
| 196 | }; |
| 197 | static const pixel_info_t atari_ntsc_pixels[alignment_count]; |
| 198 | |
| 199 | static const float default_decoder[6]; |
| 200 | |
| 201 | void init(init_t& impl, const Setup& setup); |
| 202 | void initFilters(init_t& impl, const Setup& setup); |
| 203 | // Generate pixel at all burst phases and column alignments |
| 204 | void genKernel(init_t& impl, float y, float i, float q, uInt32* out); |
| 205 | |
| 206 | // Begins outputting row and starts two pixels. First pixel will be cut |
| 207 | // off a bit. Use atari_ntsc_black for unused pixels. |
| 208 | #define ATARI_NTSC_BEGIN_ROW( pixel0, pixel1 ) \ |
| 209 | unsigned const atari_ntsc_pixel0_ = (pixel0);\ |
| 210 | uInt32 const* kernel0 = myColorTable[atari_ntsc_pixel0_];\ |
| 211 | unsigned const atari_ntsc_pixel1_ = (pixel1);\ |
| 212 | uInt32 const* kernel1 = myColorTable[atari_ntsc_pixel1_];\ |
| 213 | uInt32 const* kernelx0;\ |
| 214 | uInt32 const* kernelx1 = kernel0 |
| 215 | |
| 216 | // Begins input pixel |
| 217 | #define ATARI_NTSC_COLOR_IN( index, color ) {\ |
| 218 | unsigned color_;\ |
| 219 | kernelx##index = kernel##index;\ |
| 220 | kernel##index = (color_ = (color), myColorTable[color_]);\ |
| 221 | } |
| 222 | |
| 223 | // Generates output in the specified 32-bit format (x = junk bits). |
| 224 | // native: xxxRRRRR RRRxxGGG GGGGGxxB BBBBBBBx (native internal format) |
| 225 | // 8888: 00000000 RRRRRRRR GGGGGGGG BBBBBBBB (8-8-8-8 32-bit ARGB) |
| 226 | #define ATARI_NTSC_RGB_OUT_8888( index, rgb_out ) {\ |
| 227 | uInt32 raw_ =\ |
| 228 | kernel0 [index ] + kernel1 [(index+10)%7+14] +\ |
| 229 | kernelx0 [(index+7)%14] + kernelx1 [(index+ 3)%7+14+7];\ |
| 230 | ATARI_NTSC_CLAMP_( raw_, 0 );\ |
| 231 | rgb_out = (raw_>>5 & 0x00FF0000)|(raw_>>3 & 0x0000FF00)|(raw_>>1 & 0x000000FF);\ |
| 232 | } |
| 233 | |
| 234 | // Common ntsc macros |
| 235 | #define atari_ntsc_clamp_mask (rgb_builder * 3 / 2) |
| 236 | #define atari_ntsc_clamp_add (rgb_builder * 0x101) |
| 237 | #define ATARI_NTSC_CLAMP_( io, shift ) {\ |
| 238 | uInt32 sub = (io) >> (9-(shift)) & atari_ntsc_clamp_mask;\ |
| 239 | uInt32 clamp = atari_ntsc_clamp_add - sub;\ |
| 240 | io |= clamp;\ |
| 241 | clamp -= sub;\ |
| 242 | io &= clamp;\ |
| 243 | } |
| 244 | |
| 245 | // Kernel generation |
| 246 | #define ROTATE_IQ( i, q, sin_b, cos_b ) {\ |
| 247 | float t;\ |
| 248 | t = i * cos_b - q * sin_b;\ |
| 249 | q = i * sin_b + q * cos_b;\ |
| 250 | i = t;\ |
| 251 | } |
| 252 | #define RGB_TO_YIQ( r, g, b, y, i ) (\ |
| 253 | (y = (r) * 0.299f + (g) * 0.587f + (b) * 0.114f),\ |
| 254 | (i = (r) * 0.595716f - (g) * 0.274453f - (b) * 0.321263f),\ |
| 255 | ((r) * 0.211456f - (g) * 0.522591f + (b) * 0.311135f)\ |
| 256 | ) |
| 257 | #define YIQ_TO_RGB( y, i, q, to_rgb, type, r, g ) (\ |
| 258 | r = type(y + to_rgb [0] * i + to_rgb [1] * q),\ |
| 259 | g = type(y + to_rgb [2] * i + to_rgb [3] * q),\ |
| 260 | type(y + to_rgb [4] * i + to_rgb [5] * q)\ |
| 261 | ) |
| 262 | #ifndef PACK_RGB |
| 263 | #define PACK_RGB( r, g, b ) ((r) << 21 | (g) << 11 | (b) << 1) |
| 264 | #endif |
| 265 | |
| 266 | #define PIXEL_OFFSET_( ntsc, scaled ) \ |
| 267 | (kernel_size / 2 + ntsc + (scaled != 0) + (rescale_out - scaled) % rescale_out + \ |
| 268 | (kernel_size * 2 * scaled)) |
| 269 | |
| 270 | #define PIXEL_OFFSET( ntsc, scaled ) \ |
| 271 | PIXEL_OFFSET_( ((ntsc) - (scaled) / rescale_out * rescale_in),\ |
| 272 | (((scaled) + rescale_out * 10) % rescale_out) ),\ |
| 273 | (1.0f - (((ntsc) + 100) & 2)) |
| 274 | |
| 275 | #define DISTRIBUTE_ERROR( a, b, c ) {\ |
| 276 | uInt32 fourth = (error + 2 * rgb_builder) >> 2;\ |
| 277 | fourth &= (rgb_bias >> 1) - rgb_builder;\ |
| 278 | fourth -= rgb_bias >> 2;\ |
| 279 | out [a] += fourth;\ |
| 280 | out [b] += fourth;\ |
| 281 | out [c] += fourth;\ |
| 282 | out [i] += error - (fourth * 3);\ |
| 283 | } |
| 284 | |
| 285 | #define RGB_PALETTE_OUT( rgb, out_ )\ |
| 286 | {\ |
| 287 | unsigned char* out = (out_);\ |
| 288 | uInt32 clamped = (rgb);\ |
| 289 | ATARI_NTSC_CLAMP_( clamped, (8 - rgb_bits) );\ |
| 290 | out [0] = (unsigned char) (clamped >> 21);\ |
| 291 | out [1] = (unsigned char) (clamped >> 11);\ |
| 292 | out [2] = (unsigned char) (clamped >> 1);\ |
| 293 | } |
| 294 | }; |
| 295 | |
| 296 | #endif |
| 297 | |