| // Copyright 2012 Google Inc. All Rights Reserved. |
| // |
| // This code is licensed under the same terms as WebM: |
| // Software License Agreement: http://www.webmproject.org/license/software/ |
| // Additional IP Rights Grant: http://www.webmproject.org/license/additional/ |
| // ----------------------------------------------------------------------------- |
| // |
| // Image transforms and color space conversion methods for lossless decoder. |
| // |
| // Authors: Vikas Arora (vikaas.arora@gmail.com) |
| // Jyrki Alakuijala (jyrki@google.com) |
| // Urvang Joshi (urvang@google.com) |
| |
| #if defined(__cplusplus) || defined(c_plusplus) |
| extern "C" { |
| #endif |
| |
| #include <math.h> |
| #include <stdlib.h> |
| #include "./lossless.h" |
| #include "../dec/vp8li.h" |
| #include "../dsp/yuv.h" |
| #include "../dsp/dsp.h" |
| #include "../enc/histogram.h" |
| |
| // A lookup table for small values of log(int) to be used in entropy |
| // computation. |
| // |
| // ", ".join(["%.16ff" % x for x in [0.0]+[log(x) for x in range(1, 256)]]) |
| #define LOG_LOOKUP_IDX_MAX 256 |
| static const float kLogTable[LOG_LOOKUP_IDX_MAX] = { |
| 0.0000000000000000f, 0.0000000000000000f, 0.6931471805599453f, |
| 1.0986122886681098f, 1.3862943611198906f, 1.6094379124341003f, |
| 1.7917594692280550f, 1.9459101490553132f, 2.0794415416798357f, |
| 2.1972245773362196f, 2.3025850929940459f, 2.3978952727983707f, |
| 2.4849066497880004f, 2.5649493574615367f, 2.6390573296152584f, |
| 2.7080502011022101f, 2.7725887222397811f, 2.8332133440562162f, |
| 2.8903717578961645f, 2.9444389791664403f, 2.9957322735539909f, |
| 3.0445224377234230f, 3.0910424533583161f, 3.1354942159291497f, |
| 3.1780538303479458f, 3.2188758248682006f, 3.2580965380214821f, |
| 3.2958368660043291f, 3.3322045101752038f, 3.3672958299864741f, |
| 3.4011973816621555f, 3.4339872044851463f, 3.4657359027997265f, |
| 3.4965075614664802f, 3.5263605246161616f, 3.5553480614894135f, |
| 3.5835189384561099f, 3.6109179126442243f, 3.6375861597263857f, |
| 3.6635616461296463f, 3.6888794541139363f, 3.7135720667043080f, |
| 3.7376696182833684f, 3.7612001156935624f, 3.7841896339182610f, |
| 3.8066624897703196f, 3.8286413964890951f, 3.8501476017100584f, |
| 3.8712010109078911f, 3.8918202981106265f, 3.9120230054281460f, |
| 3.9318256327243257f, 3.9512437185814275f, 3.9702919135521220f, |
| 3.9889840465642745f, 4.0073331852324712f, 4.0253516907351496f, |
| 4.0430512678345503f, 4.0604430105464191f, 4.0775374439057197f, |
| 4.0943445622221004f, 4.1108738641733114f, 4.1271343850450917f, |
| 4.1431347263915326f, 4.1588830833596715f, 4.1743872698956368f, |
| 4.1896547420264252f, 4.2046926193909657f, 4.2195077051761070f, |
| 4.2341065045972597f, 4.2484952420493594f, 4.2626798770413155f, |
| 4.2766661190160553f, 4.2904594411483910f, 4.3040650932041702f, |
| 4.3174881135363101f, 4.3307333402863311f, 4.3438054218536841f, |
| 4.3567088266895917f, 4.3694478524670215f, 4.3820266346738812f, |
| 4.3944491546724391f, 4.4067192472642533f, 4.4188406077965983f, |
| 4.4308167988433134f, 4.4426512564903167f, 4.4543472962535073f, |
| 4.4659081186545837f, 4.4773368144782069f, 4.4886363697321396f, |
| 4.4998096703302650f, 4.5108595065168497f, 4.5217885770490405f, |
| 4.5325994931532563f, 4.5432947822700038f, 4.5538768916005408f, |
| 4.5643481914678361f, 4.5747109785033828f, 4.5849674786705723f, |
| 4.5951198501345898f, 4.6051701859880918f, 4.6151205168412597f, |
| 4.6249728132842707f, 4.6347289882296359f, 4.6443908991413725f, |
| 4.6539603501575231f, 4.6634390941120669f, 4.6728288344619058f, |
| 4.6821312271242199f, 4.6913478822291435f, 4.7004803657924166f, |
| 4.7095302013123339f, 4.7184988712950942f, 4.7273878187123408f, |
| 4.7361984483944957f, 4.7449321283632502f, 4.7535901911063645f, |
| 4.7621739347977563f, 4.7706846244656651f, 4.7791234931115296f, |
| 4.7874917427820458f, 4.7957905455967413f, 4.8040210447332568f, |
| 4.8121843553724171f, 4.8202815656050371f, 4.8283137373023015f, |
| 4.8362819069514780f, 4.8441870864585912f, 4.8520302639196169f, |
| 4.8598124043616719f, 4.8675344504555822f, 4.8751973232011512f, |
| 4.8828019225863706f, 4.8903491282217537f, 4.8978397999509111f, |
| 4.9052747784384296f, 4.9126548857360524f, 4.9199809258281251f, |
| 4.9272536851572051f, 4.9344739331306915f, 4.9416424226093039f, |
| 4.9487598903781684f, 4.9558270576012609f, 4.9628446302599070f, |
| 4.9698132995760007f, 4.9767337424205742f, 4.9836066217083363f, |
| 4.9904325867787360f, 4.9972122737641147f, 5.0039463059454592f, |
| 5.0106352940962555f, 5.0172798368149243f, 5.0238805208462765f, |
| 5.0304379213924353f, 5.0369526024136295f, 5.0434251169192468f, |
| 5.0498560072495371f, 5.0562458053483077f, 5.0625950330269669f, |
| 5.0689042022202315f, 5.0751738152338266f, 5.0814043649844631f, |
| 5.0875963352323836f, 5.0937502008067623f, 5.0998664278241987f, |
| 5.1059454739005803f, 5.1119877883565437f, 5.1179938124167554f, |
| 5.1239639794032588f, 5.1298987149230735f, 5.1357984370502621f, |
| 5.1416635565026603f, 5.1474944768134527f, 5.1532915944977793f, |
| 5.1590552992145291f, 5.1647859739235145f, 5.1704839950381514f, |
| 5.1761497325738288f, 5.1817835502920850f, 5.1873858058407549f, |
| 5.1929568508902104f, 5.1984970312658261f, 5.2040066870767951f, |
| 5.2094861528414214f, 5.2149357576089859f, 5.2203558250783244f, |
| 5.2257466737132017f, 5.2311086168545868f, 5.2364419628299492f, |
| 5.2417470150596426f, 5.2470240721604862f, 5.2522734280466299f, |
| 5.2574953720277815f, 5.2626901889048856f, 5.2678581590633282f, |
| 5.2729995585637468f, 5.2781146592305168f, 5.2832037287379885f, |
| 5.2882670306945352f, 5.2933048247244923f, 5.2983173665480363f, |
| 5.3033049080590757f, 5.3082676974012051f, 5.3132059790417872f, |
| 5.3181199938442161f, 5.3230099791384085f, 5.3278761687895813f, |
| 5.3327187932653688f, 5.3375380797013179f, 5.3423342519648109f, |
| 5.3471075307174685f, 5.3518581334760666f, 5.3565862746720123f, |
| 5.3612921657094255f, 5.3659760150218512f, 5.3706380281276624f, |
| 5.3752784076841653f, 5.3798973535404597f, 5.3844950627890888f, |
| 5.3890717298165010f, 5.3936275463523620f, 5.3981627015177525f, |
| 5.4026773818722793f, 5.4071717714601188f, 5.4116460518550396f, |
| 5.4161004022044201f, 5.4205349992722862f, 5.4249500174814029f, |
| 5.4293456289544411f, 5.4337220035542400f, 5.4380793089231956f, |
| 5.4424177105217932f, 5.4467373716663099f, 5.4510384535657002f, |
| 5.4553211153577017f, 5.4595855141441589f, 5.4638318050256105f, |
| 5.4680601411351315f, 5.4722706736714750f, 5.4764635519315110f, |
| 5.4806389233419912f, 5.4847969334906548f, 5.4889377261566867f, |
| 5.4930614433405482f, 5.4971682252932021f, 5.5012582105447274f, |
| 5.5053315359323625f, 5.5093883366279774f, 5.5134287461649825f, |
| 5.5174528964647074f, 5.5214609178622460f, 5.5254529391317835f, |
| 5.5294290875114234f, 5.5333894887275203f, 5.5373342670185366f, |
| 5.5412635451584258f |
| }; |
| |
| #define APPROX_LOG_MAX 4096 |
| #define LOG_2_BASE_E 0.6931471805599453f |
| |
| float VP8LFastLog(int v) { |
| if (v < APPROX_LOG_MAX) { |
| int log_cnt = 0; |
| while (v >= LOG_LOOKUP_IDX_MAX) { |
| ++log_cnt; |
| v = v >> 1; |
| } |
| return kLogTable[v] + (log_cnt * LOG_2_BASE_E); |
| } |
| return (float)log(v); |
| } |
| |
| //------------------------------------------------------------------------------ |
| // Image transforms. |
| |
| // In-place sum of each component with mod 256. |
| static WEBP_INLINE void AddPixelsEq(uint32_t* a, uint32_t b) { |
| const uint32_t alpha_and_green = (*a & 0xff00ff00u) + (b & 0xff00ff00u); |
| const uint32_t red_and_blue = (*a & 0x00ff00ffu) + (b & 0x00ff00ffu); |
| *a = (alpha_and_green & 0xff00ff00u) | (red_and_blue & 0x00ff00ffu); |
| } |
| |
| static WEBP_INLINE uint32_t Average2(uint32_t a0, uint32_t a1) { |
| return (((a0 ^ a1) & 0xfefefefeL) >> 1) + (a0 & a1); |
| } |
| |
| static WEBP_INLINE uint32_t Average3(uint32_t a0, uint32_t a1, uint32_t a2) { |
| return Average2(Average2(a0, a2), a1); |
| } |
| |
| static WEBP_INLINE uint32_t Average4(uint32_t a0, uint32_t a1, |
| uint32_t a2, uint32_t a3) { |
| return Average2(Average2(a0, a1), Average2(a2, a3)); |
| } |
| |
| static WEBP_INLINE uint32_t Clip255(uint32_t a) { |
| if (a < 256) { |
| return a; |
| } |
| // return 0, when a is a negative integer. |
| // return 255, when a is positive. |
| return ~a >> 24; |
| } |
| |
| static WEBP_INLINE int AddSubtractComponentFull(int a, int b, int c) { |
| return Clip255(a + b - c); |
| } |
| |
| static WEBP_INLINE uint32_t ClampedAddSubtractFull(uint32_t c0, uint32_t c1, |
| uint32_t c2) { |
| const int a = AddSubtractComponentFull(c0 >> 24, c1 >> 24, c2 >> 24); |
| const int r = AddSubtractComponentFull((c0 >> 16) & 0xff, |
| (c1 >> 16) & 0xff, |
| (c2 >> 16) & 0xff); |
| const int g = AddSubtractComponentFull((c0 >> 8) & 0xff, |
| (c1 >> 8) & 0xff, |
| (c2 >> 8) & 0xff); |
| const int b = AddSubtractComponentFull(c0 & 0xff, c1 & 0xff, c2 & 0xff); |
| return (a << 24) | (r << 16) | (g << 8) | b; |
| } |
| |
| static WEBP_INLINE int AddSubtractComponentHalf(int a, int b) { |
| return Clip255(a + (a - b) / 2); |
| } |
| |
| static WEBP_INLINE uint32_t ClampedAddSubtractHalf(uint32_t c0, uint32_t c1, |
| uint32_t c2) { |
| const uint32_t ave = Average2(c0, c1); |
| const int a = AddSubtractComponentHalf(ave >> 24, c2 >> 24); |
| const int r = AddSubtractComponentHalf((ave >> 16) & 0xff, (c2 >> 16) & 0xff); |
| const int g = AddSubtractComponentHalf((ave >> 8) & 0xff, (c2 >> 8) & 0xff); |
| const int b = AddSubtractComponentHalf((ave >> 0) & 0xff, (c2 >> 0) & 0xff); |
| return (a << 24) | (r << 16) | (g << 8) | b; |
| } |
| |
| static WEBP_INLINE int Sub3(int a, int b, int c) { |
| const int pa = b - c; |
| const int pb = a - c; |
| return abs(pa) - abs(pb); |
| } |
| |
| static WEBP_INLINE uint32_t Select(uint32_t a, uint32_t b, uint32_t c) { |
| const int pa_minus_pb = |
| Sub3((a >> 24) , (b >> 24) , (c >> 24) ) + |
| Sub3((a >> 16) & 0xff, (b >> 16) & 0xff, (c >> 16) & 0xff) + |
| Sub3((a >> 8) & 0xff, (b >> 8) & 0xff, (c >> 8) & 0xff) + |
| Sub3((a ) & 0xff, (b ) & 0xff, (c ) & 0xff); |
| |
| return (pa_minus_pb <= 0) ? a : b; |
| } |
| |
| //------------------------------------------------------------------------------ |
| // Predictors |
| |
| static uint32_t Predictor0(uint32_t left, const uint32_t* const top) { |
| (void)top; |
| (void)left; |
| return ARGB_BLACK; |
| } |
| static uint32_t Predictor1(uint32_t left, const uint32_t* const top) { |
| (void)top; |
| return left; |
| } |
| static uint32_t Predictor2(uint32_t left, const uint32_t* const top) { |
| (void)left; |
| return top[0]; |
| } |
| static uint32_t Predictor3(uint32_t left, const uint32_t* const top) { |
| (void)left; |
| return top[1]; |
| } |
| static uint32_t Predictor4(uint32_t left, const uint32_t* const top) { |
| (void)left; |
| return top[-1]; |
| } |
| static uint32_t Predictor5(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = Average3(left, top[0], top[1]); |
| return pred; |
| } |
| static uint32_t Predictor6(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = Average2(left, top[-1]); |
| return pred; |
| } |
| static uint32_t Predictor7(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = Average2(left, top[0]); |
| return pred; |
| } |
| static uint32_t Predictor8(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = Average2(top[-1], top[0]); |
| (void)left; |
| return pred; |
| } |
| static uint32_t Predictor9(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = Average2(top[0], top[1]); |
| (void)left; |
| return pred; |
| } |
| static uint32_t Predictor10(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = Average4(left, top[-1], top[0], top[1]); |
| return pred; |
| } |
| static uint32_t Predictor11(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = Select(top[0], left, top[-1]); |
| return pred; |
| } |
| static uint32_t Predictor12(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = ClampedAddSubtractFull(left, top[0], top[-1]); |
| return pred; |
| } |
| static uint32_t Predictor13(uint32_t left, const uint32_t* const top) { |
| const uint32_t pred = ClampedAddSubtractHalf(left, top[0], top[-1]); |
| return pred; |
| } |
| |
| typedef uint32_t (*PredictorFunc)(uint32_t left, const uint32_t* const top); |
| static const PredictorFunc kPredictors[16] = { |
| Predictor0, Predictor1, Predictor2, Predictor3, |
| Predictor4, Predictor5, Predictor6, Predictor7, |
| Predictor8, Predictor9, Predictor10, Predictor11, |
| Predictor12, Predictor13, |
| Predictor0, Predictor0 // <- padding security sentinels |
| }; |
| |
| // TODO(vikasa): Replace 256 etc with defines. |
| static double PredictionCostSpatial(const int* counts, |
| int weight_0, double exp_val) { |
| const int significant_symbols = 16; |
| const double exp_decay_factor = 0.6; |
| double bits = weight_0 * counts[0]; |
| int i; |
| for (i = 1; i < significant_symbols; ++i) { |
| bits += exp_val * (counts[i] + counts[256 - i]); |
| exp_val *= exp_decay_factor; |
| } |
| return -0.1 * bits; |
| } |
| |
| // Compute the Shanon's entropy: Sum(p*log2(p)) |
| static double ShannonEntropy(const int* const array, int n) { |
| int i; |
| double retval = 0; |
| int sum = 0; |
| for (i = 0; i < n; ++i) { |
| if (array[i] != 0) { |
| sum += array[i]; |
| retval += array[i] * VP8LFastLog(array[i]); |
| } |
| } |
| retval -= sum * VP8LFastLog(sum); |
| retval *= -1.4426950408889634; // 1.0 / -FastLog(2); |
| return retval; |
| } |
| |
| static double PredictionCostSpatialHistogram(int accumulated[4][256], |
| int tile[4][256]) { |
| int i; |
| int k; |
| int combo[256]; |
| double retval = 0; |
| for (i = 0; i < 4; ++i) { |
| const double exp_val = 0.94; |
| retval += PredictionCostSpatial(&tile[i][0], 1, exp_val); |
| retval += ShannonEntropy(&tile[i][0], 256); |
| for (k = 0; k < 256; ++k) { |
| combo[k] = accumulated[i][k] + tile[i][k]; |
| } |
| retval += ShannonEntropy(&combo[0], 256); |
| } |
| return retval; |
| } |
| |
| static int GetBestPredictorForTile(int width, int height, |
| int tile_x, int tile_y, int bits, |
| int accumulated[4][256], |
| const uint32_t* const argb_scratch) { |
| const int kNumPredModes = 14; |
| const int col_start = tile_x << bits; |
| const int row_start = tile_y << bits; |
| const int tile_size = 1 << bits; |
| const int ymax = (tile_size <= height - row_start) ? |
| tile_size : height - row_start; |
| const int xmax = (tile_size <= width - col_start) ? |
| tile_size : width - col_start; |
| int histo[4][256]; |
| double best_diff = 1e99; |
| int best_mode = 0; |
| |
| int mode; |
| for (mode = 0; mode < kNumPredModes; ++mode) { |
| const uint32_t* current_row = argb_scratch; |
| const PredictorFunc pred_func = kPredictors[mode]; |
| double cur_diff; |
| int y; |
| memset(&histo[0][0], 0, sizeof(histo)); |
| for (y = 0; y < ymax; ++y) { |
| int x; |
| const int row = row_start + y; |
| const uint32_t* const upper_row = current_row; |
| current_row = upper_row + width; |
| for (x = 0; x < xmax; ++x) { |
| const int col = col_start + x; |
| uint32_t predict; |
| uint32_t predict_diff; |
| if (row == 0) { |
| predict = (col == 0) ? ARGB_BLACK : current_row[col - 1]; // Left. |
| } else if (col == 0) { |
| predict = upper_row[col]; // Top. |
| } else { |
| predict = pred_func(current_row[col - 1], upper_row + col); |
| } |
| predict_diff = VP8LSubPixels(current_row[col], predict); |
| ++histo[0][predict_diff >> 24]; |
| ++histo[1][((predict_diff >> 16) & 0xff)]; |
| ++histo[2][((predict_diff >> 8) & 0xff)]; |
| ++histo[3][(predict_diff & 0xff)]; |
| } |
| } |
| cur_diff = PredictionCostSpatialHistogram(accumulated, histo); |
| if (cur_diff < best_diff) { |
| best_diff = cur_diff; |
| best_mode = mode; |
| } |
| } |
| |
| return best_mode; |
| } |
| |
| static void CopyTileWithPrediction(int width, int height, |
| int tile_x, int tile_y, int bits, int mode, |
| const uint32_t* const argb_scratch, |
| uint32_t* const argb) { |
| const int col_start = tile_x << bits; |
| const int row_start = tile_y << bits; |
| const int tile_size = 1 << bits; |
| const int ymax = (tile_size <= height - row_start) ? |
| tile_size : height - row_start; |
| const int xmax = (tile_size <= width - col_start) ? |
| tile_size : width - col_start; |
| const PredictorFunc pred_func = kPredictors[mode]; |
| const uint32_t* current_row = argb_scratch; |
| |
| int y; |
| for (y = 0; y < ymax; ++y) { |
| int x; |
| const int row = row_start + y; |
| const uint32_t* const upper_row = current_row; |
| current_row = upper_row + width; |
| for (x = 0; x < xmax; ++x) { |
| const int col = col_start + x; |
| const int pix = row * width + col; |
| uint32_t predict; |
| if (row == 0) { |
| predict = (col == 0) ? ARGB_BLACK : current_row[col - 1]; // Left. |
| } else if (col == 0) { |
| predict = upper_row[col]; // Top. |
| } else { |
| predict = pred_func(current_row[col - 1], upper_row + col); |
| } |
| argb[pix] = VP8LSubPixels(current_row[col], predict); |
| } |
| } |
| } |
| |
| void VP8LResidualImage(int width, int height, int bits, |
| uint32_t* const argb, uint32_t* const argb_scratch, |
| uint32_t* const image) { |
| const int max_tile_size = 1 << bits; |
| const int tiles_per_row = VP8LSubSampleSize(width, bits); |
| const int tiles_per_col = VP8LSubSampleSize(height, bits); |
| uint32_t* const upper_row = argb_scratch; |
| uint32_t* const current_tile_rows = argb_scratch + width; |
| int tile_y; |
| int histo[4][256]; |
| memset(histo, 0, sizeof(histo)); |
| for (tile_y = 0; tile_y < tiles_per_col; ++tile_y) { |
| const int tile_y_offset = tile_y * max_tile_size; |
| const int this_tile_height = |
| (tile_y < tiles_per_col - 1) ? max_tile_size : height - tile_y_offset; |
| int tile_x; |
| if (tile_y > 0) { |
| memcpy(upper_row, current_tile_rows + (max_tile_size - 1) * width, |
| width * sizeof(*upper_row)); |
| } |
| memcpy(current_tile_rows, &argb[tile_y_offset * width], |
| this_tile_height * width * sizeof(*current_tile_rows)); |
| for (tile_x = 0; tile_x < tiles_per_row; ++tile_x) { |
| int pred; |
| int y; |
| const int tile_x_offset = tile_x * max_tile_size; |
| int all_x_max = tile_x_offset + max_tile_size; |
| if (all_x_max > width) { |
| all_x_max = width; |
| } |
| pred = GetBestPredictorForTile(width, height, tile_x, tile_y, bits, histo, |
| argb_scratch); |
| image[tile_y * tiles_per_row + tile_x] = 0xff000000u | (pred << 8); |
| CopyTileWithPrediction(width, height, tile_x, tile_y, bits, pred, |
| argb_scratch, argb); |
| for (y = 0; y < max_tile_size; ++y) { |
| int ix; |
| int all_x; |
| int all_y = tile_y_offset + y; |
| if (all_y >= height) { |
| break; |
| } |
| ix = all_y * width + tile_x_offset; |
| for (all_x = tile_x_offset; all_x < all_x_max; ++all_x, ++ix) { |
| const uint32_t a = argb[ix]; |
| ++histo[0][a >> 24]; |
| ++histo[1][((a >> 16) & 0xff)]; |
| ++histo[2][((a >> 8) & 0xff)]; |
| ++histo[3][(a & 0xff)]; |
| } |
| } |
| } |
| } |
| } |
| |
| // Inverse prediction. |
| static void PredictorInverseTransform(const VP8LTransform* const transform, |
| int y_start, int y_end, uint32_t* data) { |
| const int width = transform->xsize_; |
| if (y_start == 0) { // First Row follows the L (mode=1) mode. |
| int x; |
| const uint32_t pred0 = Predictor0(data[-1], NULL); |
| AddPixelsEq(data, pred0); |
| for (x = 1; x < width; ++x) { |
| const uint32_t pred1 = Predictor1(data[x - 1], NULL); |
| AddPixelsEq(data + x, pred1); |
| } |
| data += width; |
| ++y_start; |
| } |
| |
| { |
| int y = y_start; |
| const int mask = (1 << transform->bits_) - 1; |
| const int tiles_per_row = VP8LSubSampleSize(width, transform->bits_); |
| const uint32_t* pred_mode_base = |
| transform->data_ + (y >> transform->bits_) * tiles_per_row; |
| |
| while (y < y_end) { |
| int x; |
| const uint32_t pred2 = Predictor2(data[-1], data - width); |
| const uint32_t* pred_mode_src = pred_mode_base; |
| PredictorFunc pred_func; |
| |
| // First pixel follows the T (mode=2) mode. |
| AddPixelsEq(data, pred2); |
| |
| // .. the rest: |
| pred_func = kPredictors[((*pred_mode_src++) >> 8) & 0xf]; |
| for (x = 1; x < width; ++x) { |
| uint32_t pred; |
| if ((x & mask) == 0) { // start of tile. Read predictor function. |
| pred_func = kPredictors[((*pred_mode_src++) >> 8) & 0xf]; |
| } |
| pred = pred_func(data[x - 1], data + x - width); |
| AddPixelsEq(data + x, pred); |
| } |
| data += width; |
| ++y; |
| if ((y & mask) == 0) { // Use the same mask, since tiles are squares. |
| pred_mode_base += tiles_per_row; |
| } |
| } |
| } |
| } |
| |
| void VP8LSubtractGreenFromBlueAndRed(uint32_t* argb_data, int num_pixs) { |
| int i; |
| for (i = 0; i < num_pixs; ++i) { |
| const uint32_t argb = argb_data[i]; |
| const uint32_t green = (argb >> 8) & 0xff; |
| const uint32_t new_r = (((argb >> 16) & 0xff) - green) & 0xff; |
| const uint32_t new_b = ((argb & 0xff) - green) & 0xff; |
| argb_data[i] = (argb & 0xff00ff00) | (new_r << 16) | new_b; |
| } |
| } |
| |
| // Add green to blue and red channels (i.e. perform the inverse transform of |
| // 'subtract green'). |
| static void AddGreenToBlueAndRed(const VP8LTransform* const transform, |
| int y_start, int y_end, uint32_t* data) { |
| const int width = transform->xsize_; |
| const uint32_t* const data_end = data + (y_end - y_start) * width; |
| while (data < data_end) { |
| const uint32_t argb = *data; |
| // "* 0001001u" is equivalent to "(green << 16) + green)" |
| const uint32_t green = ((argb >> 8) & 0xff); |
| uint32_t red_blue = (argb & 0x00ff00ffu); |
| red_blue += (green << 16) | green; |
| red_blue &= 0x00ff00ffu; |
| *data++ = (argb & 0xff00ff00u) | red_blue; |
| } |
| } |
| |
| typedef struct { |
| // Note: the members are uint8_t, so that any negative values are |
| // automatically converted to "mod 256" values. |
| uint8_t green_to_red_; |
| uint8_t green_to_blue_; |
| uint8_t red_to_blue_; |
| } Multipliers; |
| |
| static WEBP_INLINE void MultipliersClear(Multipliers* m) { |
| m->green_to_red_ = 0; |
| m->green_to_blue_ = 0; |
| m->red_to_blue_ = 0; |
| } |
| |
| static WEBP_INLINE uint32_t ColorTransformDelta(int8_t color_pred, |
| int8_t color) { |
| return (uint32_t)((int)(color_pred) * color) >> 5; |
| } |
| |
| static WEBP_INLINE void ColorCodeToMultipliers(uint32_t color_code, |
| Multipliers* const m) { |
| m->green_to_red_ = (color_code >> 0) & 0xff; |
| m->green_to_blue_ = (color_code >> 8) & 0xff; |
| m->red_to_blue_ = (color_code >> 16) & 0xff; |
| } |
| |
| static WEBP_INLINE uint32_t MultipliersToColorCode(Multipliers* const m) { |
| return 0xff000000u | |
| ((uint32_t)(m->red_to_blue_) << 16) | |
| ((uint32_t)(m->green_to_blue_) << 8) | |
| m->green_to_red_; |
| } |
| |
| static WEBP_INLINE uint32_t TransformColor(const Multipliers* const m, |
| uint32_t argb, int inverse) { |
| const uint32_t green = argb >> 8; |
| const uint32_t red = argb >> 16; |
| uint32_t new_red = red; |
| uint32_t new_blue = argb; |
| |
| if (inverse) { |
| new_red += ColorTransformDelta(m->green_to_red_, green); |
| new_red &= 0xff; |
| new_blue += ColorTransformDelta(m->green_to_blue_, green); |
| new_blue += ColorTransformDelta(m->red_to_blue_, new_red); |
| new_blue &= 0xff; |
| } else { |
| new_red -= ColorTransformDelta(m->green_to_red_, green); |
| new_red &= 0xff; |
| new_blue -= ColorTransformDelta(m->green_to_blue_, green); |
| new_blue -= ColorTransformDelta(m->red_to_blue_, red); |
| new_blue &= 0xff; |
| } |
| return (argb & 0xff00ff00u) | (new_red << 16) | (new_blue); |
| } |
| |
| static WEBP_INLINE int SkipRepeatedPixels(const uint32_t* const argb, |
| int ix, int xsize) { |
| const uint32_t v = argb[ix]; |
| if (ix >= xsize + 3) { |
| if (v == argb[ix - xsize] && |
| argb[ix - 1] == argb[ix - xsize - 1] && |
| argb[ix - 2] == argb[ix - xsize - 2] && |
| argb[ix - 3] == argb[ix - xsize - 3]) { |
| return 1; |
| } |
| return v == argb[ix - 3] && v == argb[ix - 2] && v == argb[ix - 1]; |
| } else if (ix >= 3) { |
| return v == argb[ix - 3] && v == argb[ix - 2] && v == argb[ix - 1]; |
| } |
| return 0; |
| } |
| |
| static double PredictionCostCrossColor(const int accumulated[256], |
| const int counts[256]) { |
| // Favor low entropy, locally and globally. |
| int i; |
| int combo[256]; |
| for (i = 0; i < 256; ++i) { |
| combo[i] = accumulated[i] + counts[i]; |
| } |
| return ShannonEntropy(combo, 256) + |
| ShannonEntropy(counts, 256) + |
| PredictionCostSpatial(counts, 3, 2.4); // Favor small absolute values. |
| } |
| |
| static Multipliers GetBestColorTransformForTile( |
| int tile_x, int tile_y, int bits, |
| Multipliers prevX, |
| Multipliers prevY, |
| int step, int xsize, int ysize, |
| int* accumulated_red_histo, |
| int* accumulated_blue_histo, |
| const uint32_t* const argb) { |
| double best_diff = 1e99; |
| double cur_diff; |
| const int halfstep = step / 2; |
| const int max_tile_size = 1 << bits; |
| const int tile_y_offset = tile_y * max_tile_size; |
| const int tile_x_offset = tile_x * max_tile_size; |
| int green_to_red; |
| int green_to_blue; |
| int red_to_blue; |
| int all_x_max = tile_x_offset + max_tile_size; |
| int all_y_max = tile_y_offset + max_tile_size; |
| Multipliers best_tx; |
| MultipliersClear(&best_tx); |
| if (all_x_max > xsize) { |
| all_x_max = xsize; |
| } |
| if (all_y_max > ysize) { |
| all_y_max = ysize; |
| } |
| for (green_to_red = -64; green_to_red <= 64; green_to_red += halfstep) { |
| int histo[256] = { 0 }; |
| int all_y; |
| Multipliers tx; |
| MultipliersClear(&tx); |
| tx.green_to_red_ = green_to_red & 0xff; |
| |
| for (all_y = tile_y_offset; all_y < all_y_max; ++all_y) { |
| uint32_t predict; |
| int ix = all_y * xsize + tile_x_offset; |
| int all_x; |
| for (all_x = tile_x_offset; all_x < all_x_max; ++all_x, ++ix) { |
| if (SkipRepeatedPixels(argb, ix, xsize)) { |
| continue; |
| } |
| predict = TransformColor(&tx, argb[ix], 0); |
| ++histo[(predict >> 16) & 0xff]; // red. |
| } |
| } |
| cur_diff = PredictionCostCrossColor(&accumulated_red_histo[0], &histo[0]); |
| if (tx.green_to_red_ == prevX.green_to_red_) { |
| cur_diff -= 3; // favor keeping the areas locally similar |
| } |
| if (tx.green_to_red_ == prevY.green_to_red_) { |
| cur_diff -= 3; // favor keeping the areas locally similar |
| } |
| if (tx.green_to_red_ == 0) { |
| cur_diff -= 3; |
| } |
| if (cur_diff < best_diff) { |
| best_diff = cur_diff; |
| best_tx = tx; |
| } |
| } |
| best_diff = 1e99; |
| green_to_red = best_tx.green_to_red_; |
| for (green_to_blue = -32; green_to_blue <= 32; green_to_blue += step) { |
| for (red_to_blue = -32; red_to_blue <= 32; red_to_blue += step) { |
| int all_y; |
| int histo[256] = { 0 }; |
| Multipliers tx; |
| tx.green_to_red_ = green_to_red; |
| tx.green_to_blue_ = green_to_blue; |
| tx.red_to_blue_ = red_to_blue; |
| for (all_y = tile_y_offset; all_y < all_y_max; ++all_y) { |
| uint32_t predict; |
| int all_x; |
| int ix = all_y * xsize + tile_x_offset; |
| for (all_x = tile_x_offset; all_x < all_x_max; ++all_x, ++ix) { |
| if (SkipRepeatedPixels(argb, ix, xsize)) { |
| continue; |
| } |
| predict = TransformColor(&tx, argb[ix], 0); |
| ++histo[predict & 0xff]; // blue. |
| } |
| } |
| cur_diff = |
| PredictionCostCrossColor(&accumulated_blue_histo[0], &histo[0]); |
| if (tx.green_to_blue_ == prevX.green_to_blue_) { |
| cur_diff -= 3; // favor keeping the areas locally similar |
| } |
| if (tx.green_to_blue_ == prevY.green_to_blue_) { |
| cur_diff -= 3; // favor keeping the areas locally similar |
| } |
| if (tx.red_to_blue_ == prevX.red_to_blue_) { |
| cur_diff -= 3; // favor keeping the areas locally similar |
| } |
| if (tx.red_to_blue_ == prevY.red_to_blue_) { |
| cur_diff -= 3; // favor keeping the areas locally similar |
| } |
| if (tx.green_to_blue_ == 0) { |
| cur_diff -= 3; |
| } |
| if (tx.red_to_blue_ == 0) { |
| cur_diff -= 3; |
| } |
| if (cur_diff < best_diff) { |
| best_diff = cur_diff; |
| best_tx = tx; |
| } |
| } |
| } |
| return best_tx; |
| } |
| |
| static void CopyTileWithColorTransform(int xsize, int ysize, |
| int tile_x, int tile_y, int bits, |
| Multipliers color_transform, |
| uint32_t* const argb) { |
| int y; |
| int xscan = 1 << bits; |
| int yscan = 1 << bits; |
| tile_x <<= bits; |
| tile_y <<= bits; |
| if (xscan > xsize - tile_x) { |
| xscan = xsize - tile_x; |
| } |
| if (yscan > ysize - tile_y) { |
| yscan = ysize - tile_y; |
| } |
| yscan += tile_y; |
| for (y = tile_y; y < yscan; ++y) { |
| int ix = y * xsize + tile_x; |
| const int end_ix = ix + xscan; |
| for (; ix < end_ix; ++ix) { |
| argb[ix] = TransformColor(&color_transform, argb[ix], 0); |
| } |
| } |
| } |
| |
| void VP8LColorSpaceTransform(int width, int height, int bits, int step, |
| uint32_t* const argb, uint32_t* image) { |
| const int max_tile_size = 1 << bits; |
| int tile_xsize = VP8LSubSampleSize(width, bits); |
| int tile_ysize = VP8LSubSampleSize(height, bits); |
| int accumulated_red_histo[256] = { 0 }; |
| int accumulated_blue_histo[256] = { 0 }; |
| int tile_y; |
| int tile_x; |
| Multipliers prevX; |
| Multipliers prevY; |
| MultipliersClear(&prevY); |
| MultipliersClear(&prevX); |
| for (tile_y = 0; tile_y < tile_ysize; ++tile_y) { |
| for (tile_x = 0; tile_x < tile_xsize; ++tile_x) { |
| Multipliers color_transform; |
| int all_x_max; |
| int y; |
| const int tile_y_offset = tile_y * max_tile_size; |
| const int tile_x_offset = tile_x * max_tile_size; |
| if (tile_y != 0) { |
| ColorCodeToMultipliers(image[tile_y * tile_xsize + tile_x - 1], &prevX); |
| ColorCodeToMultipliers(image[(tile_y - 1) * tile_xsize + tile_x], |
| &prevY); |
| } else if (tile_x != 0) { |
| ColorCodeToMultipliers(image[tile_y * tile_xsize + tile_x - 1], &prevX); |
| } |
| color_transform = |
| GetBestColorTransformForTile(tile_x, tile_y, bits, |
| prevX, prevY, |
| step, width, height, |
| &accumulated_red_histo[0], |
| &accumulated_blue_histo[0], |
| argb); |
| image[tile_y * tile_xsize + tile_x] = |
| MultipliersToColorCode(&color_transform); |
| CopyTileWithColorTransform(width, height, tile_x, tile_y, bits, |
| color_transform, argb); |
| |
| // Gather accumulated histogram data. |
| all_x_max = tile_x_offset + max_tile_size; |
| if (all_x_max > width) { |
| all_x_max = width; |
| } |
| for (y = 0; y < max_tile_size; ++y) { |
| int ix; |
| int all_x; |
| int all_y = tile_y_offset + y; |
| if (all_y >= height) { |
| break; |
| } |
| ix = all_y * width + tile_x_offset; |
| for (all_x = tile_x_offset; all_x < all_x_max; ++all_x, ++ix) { |
| if (ix >= 2 && |
| argb[ix] == argb[ix - 2] && |
| argb[ix] == argb[ix - 1]) { |
| continue; // repeated pixels are handled by backward references |
| } |
| if (ix >= width + 2 && |
| argb[ix - 2] == argb[ix - width - 2] && |
| argb[ix - 1] == argb[ix - width - 1] && |
| argb[ix] == argb[ix - width]) { |
| continue; // repeated pixels are handled by backward references |
| } |
| ++accumulated_red_histo[(argb[ix] >> 16) & 0xff]; |
| ++accumulated_blue_histo[argb[ix] & 0xff]; |
| } |
| } |
| } |
| } |
| } |
| |
| // Color space inverse transform. |
| static void ColorSpaceInverseTransform(const VP8LTransform* const transform, |
| int y_start, int y_end, uint32_t* data) { |
| const int width = transform->xsize_; |
| const int mask = (1 << transform->bits_) - 1; |
| const int tiles_per_row = VP8LSubSampleSize(width, transform->bits_); |
| int y = y_start; |
| const uint32_t* pred_row = |
| transform->data_ + (y >> transform->bits_) * tiles_per_row; |
| |
| while (y < y_end) { |
| const uint32_t* pred = pred_row; |
| Multipliers m = { 0, 0, 0 }; |
| int x; |
| |
| for (x = 0; x < width; ++x) { |
| if ((x & mask) == 0) ColorCodeToMultipliers(*pred++, &m); |
| data[x] = TransformColor(&m, data[x], 1); |
| } |
| data += width; |
| ++y; |
| if ((y & mask) == 0) pred_row += tiles_per_row;; |
| } |
| } |
| |
| // Separate out pixels packed together using pixel-bundling. |
| static void ColorIndexInverseTransform( |
| const VP8LTransform* const transform, |
| int y_start, int y_end, const uint32_t* src, uint32_t* dst) { |
| int y; |
| const int bits_per_pixel = 8 >> transform->bits_; |
| const int width = transform->xsize_; |
| const uint32_t* const color_map = transform->data_; |
| if (bits_per_pixel < 8) { |
| const int pixels_per_byte = 1 << transform->bits_; |
| const int count_mask = pixels_per_byte - 1; |
| const uint32_t bit_mask = (1 << bits_per_pixel) - 1; |
| for (y = y_start; y < y_end; ++y) { |
| uint32_t packed_pixels = 0; |
| int x; |
| for (x = 0; x < width; ++x) { |
| // We need to load fresh 'packed_pixels' once every 'bytes_per_pixels' |
| // increments of x. Fortunately, pixels_per_byte is a power of 2, so |
| // can just use a mask for that, instead of decrementing a counter. |
| if ((x & count_mask) == 0) packed_pixels = ((*src++) >> 8) & 0xff; |
| *dst++ = color_map[packed_pixels & bit_mask]; |
| packed_pixels >>= bits_per_pixel; |
| } |
| } |
| } else { |
| for (y = y_start; y < y_end; ++y) { |
| int x; |
| for (x = 0; x < width; ++x) { |
| *dst++ = color_map[((*src++) >> 8) & 0xff]; |
| } |
| } |
| } |
| } |
| |
| void VP8LInverseTransform(const VP8LTransform* const transform, |
| int row_start, int row_end, |
| const uint32_t* const in, uint32_t* const out) { |
| assert(row_start < row_end); |
| assert(row_end <= transform->ysize_); |
| switch (transform->type_) { |
| case SUBTRACT_GREEN: |
| AddGreenToBlueAndRed(transform, row_start, row_end, out); |
| break; |
| case PREDICTOR_TRANSFORM: |
| PredictorInverseTransform(transform, row_start, row_end, out); |
| if (row_end != transform->ysize_) { |
| // The last predicted row in this iteration will be the top-pred row |
| // for the first row in next iteration. |
| const int width = transform->xsize_; |
| memcpy(out - width, out + (row_end - row_start - 1) * width, |
| width * sizeof(*out)); |
| } |
| break; |
| case CROSS_COLOR_TRANSFORM: |
| ColorSpaceInverseTransform(transform, row_start, row_end, out); |
| break; |
| case COLOR_INDEXING_TRANSFORM: |
| ColorIndexInverseTransform(transform, row_start, row_end, in, out); |
| break; |
| } |
| } |
| |
| //------------------------------------------------------------------------------ |
| // Color space conversion. |
| |
| static int is_big_endian(void) { |
| static const union { |
| uint16_t w; |
| uint8_t b[2]; |
| } tmp = { 1 }; |
| return (tmp.b[0] != 1); |
| } |
| |
| static void ConvertBGRAToRGB(const uint32_t* src, |
| int num_pixels, uint8_t* dst) { |
| const uint32_t* const src_end = src + num_pixels; |
| while (src < src_end) { |
| const uint32_t argb = *src++; |
| *dst++ = (argb >> 16) & 0xff; |
| *dst++ = (argb >> 8) & 0xff; |
| *dst++ = (argb >> 0) & 0xff; |
| } |
| } |
| |
| static void ConvertBGRAToRGBA(const uint32_t* src, |
| int num_pixels, uint8_t* dst) { |
| const uint32_t* const src_end = src + num_pixels; |
| while (src < src_end) { |
| const uint32_t argb = *src++; |
| *dst++ = (argb >> 16) & 0xff; |
| *dst++ = (argb >> 8) & 0xff; |
| *dst++ = (argb >> 0) & 0xff; |
| *dst++ = (argb >> 24) & 0xff; |
| } |
| } |
| |
| static void ConvertBGRAToRGBA4444(const uint32_t* src, |
| int num_pixels, uint8_t* dst) { |
| const uint32_t* const src_end = src + num_pixels; |
| while (src < src_end) { |
| const uint32_t argb = *src++; |
| *dst++ = ((argb >> 16) & 0xf0) | ((argb >> 12) & 0xf); |
| *dst++ = ((argb >> 0) & 0xf0) | ((argb >> 28) & 0xf); |
| } |
| } |
| |
| static void ConvertBGRAToRGB565(const uint32_t* src, |
| int num_pixels, uint8_t* dst) { |
| const uint32_t* const src_end = src + num_pixels; |
| while (src < src_end) { |
| const uint32_t argb = *src++; |
| *dst++ = ((argb >> 16) & 0xf8) | ((argb >> 13) & 0x7); |
| *dst++ = ((argb >> 5) & 0xe0) | ((argb >> 3) & 0x1f); |
| } |
| } |
| |
| static void ConvertBGRAToBGR(const uint32_t* src, |
| int num_pixels, uint8_t* dst) { |
| const uint32_t* const src_end = src + num_pixels; |
| while (src < src_end) { |
| const uint32_t argb = *src++; |
| *dst++ = (argb >> 0) & 0xff; |
| *dst++ = (argb >> 8) & 0xff; |
| *dst++ = (argb >> 16) & 0xff; |
| } |
| } |
| |
| static void CopyOrSwap(const uint32_t* src, int num_pixels, uint8_t* dst, |
| int swap_on_big_endian) { |
| if (is_big_endian() == swap_on_big_endian) { |
| const uint32_t* const src_end = src + num_pixels; |
| while (src < src_end) { |
| uint32_t argb = *src++; |
| #if !defined(__BIG_ENDIAN__) && (defined(__i386__) || defined(__x86_64__)) |
| __asm__ volatile("bswap %0" : "=r"(argb) : "0"(argb)); |
| *(uint32_t*)dst = argb; |
| dst += sizeof(argb); |
| #elif !defined(__BIG_ENDIAN__) && defined(_MSC_VER) |
| argb = _byteswap_ulong(argb); |
| *(uint32_t*)dst = argb; |
| dst += sizeof(argb); |
| #else |
| *dst++ = (argb >> 24) & 0xff; |
| *dst++ = (argb >> 16) & 0xff; |
| *dst++ = (argb >> 8) & 0xff; |
| *dst++ = (argb >> 0) & 0xff; |
| #endif |
| } |
| } else { |
| memcpy(dst, src, num_pixels * sizeof(*src)); |
| } |
| } |
| |
| void VP8LConvertFromBGRA(const uint32_t* const in_data, int num_pixels, |
| WEBP_CSP_MODE out_colorspace, uint8_t* const rgba) { |
| switch (out_colorspace) { |
| case MODE_RGB: |
| ConvertBGRAToRGB(in_data, num_pixels, rgba); |
| break; |
| case MODE_RGBA: |
| ConvertBGRAToRGBA(in_data, num_pixels, rgba); |
| break; |
| case MODE_rgbA: |
| ConvertBGRAToRGBA(in_data, num_pixels, rgba); |
| WebPApplyAlphaMultiply(rgba, 0, num_pixels, 1, 0); |
| break; |
| case MODE_BGR: |
| ConvertBGRAToBGR(in_data, num_pixels, rgba); |
| break; |
| case MODE_BGRA: |
| CopyOrSwap(in_data, num_pixels, rgba, 1); |
| break; |
| case MODE_bgrA: |
| CopyOrSwap(in_data, num_pixels, rgba, 1); |
| WebPApplyAlphaMultiply(rgba, 0, num_pixels, 1, 0); |
| break; |
| case MODE_ARGB: |
| CopyOrSwap(in_data, num_pixels, rgba, 0); |
| break; |
| case MODE_Argb: |
| CopyOrSwap(in_data, num_pixels, rgba, 0); |
| WebPApplyAlphaMultiply(rgba, 1, num_pixels, 1, 0); |
| break; |
| case MODE_RGBA_4444: |
| ConvertBGRAToRGBA4444(in_data, num_pixels, rgba); |
| break; |
| case MODE_rgbA_4444: |
| ConvertBGRAToRGBA4444(in_data, num_pixels, rgba); |
| WebPApplyAlphaMultiply4444(rgba, num_pixels, 1, 0); |
| break; |
| case MODE_RGB_565: |
| ConvertBGRAToRGB565(in_data, num_pixels, rgba); |
| break; |
| default: |
| assert(0); // Code flow should not reach here. |
| } |
| } |
| |
| //------------------------------------------------------------------------------ |
| |
| #if defined(__cplusplus) || defined(c_plusplus) |
| } // extern "C" |
| #endif |