Refactor histograms in predictors.

Replace the 2d histograms with uint32_t 1d versions (to avoid
pointer casting and to use the optimized VP8LAddVectorEq).

Change-Id: I90b0fe98390b49e3fd03e3484289571cf7ae6eca
This commit is contained in:
Vincent Rabaud 2024-05-03 22:09:38 +02:00
parent a7aa7525b8
commit a90160e11a
6 changed files with 90 additions and 97 deletions

View File

@ -155,13 +155,13 @@ extern VP8LTransformColorFunc VP8LTransformColor;
typedef void (*VP8LCollectColorBlueTransformsFunc)( typedef void (*VP8LCollectColorBlueTransformsFunc)(
const uint32_t* argb, int stride, const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_blue, int red_to_blue, int histo[]); int green_to_blue, int red_to_blue, uint32_t histo[]);
extern VP8LCollectColorBlueTransformsFunc VP8LCollectColorBlueTransforms; extern VP8LCollectColorBlueTransformsFunc VP8LCollectColorBlueTransforms;
typedef void (*VP8LCollectColorRedTransformsFunc)( typedef void (*VP8LCollectColorRedTransformsFunc)(
const uint32_t* argb, int stride, const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_red, int histo[]); int green_to_red, uint32_t histo[]);
extern VP8LCollectColorRedTransformsFunc VP8LCollectColorRedTransforms; extern VP8LCollectColorRedTransformsFunc VP8LCollectColorRedTransforms;
// Expose some C-only fallback functions // Expose some C-only fallback functions
@ -170,11 +170,11 @@ void VP8LTransformColor_C(const VP8LMultipliers* const m,
void VP8LSubtractGreenFromBlueAndRed_C(uint32_t* argb_data, int num_pixels); void VP8LSubtractGreenFromBlueAndRed_C(uint32_t* argb_data, int num_pixels);
void VP8LCollectColorRedTransforms_C(const uint32_t* argb, int stride, void VP8LCollectColorRedTransforms_C(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_red, int histo[]); int green_to_red, uint32_t histo[]);
void VP8LCollectColorBlueTransforms_C(const uint32_t* argb, int stride, void VP8LCollectColorBlueTransforms_C(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_blue, int red_to_blue, int green_to_blue, int red_to_blue,
int histo[]); uint32_t histo[]);
extern VP8LPredictorAddSubFunc VP8LPredictorsSub[16]; extern VP8LPredictorAddSubFunc VP8LPredictorsSub[16];
extern VP8LPredictorAddSubFunc VP8LPredictorsSub_C[16]; extern VP8LPredictorAddSubFunc VP8LPredictorsSub_C[16];
@ -185,8 +185,8 @@ extern VP8LPredictorAddSubFunc VP8LPredictorsSub_C[16];
typedef uint32_t (*VP8LCostFunc)(const uint32_t* population, int length); typedef uint32_t (*VP8LCostFunc)(const uint32_t* population, int length);
typedef uint32_t (*VP8LCostCombinedFunc)(const uint32_t* X, const uint32_t* Y, typedef uint32_t (*VP8LCostCombinedFunc)(const uint32_t* X, const uint32_t* Y,
int length); int length);
typedef float (*VP8LCombinedShannonEntropyFunc)(const int X[256], typedef float (*VP8LCombinedShannonEntropyFunc)(const uint32_t X[256],
const int Y[256]); const uint32_t Y[256]);
extern VP8LCostFunc VP8LExtraCost; extern VP8LCostFunc VP8LExtraCost;
extern VP8LCostCombinedFunc VP8LExtraCostCombined; extern VP8LCostCombinedFunc VP8LExtraCostCombined;

View File

@ -400,14 +400,15 @@ static float FastLog2Slow_C(uint32_t v) {
// Methods to calculate Entropy (Shannon). // Methods to calculate Entropy (Shannon).
// Compute the combined Shanon's entropy for distribution {X} and {X+Y} // Compute the combined Shanon's entropy for distribution {X} and {X+Y}
static float CombinedShannonEntropy_C(const int X[256], const int Y[256]) { static float CombinedShannonEntropy_C(const uint32_t X[256],
const uint32_t Y[256]) {
int i; int i;
float retval = 0.f; float retval = 0.f;
int sumX = 0, sumXY = 0; uint32_t sumX = 0, sumXY = 0;
for (i = 0; i < 256; ++i) { for (i = 0; i < 256; ++i) {
const int x = X[i]; const uint32_t x = X[i];
if (x != 0) { if (x != 0) {
const int xy = x + Y[i]; const uint32_t xy = x + Y[i];
sumX += x; sumX += x;
retval -= VP8LFastSLog2(x); retval -= VP8LFastSLog2(x);
sumXY += xy; sumXY += xy;
@ -577,7 +578,7 @@ static WEBP_INLINE uint8_t TransformColorBlue(uint8_t green_to_blue,
void VP8LCollectColorRedTransforms_C(const uint32_t* argb, int stride, void VP8LCollectColorRedTransforms_C(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_red, int histo[]) { int green_to_red, uint32_t histo[]) {
while (tile_height-- > 0) { while (tile_height-- > 0) {
int x; int x;
for (x = 0; x < tile_width; ++x) { for (x = 0; x < tile_width; ++x) {
@ -590,7 +591,7 @@ void VP8LCollectColorRedTransforms_C(const uint32_t* argb, int stride,
void VP8LCollectColorBlueTransforms_C(const uint32_t* argb, int stride, void VP8LCollectColorBlueTransforms_C(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_blue, int red_to_blue, int green_to_blue, int red_to_blue,
int histo[]) { uint32_t histo[]) {
while (tile_height-- > 0) { while (tile_height-- > 0) {
int x; int x;
for (x = 0; x < tile_width; ++x) { for (x = 0; x < tile_width; ++x) {

View File

@ -171,13 +171,9 @@ static WEBP_INLINE uint8_t TransformColorBlue(uint8_t green_to_blue,
return (new_blue & 0xff); return (new_blue & 0xff);
} }
static void CollectColorBlueTransforms_MIPSdspR2(const uint32_t* argb, static void CollectColorBlueTransforms_MIPSdspR2(
int stride, const uint32_t* argb, int stride, int tile_width, int tile_height,
int tile_width, int green_to_blue, int red_to_blue, uint32_t histo[]) {
int tile_height,
int green_to_blue,
int red_to_blue,
int histo[]) {
const int rtb = (red_to_blue << 16) | (red_to_blue & 0xffff); const int rtb = (red_to_blue << 16) | (red_to_blue & 0xffff);
const int gtb = (green_to_blue << 16) | (green_to_blue & 0xffff); const int gtb = (green_to_blue << 16) | (green_to_blue & 0xffff);
const uint32_t mask = 0xff00ffu; const uint32_t mask = 0xff00ffu;
@ -226,11 +222,10 @@ static WEBP_INLINE uint8_t TransformColorRed(uint8_t green_to_red,
} }
static void CollectColorRedTransforms_MIPSdspR2(const uint32_t* argb, static void CollectColorRedTransforms_MIPSdspR2(const uint32_t* argb,
int stride, int stride, int tile_width,
int tile_width,
int tile_height, int tile_height,
int green_to_red, int green_to_red,
int histo[]) { uint32_t histo[]) {
const int gtr = (green_to_red << 16) | (green_to_red & 0xffff); const int gtr = (green_to_red << 16) | (green_to_red & 0xffff);
while (tile_height-- > 0) { while (tile_height-- > 0) {
int x; int x;

View File

@ -82,7 +82,7 @@ static void TransformColor_SSE2(const VP8LMultipliers* const m,
static void CollectColorBlueTransforms_SSE2(const uint32_t* argb, int stride, static void CollectColorBlueTransforms_SSE2(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_blue, int red_to_blue, int green_to_blue, int red_to_blue,
int histo[]) { uint32_t histo[]) {
const __m128i mults_r = MK_CST_16(CST_5b(red_to_blue), 0); const __m128i mults_r = MK_CST_16(CST_5b(red_to_blue), 0);
const __m128i mults_g = MK_CST_16(0, CST_5b(green_to_blue)); const __m128i mults_g = MK_CST_16(0, CST_5b(green_to_blue));
const __m128i mask_g = _mm_set1_epi32(0x00ff00); // green mask const __m128i mask_g = _mm_set1_epi32(0x00ff00); // green mask
@ -128,7 +128,7 @@ static void CollectColorBlueTransforms_SSE2(const uint32_t* argb, int stride,
static void CollectColorRedTransforms_SSE2(const uint32_t* argb, int stride, static void CollectColorRedTransforms_SSE2(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_red, int histo[]) { int green_to_red, uint32_t histo[]) {
const __m128i mults_g = MK_CST_16(0, CST_5b(green_to_red)); const __m128i mults_g = MK_CST_16(0, CST_5b(green_to_red));
const __m128i mask_g = _mm_set1_epi32(0x00ff00); // green mask const __m128i mask_g = _mm_set1_epi32(0x00ff00); // green mask
const __m128i mask = _mm_set1_epi32(0xff); const __m128i mask = _mm_set1_epi32(0xff);
@ -237,10 +237,11 @@ static void AddVectorEq_SSE2(const uint32_t* a, uint32_t* out, int size) {
// when compared to -noasm. // when compared to -noasm.
#if !(defined(WEBP_HAVE_SLOW_CLZ_CTZ) || defined(__i386__) || defined(_M_IX86)) #if !(defined(WEBP_HAVE_SLOW_CLZ_CTZ) || defined(__i386__) || defined(_M_IX86))
static float CombinedShannonEntropy_SSE2(const int X[256], const int Y[256]) { static float CombinedShannonEntropy_SSE2(const uint32_t X[256],
const uint32_t Y[256]) {
int i; int i;
float retval = 0.f; float retval = 0.f;
int sumX = 0, sumXY = 0; uint32_t sumX = 0, sumXY = 0;
const __m128i zero = _mm_setzero_si128(); const __m128i zero = _mm_setzero_si128();
for (i = 0; i < 256; i += 16) { for (i = 0; i < 256; i += 16) {
@ -260,7 +261,7 @@ static float CombinedShannonEntropy_SSE2(const int X[256], const int Y[256]) {
int32_t my = _mm_movemask_epi8(_mm_cmpgt_epi8(y4, zero)) | mx; int32_t my = _mm_movemask_epi8(_mm_cmpgt_epi8(y4, zero)) | mx;
while (my) { while (my) {
const int32_t j = BitsCtz(my); const int32_t j = BitsCtz(my);
int xy; uint32_t xy;
if ((mx >> j) & 1) { if ((mx >> j) & 1) {
const int x = X[i + j]; const int x = X[i + j];
sumXY += x; sumXY += x;

View File

@ -98,7 +98,7 @@ static void SubtractGreenFromBlueAndRed_SSE41(uint32_t* argb_data,
static void CollectColorBlueTransforms_SSE41(const uint32_t* argb, int stride, static void CollectColorBlueTransforms_SSE41(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_blue, int red_to_blue, int green_to_blue, int red_to_blue,
int histo[]) { uint32_t histo[]) {
const __m128i mult = const __m128i mult =
MK_CST_16(CST_5b(red_to_blue) + 256,CST_5b(green_to_blue)); MK_CST_16(CST_5b(red_to_blue) + 256,CST_5b(green_to_blue));
const __m128i perm = const __m128i perm =
@ -143,8 +143,8 @@ static void CollectColorBlueTransforms_SSE41(const uint32_t* argb, int stride,
static void CollectColorRedTransforms_SSE41(const uint32_t* argb, int stride, static void CollectColorRedTransforms_SSE41(const uint32_t* argb, int stride,
int tile_width, int tile_height, int tile_width, int tile_height,
int green_to_red, int histo[]) { int green_to_red,
uint32_t histo[]) {
const __m128i mult = MK_CST_16(0, CST_5b(green_to_red)); const __m128i mult = MK_CST_16(0, CST_5b(green_to_red));
const __m128i mask_g = _mm_set1_epi32(0x0000ff00); const __m128i mask_g = _mm_set1_epi32(0x0000ff00);
if (tile_width >= 4) { if (tile_width >= 4) {

View File

@ -20,7 +20,7 @@
#include "src/enc/vp8li_enc.h" #include "src/enc/vp8li_enc.h"
#define MAX_DIFF_COST (1e30f) #define MAX_DIFF_COST (1e30f)
#define HISTO_SIZE (4 * 256)
static const float kSpatialPredictorBias = 15.f; static const float kSpatialPredictorBias = 15.f;
static const int kPredLowEffort = 11; static const int kPredLowEffort = 11;
static const uint32_t kMaskAlpha = 0xff000000; static const uint32_t kMaskAlpha = 0xff000000;
@ -31,8 +31,10 @@ static WEBP_INLINE int GetMin(int a, int b) { return (a > b) ? b : a; }
//------------------------------------------------------------------------------ //------------------------------------------------------------------------------
// Methods to calculate Entropy (Shannon). // Methods to calculate Entropy (Shannon).
static float PredictionCostSpatial(const int counts[256], int weight_0, // Compute a bias for prediction entropy using a global heuristic to favor
float exp_val) { // values closer to 0. Hence the final negative sign.
static float PredictionCostBias(const uint32_t counts[256], int weight_0,
float exp_val) {
const int significant_symbols = 256 >> 4; const int significant_symbols = 256 >> 4;
const float exp_decay_factor = 0.6f; const float exp_decay_factor = 0.6f;
float bits = (float)weight_0 * counts[0]; float bits = (float)weight_0 * counts[0];
@ -44,23 +46,31 @@ static float PredictionCostSpatial(const int counts[256], int weight_0,
return (float)(-0.1 * bits); return (float)(-0.1 * bits);
} }
static float PredictionCostSpatialHistogram(const int accumulated[4][256], static float PredictionCostSpatialHistogram(
const int tile[4][256]) { const uint32_t accumulated[HISTO_SIZE], const uint32_t tile[HISTO_SIZE],
int mode, int left_mode, int above_mode) {
int i; int i;
float retval = 0.f; float retval = 0.f;
for (i = 0; i < 4; ++i) { for (i = 0; i < 4; ++i) {
const float kExpValue = 0.94f; const float kExpValue = 0.94f;
retval += PredictionCostSpatial(tile[i], 1, kExpValue); retval += PredictionCostBias(&tile[i * 256], 1, kExpValue);
retval += VP8LCombinedShannonEntropy(tile[i], accumulated[i]); // Compute the new cost if 'tile' is added to 'accumulate' but also add the
// cost of the current histogram to guide the spatial predictor selection.
// Basically, favor low entropy, locally and globally.
retval += VP8LCombinedShannonEntropy(&tile[i * 256], &accumulated[i * 256]);
} }
return (float)retval; // Favor keeping the areas locally similar.
if (mode == left_mode) retval -= kSpatialPredictorBias;
if (mode == above_mode) retval -= kSpatialPredictorBias;
return retval;
} }
static WEBP_INLINE void UpdateHisto(int histo_argb[4][256], uint32_t argb) { static WEBP_INLINE void UpdateHisto(uint32_t histo_argb[HISTO_SIZE],
++histo_argb[0][argb >> 24]; uint32_t argb) {
++histo_argb[1][(argb >> 16) & 0xff]; ++histo_argb[0 * 256 + (argb >> 24)];
++histo_argb[2][(argb >> 8) & 0xff]; ++histo_argb[1 * 256 + ((argb >> 16) & 0xff)];
++histo_argb[3][argb & 0xff]; ++histo_argb[2 * 256 + ((argb >> 8) & 0xff)];
++histo_argb[3 * 256 + (argb & 0xff)];
} }
//------------------------------------------------------------------------------ //------------------------------------------------------------------------------
@ -296,14 +306,11 @@ static WEBP_INLINE void GetResidual(
// applied, quantizing residuals to multiples of quantization levels up to // applied, quantizing residuals to multiples of quantization levels up to
// max_quantization (the actual quantization level depends on smoothness near // max_quantization (the actual quantization level depends on smoothness near
// the given pixel). // the given pixel).
static int GetBestPredictorForTile(int width, int height, static int GetBestPredictorForTile(
int tile_x, int tile_y, int bits, int width, int height, int tile_x, int tile_y, int bits,
int accumulated[4][256], uint32_t accumulated[HISTO_SIZE], uint32_t* const argb_scratch,
uint32_t* const argb_scratch, const uint32_t* const argb, int max_quantization, int exact,
const uint32_t* const argb, int used_subtract_green, const uint32_t* const modes) {
int max_quantization,
int exact, int used_subtract_green,
const uint32_t* const modes) {
const int kNumPredModes = 14; const int kNumPredModes = 14;
const int start_x = tile_x << bits; const int start_x = tile_x << bits;
const int start_y = tile_y << bits; const int start_y = tile_y << bits;
@ -333,12 +340,11 @@ static int GetBestPredictorForTile(int width, int height,
float best_diff = MAX_DIFF_COST; float best_diff = MAX_DIFF_COST;
int best_mode = 0; int best_mode = 0;
int mode; int mode;
int histo_stack_1[4][256]; uint32_t histo_stack_1[HISTO_SIZE];
int histo_stack_2[4][256]; uint32_t histo_stack_2[HISTO_SIZE];
// Need pointers to be able to swap arrays. // Need pointers to be able to swap arrays.
int (*histo_argb)[256] = histo_stack_1; uint32_t* histo_argb = histo_stack_1;
int (*best_histo)[256] = histo_stack_2; uint32_t* best_histo = histo_stack_2;
int i, j;
uint32_t residuals[1 << MAX_TRANSFORM_BITS]; uint32_t residuals[1 << MAX_TRANSFORM_BITS];
assert(bits <= MAX_TRANSFORM_BITS); assert(bits <= MAX_TRANSFORM_BITS);
assert(max_x <= (1 << MAX_TRANSFORM_BITS)); assert(max_x <= (1 << MAX_TRANSFORM_BITS));
@ -383,14 +389,11 @@ static int GetBestPredictorForTile(int width, int height,
UpdateHisto(histo_argb, residuals[relative_x]); UpdateHisto(histo_argb, residuals[relative_x]);
} }
} }
cur_diff = PredictionCostSpatialHistogram( cur_diff = PredictionCostSpatialHistogram(accumulated, histo_argb, mode,
(const int (*)[256])accumulated, (const int (*)[256])histo_argb); left_mode, above_mode);
// Favor keeping the areas locally similar.
if (mode == left_mode) cur_diff -= kSpatialPredictorBias;
if (mode == above_mode) cur_diff -= kSpatialPredictorBias;
if (cur_diff < best_diff) { if (cur_diff < best_diff) {
int (*tmp)[256] = histo_argb; uint32_t* tmp = histo_argb;
histo_argb = best_histo; histo_argb = best_histo;
best_histo = tmp; best_histo = tmp;
best_diff = cur_diff; best_diff = cur_diff;
@ -398,12 +401,7 @@ static int GetBestPredictorForTile(int width, int height,
} }
} }
for (i = 0; i < 4; i++) { VP8LAddVectorEq(best_histo, accumulated, HISTO_SIZE);
for (j = 0; j < 256; j++) {
accumulated[i][j] += best_histo[i][j];
}
}
return best_mode; return best_mode;
} }
@ -482,8 +480,6 @@ int VP8LResidualImage(int width, int height, int bits, int low_effort,
const int tiles_per_row = VP8LSubSampleSize(width, bits); const int tiles_per_row = VP8LSubSampleSize(width, bits);
const int tiles_per_col = VP8LSubSampleSize(height, bits); const int tiles_per_col = VP8LSubSampleSize(height, bits);
int percent_start = *percent; int percent_start = *percent;
int tile_y;
int histo[4][256];
const int max_quantization = 1 << VP8LNearLosslessBits(near_lossless_quality); const int max_quantization = 1 << VP8LNearLosslessBits(near_lossless_quality);
if (low_effort) { if (low_effort) {
int i; int i;
@ -491,7 +487,8 @@ int VP8LResidualImage(int width, int height, int bits, int low_effort,
image[i] = ARGB_BLACK | (kPredLowEffort << 8); image[i] = ARGB_BLACK | (kPredLowEffort << 8);
} }
} else { } else {
memset(histo, 0, sizeof(histo)); int tile_y;
uint32_t histo[HISTO_SIZE] = { 0 };
for (tile_y = 0; tile_y < tiles_per_col; ++tile_y) { for (tile_y = 0; tile_y < tiles_per_col; ++tile_y) {
int tile_x; int tile_x;
for (tile_x = 0; tile_x < tiles_per_row; ++tile_x) { for (tile_x = 0; tile_x < tiles_per_row; ++tile_x) {
@ -539,20 +536,20 @@ static WEBP_INLINE uint32_t MultipliersToColorCode(
m->green_to_red_; m->green_to_red_;
} }
static float PredictionCostCrossColor(const int accumulated[256], static float PredictionCostCrossColor(const uint32_t accumulated[256],
const int counts[256]) { const uint32_t counts[256]) {
// Favor low entropy, locally and globally. // Favor low entropy, locally and globally.
// Favor small absolute values for PredictionCostSpatial // Favor small absolute values for PredictionCostSpatial
static const float kExpValue = 2.4f; static const float kExpValue = 2.4f;
return VP8LCombinedShannonEntropy(counts, accumulated) + return VP8LCombinedShannonEntropy(counts, accumulated) +
PredictionCostSpatial(counts, 3, kExpValue); PredictionCostBias(counts, 3, kExpValue);
} }
static float GetPredictionCostCrossColorRed( static float GetPredictionCostCrossColorRed(
const uint32_t* argb, int stride, int tile_width, int tile_height, const uint32_t* argb, int stride, int tile_width, int tile_height,
VP8LMultipliers prev_x, VP8LMultipliers prev_y, int green_to_red, VP8LMultipliers prev_x, VP8LMultipliers prev_y, int green_to_red,
const int accumulated_red_histo[256]) { const uint32_t accumulated_red_histo[256]) {
int histo[256] = { 0 }; uint32_t histo[256] = { 0 };
float cur_diff; float cur_diff;
VP8LCollectColorRedTransforms(argb, stride, tile_width, tile_height, VP8LCollectColorRedTransforms(argb, stride, tile_width, tile_height,
@ -571,10 +568,11 @@ static float GetPredictionCostCrossColorRed(
return cur_diff; return cur_diff;
} }
static void GetBestGreenToRed( static void GetBestGreenToRed(const uint32_t* argb, int stride, int tile_width,
const uint32_t* argb, int stride, int tile_width, int tile_height, int tile_height, VP8LMultipliers prev_x,
VP8LMultipliers prev_x, VP8LMultipliers prev_y, int quality, VP8LMultipliers prev_y, int quality,
const int accumulated_red_histo[256], VP8LMultipliers* const best_tx) { const uint32_t accumulated_red_histo[256],
VP8LMultipliers* const best_tx) {
const int kMaxIters = 4 + ((7 * quality) >> 8); // in range [4..6] const int kMaxIters = 4 + ((7 * quality) >> 8); // in range [4..6]
int green_to_red_best = 0; int green_to_red_best = 0;
int iter, offset; int iter, offset;
@ -603,9 +601,9 @@ static void GetBestGreenToRed(
static float GetPredictionCostCrossColorBlue( static float GetPredictionCostCrossColorBlue(
const uint32_t* argb, int stride, int tile_width, int tile_height, const uint32_t* argb, int stride, int tile_width, int tile_height,
VP8LMultipliers prev_x, VP8LMultipliers prev_y, VP8LMultipliers prev_x, VP8LMultipliers prev_y, int green_to_blue,
int green_to_blue, int red_to_blue, const int accumulated_blue_histo[256]) { int red_to_blue, const uint32_t accumulated_blue_histo[256]) {
int histo[256] = { 0 }; uint32_t histo[256] = { 0 };
float cur_diff; float cur_diff;
VP8LCollectColorBlueTransforms(argb, stride, tile_width, tile_height, VP8LCollectColorBlueTransforms(argb, stride, tile_width, tile_height,
@ -635,11 +633,12 @@ static float GetPredictionCostCrossColorBlue(
#define kGreenRedToBlueNumAxis 8 #define kGreenRedToBlueNumAxis 8
#define kGreenRedToBlueMaxIters 7 #define kGreenRedToBlueMaxIters 7
static void GetBestGreenRedToBlue( static void GetBestGreenRedToBlue(const uint32_t* argb, int stride,
const uint32_t* argb, int stride, int tile_width, int tile_height, int tile_width, int tile_height,
VP8LMultipliers prev_x, VP8LMultipliers prev_y, int quality, VP8LMultipliers prev_x,
const int accumulated_blue_histo[256], VP8LMultipliers prev_y, int quality,
VP8LMultipliers* const best_tx) { const uint32_t accumulated_blue_histo[256],
VP8LMultipliers* const best_tx) {
const int8_t offset[kGreenRedToBlueNumAxis][2] = const int8_t offset[kGreenRedToBlueNumAxis][2] =
{{0, -1}, {0, 1}, {-1, 0}, {1, 0}, {-1, -1}, {-1, 1}, {1, -1}, {1, 1}}; {{0, -1}, {0, 1}, {-1, 0}, {1, 0}, {-1, -1}, {-1, 1}, {1, -1}, {1, 1}};
const int8_t delta_lut[kGreenRedToBlueMaxIters] = { 16, 16, 8, 4, 2, 2, 2 }; const int8_t delta_lut[kGreenRedToBlueMaxIters] = { 16, 16, 8, 4, 2, 2, 2 };
@ -684,13 +683,10 @@ static void GetBestGreenRedToBlue(
#undef kGreenRedToBlueNumAxis #undef kGreenRedToBlueNumAxis
static VP8LMultipliers GetBestColorTransformForTile( static VP8LMultipliers GetBestColorTransformForTile(
int tile_x, int tile_y, int bits, int tile_x, int tile_y, int bits, VP8LMultipliers prev_x,
VP8LMultipliers prev_x, VP8LMultipliers prev_y, int quality, int xsize, int ysize,
VP8LMultipliers prev_y, const uint32_t accumulated_red_histo[256],
int quality, int xsize, int ysize, const uint32_t accumulated_blue_histo[256], const uint32_t* const argb) {
const int accumulated_red_histo[256],
const int accumulated_blue_histo[256],
const uint32_t* const argb) {
const int max_tile_size = 1 << bits; const int max_tile_size = 1 << bits;
const int tile_y_offset = tile_y * max_tile_size; const int tile_y_offset = tile_y * max_tile_size;
const int tile_x_offset = tile_x * max_tile_size; const int tile_x_offset = tile_x * max_tile_size;
@ -733,8 +729,8 @@ int VP8LColorSpaceTransform(int width, int height, int bits, int quality,
const int tile_xsize = VP8LSubSampleSize(width, bits); const int tile_xsize = VP8LSubSampleSize(width, bits);
const int tile_ysize = VP8LSubSampleSize(height, bits); const int tile_ysize = VP8LSubSampleSize(height, bits);
int percent_start = *percent; int percent_start = *percent;
int accumulated_red_histo[256] = { 0 }; uint32_t accumulated_red_histo[256] = { 0 };
int accumulated_blue_histo[256] = { 0 }; uint32_t accumulated_blue_histo[256] = { 0 };
int tile_x, tile_y; int tile_x, tile_y;
VP8LMultipliers prev_x, prev_y; VP8LMultipliers prev_x, prev_y;
MultipliersClear(&prev_y); MultipliersClear(&prev_y);