2015-02-07 11:13:26 +01:00
|
|
|
// Copyright 2014 Google Inc. All Rights Reserved.
//
// Use of this source code is governed by a BSD-style license
// that can be found in the COPYING file in the root of the source
// tree. An additional intellectual property rights grant can be found
// in the file PATENTS. All contributing project authors may
// be found in the AUTHORS file in the root of the source tree.
// -----------------------------------------------------------------------------
//
// Author: Djordje Pesut (djordje.pesut@imgtec.com)
|
|
|
|
|
|
|
|
#include "./dsp.h"
|
|
|
|
|
|
|
|
#if defined(WEBP_USE_MIPS32)
|
|
|
|
|
|
|
|
#include "../enc/cost.h"
|
|
|
|
|
|
|
|
static int GetResidualCost(int ctx0, const VP8Residual* const res) {
|
|
|
|
int n = res->first;
|
|
|
|
// should be prob[VP8EncBands[n]], but it's equivalent for n=0 or 1
|
|
|
|
int p0 = res->prob[n][ctx0][0];
|
|
|
|
const uint16_t* t = res->cost[n][ctx0];
|
|
|
|
int cost;
|
|
|
|
const int const_2 = 2;
|
|
|
|
const int const_255 = 255;
|
|
|
|
const int const_max_level = MAX_VARIABLE_LEVEL;
|
|
|
|
int res_cost;
|
|
|
|
int res_prob;
|
|
|
|
int res_coeffs;
|
|
|
|
int res_last;
|
|
|
|
int v_reg;
|
|
|
|
int b_reg;
|
|
|
|
int ctx_reg;
|
|
|
|
int cost_add, temp_1, temp_2, temp_3;
|
|
|
|
|
|
|
|
if (res->last < 0) {
|
|
|
|
return VP8BitCost(0, p0);
|
|
|
|
}
|
|
|
|
|
|
|
|
cost = (ctx0 == 0) ? VP8BitCost(1, p0) : 0;
|
|
|
|
|
|
|
|
res_cost = (int)res->cost;
|
|
|
|
res_prob = (int)res->prob;
|
|
|
|
res_coeffs = (int)res->coeffs;
|
|
|
|
res_last = (int)res->last;
|
|
|
|
|
|
|
|
__asm__ volatile(
|
|
|
|
".set push \n\t"
|
|
|
|
".set noreorder \n\t"
|
|
|
|
|
|
|
|
"sll %[temp_1], %[n], 1 \n\t"
|
|
|
|
"addu %[res_coeffs], %[res_coeffs], %[temp_1] \n\t"
|
|
|
|
"slt %[temp_2], %[n], %[res_last] \n\t"
|
|
|
|
"bnez %[temp_2], 1f \n\t"
|
|
|
|
" li %[cost_add], 0 \n\t"
|
|
|
|
"b 2f \n\t"
|
|
|
|
" nop \n\t"
|
|
|
|
"1: \n\t"
|
|
|
|
"lh %[v_reg], 0(%[res_coeffs]) \n\t"
|
|
|
|
"addu %[b_reg], %[n], %[VP8EncBands] \n\t"
|
|
|
|
"move %[temp_1], %[const_max_level] \n\t"
|
|
|
|
"addu %[cost], %[cost], %[cost_add] \n\t"
|
|
|
|
"negu %[temp_2], %[v_reg] \n\t"
|
|
|
|
"slti %[temp_3], %[v_reg], 0 \n\t"
|
|
|
|
"movn %[v_reg], %[temp_2], %[temp_3] \n\t"
|
|
|
|
"lbu %[b_reg], 1(%[b_reg]) \n\t"
|
|
|
|
"li %[cost_add], 0 \n\t"
|
|
|
|
|
|
|
|
"sltiu %[temp_3], %[v_reg], 2 \n\t"
|
|
|
|
"move %[ctx_reg], %[v_reg] \n\t"
|
|
|
|
"movz %[ctx_reg], %[const_2], %[temp_3] \n\t"
|
|
|
|
// cost += VP8LevelCost(t, v);
|
|
|
|
"slt %[temp_3], %[v_reg], %[const_max_level] \n\t"
|
|
|
|
"movn %[temp_1], %[v_reg], %[temp_3] \n\t"
|
|
|
|
"sll %[temp_2], %[v_reg], 1 \n\t"
|
|
|
|
"addu %[temp_2], %[temp_2], %[VP8LevelFixedCosts] \n\t"
|
|
|
|
"lhu %[temp_2], 0(%[temp_2]) \n\t"
|
|
|
|
"sll %[temp_1], %[temp_1], 1 \n\t"
|
|
|
|
"addu %[temp_1], %[temp_1], %[t] \n\t"
|
|
|
|
"lhu %[temp_3], 0(%[temp_1]) \n\t"
|
|
|
|
"addu %[cost], %[cost], %[temp_2] \n\t"
|
|
|
|
|
|
|
|
// t = res->cost[b][ctx];
|
|
|
|
"sll %[temp_1], %[ctx_reg], 7 \n\t"
|
|
|
|
"sll %[temp_2], %[ctx_reg], 3 \n\t"
|
|
|
|
"addu %[cost], %[cost], %[temp_3] \n\t"
|
|
|
|
"addu %[temp_1], %[temp_1], %[temp_2] \n\t"
|
|
|
|
"sll %[temp_2], %[b_reg], 3 \n\t"
|
|
|
|
"sll %[temp_3], %[b_reg], 5 \n\t"
|
|
|
|
"sub %[temp_2], %[temp_3], %[temp_2] \n\t"
|
|
|
|
"sll %[temp_3], %[temp_2], 4 \n\t"
|
|
|
|
"addu %[temp_1], %[temp_1], %[temp_3] \n\t"
|
|
|
|
"addu %[temp_2], %[temp_2], %[res_cost] \n\t"
|
|
|
|
"addiu %[n], %[n], 1 \n\t"
|
|
|
|
"addu %[t], %[temp_1], %[temp_2] \n\t"
|
|
|
|
"slt %[temp_1], %[n], %[res_last] \n\t"
|
|
|
|
"bnez %[temp_1], 1b \n\t"
|
|
|
|
" addiu %[res_coeffs], %[res_coeffs], 2 \n\t"
|
|
|
|
"2: \n\t"
|
|
|
|
|
|
|
|
".set pop \n\t"
|
|
|
|
: [cost]"+r"(cost), [t]"+r"(t), [n]"+r"(n), [v_reg]"=&r"(v_reg),
|
|
|
|
[ctx_reg]"=&r"(ctx_reg), [b_reg]"=&r"(b_reg), [cost_add]"=&r"(cost_add),
|
|
|
|
[temp_1]"=&r"(temp_1), [temp_2]"=&r"(temp_2), [temp_3]"=&r"(temp_3)
|
|
|
|
: [const_2]"r"(const_2), [const_255]"r"(const_255), [res_last]"r"(res_last),
|
|
|
|
[VP8EntropyCost]"r"(VP8EntropyCost), [VP8EncBands]"r"(VP8EncBands),
|
|
|
|
[const_max_level]"r"(const_max_level), [res_prob]"r"(res_prob),
|
|
|
|
[VP8LevelFixedCosts]"r"(VP8LevelFixedCosts), [res_coeffs]"r"(res_coeffs),
|
|
|
|
[res_cost]"r"(res_cost)
|
|
|
|
: "memory"
|
|
|
|
);
|
|
|
|
|
|
|
|
// Last coefficient is always non-zero
|
|
|
|
{
|
|
|
|
const int v = abs(res->coeffs[n]);
|
|
|
|
assert(v != 0);
|
|
|
|
cost += VP8LevelCost(t, v);
|
|
|
|
if (n < 15) {
|
|
|
|
const int b = VP8EncBands[n + 1];
|
|
|
|
const int ctx = (v == 1) ? 1 : 2;
|
|
|
|
const int last_p0 = res->prob[b][ctx][0];
|
|
|
|
cost += VP8BitCost(0, last_p0);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return cost;
|
|
|
|
}
|
|
|
|
|
2015-02-09 10:56:23 +01:00
|
|
|
static void SetResidualCoeffs(const int16_t* const coeffs,
|
|
|
|
VP8Residual* const res) {
|
|
|
|
const int16_t* p_coeffs = (int16_t*)coeffs;
|
|
|
|
int temp0, temp1, temp2, n, n1;
|
|
|
|
assert(res->first == 0 || coeffs[0] == 0);
|
|
|
|
|
|
|
|
__asm__ volatile (
|
|
|
|
".set push \n\t"
|
|
|
|
".set noreorder \n\t"
|
|
|
|
"addiu %[p_coeffs], %[p_coeffs], 28 \n\t"
|
|
|
|
"li %[n], 15 \n\t"
|
|
|
|
"li %[temp2], -1 \n\t"
|
|
|
|
"0: \n\t"
|
|
|
|
"ulw %[temp0], 0(%[p_coeffs]) \n\t"
|
|
|
|
"beqz %[temp0], 1f \n\t"
|
|
|
|
#if defined(WORDS_BIGENDIAN)
|
|
|
|
" sll %[temp1], %[temp0], 16 \n\t"
|
|
|
|
#else
|
|
|
|
" srl %[temp1], %[temp0], 16 \n\t"
|
|
|
|
#endif
|
|
|
|
"addiu %[n1], %[n], -1 \n\t"
|
|
|
|
"movz %[temp0], %[n1], %[temp1] \n\t"
|
|
|
|
"movn %[temp0], %[n], %[temp1] \n\t"
|
|
|
|
"j 2f \n\t"
|
|
|
|
" addiu %[temp2], %[temp0], 0 \n\t"
|
|
|
|
"1: \n\t"
|
|
|
|
"addiu %[n], %[n], -2 \n\t"
|
|
|
|
"bgtz %[n], 0b \n\t"
|
|
|
|
" addiu %[p_coeffs], %[p_coeffs], -4 \n\t"
|
|
|
|
"2: \n\t"
|
|
|
|
".set pop \n\t"
|
|
|
|
: [p_coeffs]"+&r"(p_coeffs), [temp0]"=&r"(temp0),
|
|
|
|
[temp1]"=&r"(temp1), [temp2]"=&r"(temp2),
|
|
|
|
[n]"=&r"(n), [n1]"=&r"(n1)
|
|
|
|
:
|
|
|
|
: "memory"
|
|
|
|
);
|
|
|
|
res->last = temp2;
|
|
|
|
res->coeffs = coeffs;
|
|
|
|
}
|
|
|
|
|
2015-02-07 11:13:26 +01:00
|
|
|
#endif // WEBP_USE_MIPS32
|
|
|
|
|
|
|
|
//------------------------------------------------------------------------------
|
|
|
|
// Entry point
|
|
|
|
|
|
|
|
extern WEBP_TSAN_IGNORE_FUNCTION void VP8EncDspCostInitMIPS32(void);
|
|
|
|
|
2015-02-10 07:39:14 +01:00
|
|
|
void WEBP_TSAN_IGNORE_FUNCTION VP8EncDspCostInitMIPS32(void) {
|
2015-02-07 11:13:26 +01:00
|
|
|
#if defined(WEBP_USE_MIPS32)
|
|
|
|
VP8GetResidualCost = GetResidualCost;
|
2015-02-09 10:56:23 +01:00
|
|
|
VP8SetResidualCoeffs = SetResidualCoeffs;
|
2015-02-07 11:13:26 +01:00
|
|
|
#endif // WEBP_USE_MIPS32
|
|
|
|
}
|
|
|
|
|
|
|
|
//------------------------------------------------------------------------------
|