292 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			292 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
 | 
						|
 *
 | 
						|
 * This source code is subject to the terms of the BSD 2 Clause License and
 | 
						|
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 | 
						|
 * was not distributed with this source code in the LICENSE file, you can
 | 
						|
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 | 
						|
 * Media Patent License 1.0 was not distributed with this source code in the
 | 
						|
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 | 
						|
 */
 | 
						|
#include "aom_dsp/bitwriter.h"
 | 
						|
 | 
						|
#include "av1/common/common.h"
 | 
						|
#include "av1/common/entropy.h"
 | 
						|
#include "av1/encoder/cost.h"
 | 
						|
#include "av1/encoder/subexp.h"
 | 
						|
 | 
						|
#define av1_cost_upd256 ((int)(av1_cost_one(upd) - av1_cost_zero(upd)))
 | 
						|
 | 
						|
static const uint8_t update_bits[255] = {
 | 
						|
  5,  5,  5,  5,  5,  5,  5,  5,  5,  5,  5,  5,  5,  5,  5,  5,  6,  6,  6,
 | 
						|
  6,  6,  6,  6,  6,  6,  6,  6,  6,  6,  6,  6,  6,  8,  8,  8,  8,  8,  8,
 | 
						|
  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,  8,
 | 
						|
  8,  8,  8,  8,  8,  8,  8,  10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10,
 | 
						|
  10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10,
 | 
						|
  10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10,
 | 
						|
  10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 10, 11, 11, 11,
 | 
						|
  11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
 | 
						|
  11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
 | 
						|
  11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
 | 
						|
  11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
 | 
						|
  11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
 | 
						|
  11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
 | 
						|
  11, 11, 11, 11, 11, 11, 11, 0,
 | 
						|
};
 | 
						|
 | 
						|
static int recenter_nonneg(int v, int m) {
 | 
						|
  if (v > (m << 1))
 | 
						|
    return v;
 | 
						|
  else if (v >= m)
 | 
						|
    return ((v - m) << 1);
 | 
						|
  else
 | 
						|
    return ((m - v) << 1) - 1;
 | 
						|
}
 | 
						|
 | 
						|
static int remap_prob(int v, int m) {
 | 
						|
  int i;
 | 
						|
  static const uint8_t map_table[MAX_PROB - 1] = {
 | 
						|
    // generated by:
 | 
						|
    //   map_table[j] = split_index(j, MAX_PROB - 1, MODULUS_PARAM);
 | 
						|
    20,  21,  22,  23,  24,  25,  0,   26,  27,  28,  29,  30,  31,  32,  33,
 | 
						|
    34,  35,  36,  37,  1,   38,  39,  40,  41,  42,  43,  44,  45,  46,  47,
 | 
						|
    48,  49,  2,   50,  51,  52,  53,  54,  55,  56,  57,  58,  59,  60,  61,
 | 
						|
    3,   62,  63,  64,  65,  66,  67,  68,  69,  70,  71,  72,  73,  4,   74,
 | 
						|
    75,  76,  77,  78,  79,  80,  81,  82,  83,  84,  85,  5,   86,  87,  88,
 | 
						|
    89,  90,  91,  92,  93,  94,  95,  96,  97,  6,   98,  99,  100, 101, 102,
 | 
						|
    103, 104, 105, 106, 107, 108, 109, 7,   110, 111, 112, 113, 114, 115, 116,
 | 
						|
    117, 118, 119, 120, 121, 8,   122, 123, 124, 125, 126, 127, 128, 129, 130,
 | 
						|
    131, 132, 133, 9,   134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144,
 | 
						|
    145, 10,  146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 11,
 | 
						|
    158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 12,  170, 171,
 | 
						|
    172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 13,  182, 183, 184, 185,
 | 
						|
    186, 187, 188, 189, 190, 191, 192, 193, 14,  194, 195, 196, 197, 198, 199,
 | 
						|
    200, 201, 202, 203, 204, 205, 15,  206, 207, 208, 209, 210, 211, 212, 213,
 | 
						|
    214, 215, 216, 217, 16,  218, 219, 220, 221, 222, 223, 224, 225, 226, 227,
 | 
						|
    228, 229, 17,  230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241,
 | 
						|
    18,  242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 19,
 | 
						|
  };
 | 
						|
  v--;
 | 
						|
  m--;
 | 
						|
  if ((m << 1) <= MAX_PROB)
 | 
						|
    i = recenter_nonneg(v, m) - 1;
 | 
						|
  else
 | 
						|
    i = recenter_nonneg(MAX_PROB - 1 - v, MAX_PROB - 1 - m) - 1;
 | 
						|
 | 
						|
  i = map_table[i];
 | 
						|
  return i;
 | 
						|
}
 | 
						|
 | 
						|
static int prob_diff_update_cost(aom_prob newp, aom_prob oldp) {
 | 
						|
  int delp = remap_prob(newp, oldp);
 | 
						|
  return update_bits[delp] << AV1_PROB_COST_SHIFT;
 | 
						|
}
 | 
						|
 | 
						|
static void encode_uniform(aom_writer *w, int v) {
 | 
						|
  const int l = 8;
 | 
						|
  const int m = (1 << l) - 190;
 | 
						|
  if (v < m) {
 | 
						|
    aom_write_literal(w, v, l - 1);
 | 
						|
  } else {
 | 
						|
    aom_write_literal(w, m + ((v - m) >> 1), l - 1);
 | 
						|
    aom_write_literal(w, (v - m) & 1, 1);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
static INLINE int write_bit_gte(aom_writer *w, int word, int test) {
 | 
						|
  aom_write_literal(w, word >= test, 1);
 | 
						|
  return word >= test;
 | 
						|
}
 | 
						|
 | 
						|
static void encode_term_subexp(aom_writer *w, int word) {
 | 
						|
  if (!write_bit_gte(w, word, 16)) {
 | 
						|
    aom_write_literal(w, word, 4);
 | 
						|
  } else if (!write_bit_gte(w, word, 32)) {
 | 
						|
    aom_write_literal(w, word - 16, 4);
 | 
						|
  } else if (!write_bit_gte(w, word, 64)) {
 | 
						|
    aom_write_literal(w, word - 32, 5);
 | 
						|
  } else {
 | 
						|
    encode_uniform(w, word - 64);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
void av1_write_prob_diff_update(aom_writer *w, aom_prob newp, aom_prob oldp) {
 | 
						|
  const int delp = remap_prob(newp, oldp);
 | 
						|
  encode_term_subexp(w, delp);
 | 
						|
}
 | 
						|
 | 
						|
int av1_prob_diff_update_savings_search(const unsigned int *ct, aom_prob oldp,
 | 
						|
                                        aom_prob *bestp, aom_prob upd) {
 | 
						|
  const uint32_t old_b = cost_branch256(ct, oldp);
 | 
						|
  int bestsavings = 0;
 | 
						|
  aom_prob newp, bestnewp = oldp;
 | 
						|
  const int step = *bestp > oldp ? -1 : 1;
 | 
						|
 | 
						|
  for (newp = *bestp; newp != oldp; newp += step) {
 | 
						|
    const uint32_t new_b = cost_branch256(ct, newp);
 | 
						|
    const uint32_t update_b =
 | 
						|
        prob_diff_update_cost(newp, oldp) + av1_cost_upd256;
 | 
						|
    const int savings = (int)((int64_t)old_b - new_b - update_b);
 | 
						|
    if (savings > bestsavings) {
 | 
						|
      bestsavings = savings;
 | 
						|
      bestnewp = newp;
 | 
						|
    }
 | 
						|
  }
 | 
						|
  *bestp = bestnewp;
 | 
						|
  return bestsavings;
 | 
						|
}
 | 
						|
 | 
						|
int av1_prob_diff_update_savings_search_model(const unsigned int *ct,
 | 
						|
                                              const aom_prob *oldp,
 | 
						|
                                              aom_prob *bestp, aom_prob upd,
 | 
						|
                                              int stepsize) {
 | 
						|
  int i, old_b, new_b, update_b, savings, bestsavings;
 | 
						|
  int newp;
 | 
						|
  const int step_sign = *bestp > oldp[PIVOT_NODE] ? -1 : 1;
 | 
						|
  const int step = stepsize * step_sign;
 | 
						|
  aom_prob bestnewp, newplist[ENTROPY_NODES], oldplist[ENTROPY_NODES];
 | 
						|
  av1_model_to_full_probs(oldp, oldplist);
 | 
						|
  memcpy(newplist, oldp, sizeof(aom_prob) * UNCONSTRAINED_NODES);
 | 
						|
  for (i = UNCONSTRAINED_NODES, old_b = 0; i < ENTROPY_NODES; ++i)
 | 
						|
    old_b += cost_branch256(ct + 2 * i, oldplist[i]);
 | 
						|
  old_b += cost_branch256(ct + 2 * PIVOT_NODE, oldplist[PIVOT_NODE]);
 | 
						|
 | 
						|
  bestsavings = 0;
 | 
						|
  bestnewp = oldp[PIVOT_NODE];
 | 
						|
 | 
						|
  assert(stepsize > 0);
 | 
						|
 | 
						|
  for (newp = *bestp; (newp - oldp[PIVOT_NODE]) * step_sign < 0; newp += step) {
 | 
						|
    if (newp < 1 || newp > 255) continue;
 | 
						|
    newplist[PIVOT_NODE] = newp;
 | 
						|
    av1_model_to_full_probs(newplist, newplist);
 | 
						|
    for (i = UNCONSTRAINED_NODES, new_b = 0; i < ENTROPY_NODES; ++i)
 | 
						|
      new_b += cost_branch256(ct + 2 * i, newplist[i]);
 | 
						|
    new_b += cost_branch256(ct + 2 * PIVOT_NODE, newplist[PIVOT_NODE]);
 | 
						|
    update_b = prob_diff_update_cost(newp, oldp[PIVOT_NODE]) + av1_cost_upd256;
 | 
						|
    savings = old_b - new_b - update_b;
 | 
						|
    if (savings > bestsavings) {
 | 
						|
      bestsavings = savings;
 | 
						|
      bestnewp = newp;
 | 
						|
    }
 | 
						|
  }
 | 
						|
 | 
						|
  *bestp = bestnewp;
 | 
						|
  return bestsavings;
 | 
						|
}
 | 
						|
 | 
						|
#if CONFIG_ENTROPY
 | 
						|
static int get_cost(unsigned int ct[][2], aom_prob p, int n) {
 | 
						|
  int i, p0 = p;
 | 
						|
  unsigned int total_ct[2] = { 0, 0 };
 | 
						|
  int cost = 0;
 | 
						|
 | 
						|
  for (i = 0; i <= n; ++i) {
 | 
						|
    cost += cost_branch256(ct[i], p);
 | 
						|
    total_ct[0] += ct[i][0];
 | 
						|
    total_ct[1] += ct[i][1];
 | 
						|
    if (i < n)
 | 
						|
      p = av1_merge_probs(p0, total_ct, COEF_COUNT_SAT_BITS,
 | 
						|
                          COEF_MAX_UPDATE_FACTOR_BITS);
 | 
						|
  }
 | 
						|
  return cost;
 | 
						|
}
 | 
						|
 | 
						|
int av1_prob_update_search_subframe(unsigned int ct[][2], aom_prob oldp,
 | 
						|
                                    aom_prob *bestp, aom_prob upd, int n) {
 | 
						|
  const int old_b = get_cost(ct, oldp, n);
 | 
						|
  int bestsavings = 0;
 | 
						|
  aom_prob newp, bestnewp = oldp;
 | 
						|
  const int step = *bestp > oldp ? -1 : 1;
 | 
						|
 | 
						|
  for (newp = *bestp; newp != oldp; newp += step) {
 | 
						|
    const int new_b = get_cost(ct, newp, n);
 | 
						|
    const int update_b = prob_diff_update_cost(newp, oldp) + av1_cost_upd256;
 | 
						|
    const int savings = old_b - new_b - update_b;
 | 
						|
    if (savings > bestsavings) {
 | 
						|
      bestsavings = savings;
 | 
						|
      bestnewp = newp;
 | 
						|
    }
 | 
						|
  }
 | 
						|
  *bestp = bestnewp;
 | 
						|
  return bestsavings;
 | 
						|
}
 | 
						|
 | 
						|
int av1_prob_update_search_model_subframe(unsigned int ct[ENTROPY_NODES]
 | 
						|
                                                         [COEF_PROBS_BUFS][2],
 | 
						|
                                          const aom_prob *oldp, aom_prob *bestp,
 | 
						|
                                          aom_prob upd, int stepsize, int n) {
 | 
						|
  int i, old_b, new_b, update_b, savings, bestsavings;
 | 
						|
  int newp;
 | 
						|
  const int step_sign = *bestp > oldp[PIVOT_NODE] ? -1 : 1;
 | 
						|
  const int step = stepsize * step_sign;
 | 
						|
  aom_prob bestnewp, newplist[ENTROPY_NODES], oldplist[ENTROPY_NODES];
 | 
						|
  av1_model_to_full_probs(oldp, oldplist);
 | 
						|
  memcpy(newplist, oldp, sizeof(aom_prob) * UNCONSTRAINED_NODES);
 | 
						|
  for (i = UNCONSTRAINED_NODES, old_b = 0; i < ENTROPY_NODES; ++i)
 | 
						|
    old_b += get_cost(ct[i], oldplist[i], n);
 | 
						|
  old_b += get_cost(ct[PIVOT_NODE], oldplist[PIVOT_NODE], n);
 | 
						|
 | 
						|
  bestsavings = 0;
 | 
						|
  bestnewp = oldp[PIVOT_NODE];
 | 
						|
 | 
						|
  assert(stepsize > 0);
 | 
						|
 | 
						|
  for (newp = *bestp; (newp - oldp[PIVOT_NODE]) * step_sign < 0; newp += step) {
 | 
						|
    if (newp < 1 || newp > 255) continue;
 | 
						|
    newplist[PIVOT_NODE] = newp;
 | 
						|
    av1_model_to_full_probs(newplist, newplist);
 | 
						|
    for (i = UNCONSTRAINED_NODES, new_b = 0; i < ENTROPY_NODES; ++i)
 | 
						|
      new_b += get_cost(ct[i], newplist[i], n);
 | 
						|
    new_b += get_cost(ct[PIVOT_NODE], newplist[PIVOT_NODE], n);
 | 
						|
    update_b = prob_diff_update_cost(newp, oldp[PIVOT_NODE]) + av1_cost_upd256;
 | 
						|
    savings = old_b - new_b - update_b;
 | 
						|
    if (savings > bestsavings) {
 | 
						|
      bestsavings = savings;
 | 
						|
      bestnewp = newp;
 | 
						|
    }
 | 
						|
  }
 | 
						|
 | 
						|
  *bestp = bestnewp;
 | 
						|
  return bestsavings;
 | 
						|
}
 | 
						|
#endif  // CONFIG_ENTROPY
 | 
						|
 | 
						|
void av1_cond_prob_diff_update(aom_writer *w, aom_prob *oldp,
 | 
						|
                               const unsigned int ct[2]) {
 | 
						|
  const aom_prob upd = DIFF_UPDATE_PROB;
 | 
						|
  aom_prob newp = get_binary_prob(ct[0], ct[1]);
 | 
						|
  const int savings =
 | 
						|
      av1_prob_diff_update_savings_search(ct, *oldp, &newp, upd);
 | 
						|
  assert(newp >= 1);
 | 
						|
  if (savings > 0) {
 | 
						|
    aom_write(w, 1, upd);
 | 
						|
    av1_write_prob_diff_update(w, newp, *oldp);
 | 
						|
    *oldp = newp;
 | 
						|
  } else {
 | 
						|
    aom_write(w, 0, upd);
 | 
						|
  }
 | 
						|
}
 | 
						|
 | 
						|
int av1_cond_prob_diff_update_savings(aom_prob *oldp,
 | 
						|
                                      const unsigned int ct[2]) {
 | 
						|
  const aom_prob upd = DIFF_UPDATE_PROB;
 | 
						|
  aom_prob newp = get_binary_prob(ct[0], ct[1]);
 | 
						|
  const int savings =
 | 
						|
      av1_prob_diff_update_savings_search(ct, *oldp, &newp, upd);
 | 
						|
  return savings;
 | 
						|
}
 | 
						|
 | 
						|
void aom_write_primitive_symmetric(aom_writer *w, int word,
 | 
						|
                                   unsigned int abs_bits) {
 | 
						|
  if (word == 0) {
 | 
						|
    aom_write_bit(w, 0);
 | 
						|
  } else {
 | 
						|
    const int x = abs(word);
 | 
						|
    const int s = word < 0;
 | 
						|
    aom_write_bit(w, 1);
 | 
						|
    aom_write_bit(w, s);
 | 
						|
    aom_write_literal(w, x - 1, abs_bits);
 | 
						|
  }
 | 
						|
}
 |