2
0

dirac_arith.h 4.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196
  1. /*
  2. * Copyright (C) 2007 Marco Gerards <marco@gnu.org>
  3. * Copyright (C) 2009 David Conrad
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * Arithmetic decoder for Dirac
  24. * @author Marco Gerards <marco@gnu.org>
  25. */
  26. #ifndef AVCODEC_DIRAC_ARITH_H
  27. #define AVCODEC_DIRAC_ARITH_H
  28. #include "libavutil/x86/asm.h"
  29. #include "bytestream.h"
  30. #include "get_bits.h"
  /**
   * Indices of the adaptive probability contexts kept in DiracArith.contexts[].
   *
   * The enumerators are consecutive starting at 0; DIRAC_CTX_COUNT is the
   * number of slots and is used to size the context and next-context tables.
   *
   * NOTE(review): the abbreviations presumably follow the Dirac specification
   * (ZP/NP = zero / non-zero parent, ZN/NN = zero / non-zero neighbourhood,
   * Fn = n-th follow bit) -- confirm against the spec.
   */
  enum dirac_arith_contexts {
      /* follow-bit contexts */
      CTX_ZPZN_F1,
      CTX_ZPNN_F1,
      CTX_NPZN_F1,
      CTX_NPNN_F1,
      CTX_ZP_F2,
      CTX_ZP_F3,
      CTX_ZP_F4,
      CTX_ZP_F5,
      CTX_ZP_F6,
      CTX_NP_F2,
      CTX_NP_F3,
      CTX_NP_F4,
      CTX_NP_F5,
      CTX_NP_F6,
      /* coefficient data and sign contexts */
      CTX_COEFF_DATA,
      CTX_SIGN_NEG,
      CTX_SIGN_ZERO,
      CTX_SIGN_POS,
      CTX_ZERO_BLOCK,
      /* quantiser delta contexts */
      CTX_DELTA_Q_F,
      CTX_DELTA_Q_DATA,
      CTX_DELTA_Q_SIGN,

      /* number of context slots; must stay last */
      DIRAC_CTX_COUNT
  };
  // Dirac resets the arithmetic decoder between decoding the various types
  // of data, so many contexts are never in use at the same time. Thus we can
  // reduce the number of contexts needed by reusing the same slots under
  // different names.

  // superblock split contexts
  #define CTX_SB_F1        CTX_ZP_F5
  #define CTX_SB_DATA      0

  // prediction mode / global motion contexts
  #define CTX_PMODE_REF1   0
  #define CTX_PMODE_REF2   1
  #define CTX_GLOBAL_BLOCK 2

  // motion vector contexts
  #define CTX_MV_F1        CTX_ZP_F2
  #define CTX_MV_DATA      0

  // DC value contexts
  #define CTX_DC_F1        CTX_ZP_F5
  #define CTX_DC_DATA      0
  68. typedef struct {
  69. unsigned low;
  70. uint16_t range;
  71. int16_t counter;
  72. const uint8_t *bytestream;
  73. const uint8_t *bytestream_end;
  74. uint16_t contexts[DIRAC_CTX_COUNT];
  75. } DiracArith;
  76. extern const uint8_t ff_dirac_next_ctx[DIRAC_CTX_COUNT];
  77. extern const uint16_t ff_dirac_prob[256];
  78. extern int16_t ff_dirac_prob_branchless[256][2];
  79. static inline void renorm(DiracArith *c)
  80. {
  81. #if HAVE_FAST_CLZ
  82. int shift = 14 - av_log2_16bit(c->range-1) + ((c->range-1)>>15);
  83. c->low <<= shift;
  84. c->range <<= shift;
  85. c->counter += shift;
  86. #else
  87. while (c->range <= 0x4000) {
  88. c->low <<= 1;
  89. c->range <<= 1;
  90. c->counter++;
  91. }
  92. #endif
  93. }
  94. static inline void refill(DiracArith *c)
  95. {
  96. int counter = c->counter;
  97. if (counter >= 0) {
  98. int new = bytestream_get_be16(&c->bytestream);
  99. // the spec defines overread bits to be 1, and streams rely on this
  100. if (c->bytestream > c->bytestream_end) {
  101. new |= 0xff;
  102. if (c->bytestream > c->bytestream_end+1)
  103. new |= 0xff00;
  104. c->bytestream = c->bytestream_end;
  105. }
  106. c->low += new << counter;
  107. counter -= 16;
  108. }
  109. c->counter = counter;
  110. }
  111. static inline int dirac_get_arith_bit(DiracArith *c, int ctx)
  112. {
  113. int prob_zero = c->contexts[ctx];
  114. int range_times_prob, bit;
  115. unsigned low = c->low;
  116. int range = c->range;
  117. range_times_prob = (c->range * prob_zero) >> 16;
  118. #if ARCH_X86 && HAVE_FAST_CMOV && HAVE_INLINE_ASM && HAVE_6REGS
  119. low -= range_times_prob << 16;
  120. range -= range_times_prob;
  121. bit = 0;
  122. __asm__(
  123. "cmpl %5, %4 \n\t"
  124. "setae %b0 \n\t"
  125. "cmovb %3, %2 \n\t"
  126. "cmovb %5, %1 \n\t"
  127. : "+q"(bit), "+r"(range), "+r"(low)
  128. : "r"(c->low), "r"(c->low>>16),
  129. "r"(range_times_prob)
  130. );
  131. #else
  132. bit = (low >> 16) >= range_times_prob;
  133. if (bit) {
  134. low -= range_times_prob << 16;
  135. range -= range_times_prob;
  136. } else {
  137. range = range_times_prob;
  138. }
  139. #endif
  140. c->contexts[ctx] += ff_dirac_prob_branchless[prob_zero>>8][bit];
  141. c->low = low;
  142. c->range = range;
  143. renorm(c);
  144. refill(c);
  145. return bit;
  146. }
  147. static inline int dirac_get_arith_uint(DiracArith *c, int follow_ctx, int data_ctx)
  148. {
  149. int ret = 1;
  150. while (!dirac_get_arith_bit(c, follow_ctx)) {
  151. if (ret >= 0x40000000) {
  152. av_log(NULL, AV_LOG_ERROR, "dirac_get_arith_uint overflow\n");
  153. return -1;
  154. }
  155. ret <<= 1;
  156. ret += dirac_get_arith_bit(c, data_ctx);
  157. follow_ctx = ff_dirac_next_ctx[follow_ctx];
  158. }
  159. return ret-1;
  160. }
  161. static inline int dirac_get_arith_int(DiracArith *c, int follow_ctx, int data_ctx)
  162. {
  163. int ret = dirac_get_arith_uint(c, follow_ctx, data_ctx);
  164. if (ret && dirac_get_arith_bit(c, data_ctx+1))
  165. ret = -ret;
  166. return ret;
  167. }
  168. void ff_dirac_init_arith_tables(void);
  169. void ff_dirac_init_arith_decoder(DiracArith *c, GetBitContext *gb, int length);
  170. #endif /* AVCODEC_DIRAC_ARITH_H */