You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

202 lines
5.1KB

  1. /*
  2. * Copyright (C) 2007 Marco Gerards <marco@gnu.org>
  3. * Copyright (C) 2009 David Conrad
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * Arithmetic decoder for Dirac
  24. * @author Marco Gerards <marco@gnu.org>
  25. */
  26. #ifndef AVCODEC_DIRAC_ARITH_H
  27. #define AVCODEC_DIRAC_ARITH_H
  28. #include "libavutil/x86/asm.h"
  29. #include "bytestream.h"
  30. #include "get_bits.h"
  31. enum dirac_arith_contexts {
  32. CTX_ZPZN_F1,
  33. CTX_ZPNN_F1,
  34. CTX_NPZN_F1,
  35. CTX_NPNN_F1,
  36. CTX_ZP_F2,
  37. CTX_ZP_F3,
  38. CTX_ZP_F4,
  39. CTX_ZP_F5,
  40. CTX_ZP_F6,
  41. CTX_NP_F2,
  42. CTX_NP_F3,
  43. CTX_NP_F4,
  44. CTX_NP_F5,
  45. CTX_NP_F6,
  46. CTX_COEFF_DATA,
  47. CTX_SIGN_NEG,
  48. CTX_SIGN_ZERO,
  49. CTX_SIGN_POS,
  50. CTX_ZERO_BLOCK,
  51. CTX_DELTA_Q_F,
  52. CTX_DELTA_Q_DATA,
  53. CTX_DELTA_Q_SIGN,
  54. DIRAC_CTX_COUNT
  55. };
  56. // Dirac resets the arith decoder between decoding various types of data,
  57. // so many contexts are never used simultaneously. Thus, we can reduce
  58. // the number of contexts needed by reusing them.
  59. #define CTX_SB_F1 CTX_ZP_F5
  60. #define CTX_SB_DATA 0
  61. #define CTX_PMODE_REF1 0
  62. #define CTX_PMODE_REF2 1
  63. #define CTX_GLOBAL_BLOCK 2
  64. #define CTX_MV_F1 CTX_ZP_F2
  65. #define CTX_MV_DATA 0
  66. #define CTX_DC_F1 CTX_ZP_F5
  67. #define CTX_DC_DATA 0
/**
 * State of the Dirac arithmetic decoder.
 *
 * All fields are read and written by the inline helpers in this header
 * (renorm(), refill(), dirac_get_arith_bit() and the integer readers).
 */
typedef struct {
    // Code-value register: dirac_get_arith_bit() compares (low >> 16) with
    // the scaled range, and refill() adds freshly read input bits into it.
    unsigned low;
    // Width of the current coding interval; renorm() doubles it until it
    // exceeds 0x4000.
    uint16_t range;
    // Shift bookkeeping: renorm() adds the number of left shifts performed;
    // once the value is >= 0, refill() loads 16 more bits and subtracts 16.
    int16_t counter;
    // Read cursor: refill() takes the next big-endian 16-bit word from here.
    const uint8_t *bytestream;
    // End of the input as seen by refill(); the cursor is clamped back to
    // this pointer whenever a read moves past it.
    const uint8_t *bytestream_end;
    // Per-context adaptive state, used as prob_zero (scaled by 1 << 16) in
    // dirac_get_arith_bit().
    uint16_t contexts[DIRAC_CTX_COUNT];
    // Set to AVERROR_INVALIDDATA by refill() after more than 4 overreads and
    // by dirac_get_arith_uint() on overflow; not cleared by this header.
    int error;
    // Number of refill() calls that moved the cursor past bytestream_end.
    int overread;
} DiracArith;
// Successor table for follow contexts: dirac_get_arith_uint() replaces
// follow_ctx with ff_dirac_next_ctx[follow_ctx] after every data bit.
extern const uint8_t ff_dirac_next_ctx[DIRAC_CTX_COUNT];
// Probability adjustment table: dirac_get_arith_bit() adds
// ff_dirac_prob_branchless[prob_zero >> 8][bit] to the context it just used.
// NOTE(review): presumably populated by ff_dirac_init_arith_tables() — confirm.
extern int16_t ff_dirac_prob_branchless[256][2];
  80. static inline void renorm(DiracArith *c)
  81. {
  82. #if HAVE_FAST_CLZ
  83. int shift = 14 - av_log2_16bit(c->range-1) + ((c->range-1)>>15);
  84. c->low <<= shift;
  85. c->range <<= shift;
  86. c->counter += shift;
  87. #else
  88. while (c->range <= 0x4000) {
  89. c->low <<= 1;
  90. c->range <<= 1;
  91. c->counter++;
  92. }
  93. #endif
  94. }
  95. static inline void refill(DiracArith *c)
  96. {
  97. int counter = c->counter;
  98. if (counter >= 0) {
  99. int new = bytestream_get_be16(&c->bytestream);
  100. // the spec defines overread bits to be 1, and streams rely on this
  101. if (c->bytestream > c->bytestream_end) {
  102. new |= 0xff;
  103. if (c->bytestream > c->bytestream_end+1)
  104. new |= 0xff00;
  105. c->bytestream = c->bytestream_end;
  106. c->overread ++;
  107. if (c->overread > 4)
  108. c->error = AVERROR_INVALIDDATA;
  109. }
  110. c->low += new << counter;
  111. counter -= 16;
  112. }
  113. c->counter = counter;
  114. }
/**
 * Decode one binary symbol using the adaptive context ctx.
 *
 * The interval is split at range_times_prob = (range * prob_zero) >> 16.
 * When (low >> 16) is below the split the symbol is 0 and range becomes
 * range_times_prob. Otherwise the symbol is 1 and the split is subtracted
 * from range and, shifted left by 16, from low. Afterwards the context is
 * adjusted via ff_dirac_prob_branchless, and the decoder is renormalized
 * and refilled.
 *
 * @param c   decoder state, updated in place
 * @param ctx index into c->contexts; it is not range-checked here
 * @return the decoded bit (0 or 1)
 */
static inline int dirac_get_arith_bit(DiracArith *c, int ctx)
{
    int prob_zero = c->contexts[ctx];
    int range_times_prob, bit;
    unsigned low = c->low;
    int range = c->range;
    // NOTE(review): this is a signed int multiplication of two values that
    // can each be as large as 0xFFFF; confirm that the decoder's invariants
    // keep the product within INT_MAX.
    range_times_prob = (c->range * prob_zero) >> 16;
#if ARCH_X86 && HAVE_FAST_CMOV && HAVE_INLINE_ASM && HAVE_6REGS
    // Branchless variant: apply the "bit is 1" update unconditionally, then
    // compare (c->low >> 16) with range_times_prob. setae stores the result
    // of that unsigned >= comparison in bit; when it is "below", the two
    // cmovb instructions restore low from c->low and set range to
    // range_times_prob, matching the else-branch of the C path.
    low -= range_times_prob << 16;
    range -= range_times_prob;
    bit = 0;
    __asm__(
        "cmpl %5, %4 \n\t"
        "setae %b0 \n\t"
        "cmovb %3, %2 \n\t"
        "cmovb %5, %1 \n\t"
        : "+q"(bit), "+r"(range), "+r"(low)
        : "r"(c->low), "r"(c->low>>16),
          "r"(range_times_prob)
    );
#else
    bit = (low >> 16) >= range_times_prob;
    if (bit) {
        low -= range_times_prob << 16;
        range -= range_times_prob;
    } else {
        range = range_times_prob;
    }
#endif
    // Adapt the context: the table row is selected by the top 8 bits of the
    // old probability, the column by the bit just decoded.
    c->contexts[ctx] += ff_dirac_prob_branchless[prob_zero>>8][bit];
    c->low = low;
    c->range = range;
    renorm(c);
    refill(c);
    return bit;
}
  151. static inline int dirac_get_arith_uint(DiracArith *c, int follow_ctx, int data_ctx)
  152. {
  153. int ret = 1;
  154. while (!dirac_get_arith_bit(c, follow_ctx)) {
  155. if (ret >= 0x40000000) {
  156. av_log(NULL, AV_LOG_ERROR, "dirac_get_arith_uint overflow\n");
  157. c->error = AVERROR_INVALIDDATA;
  158. return -1;
  159. }
  160. ret <<= 1;
  161. ret += dirac_get_arith_bit(c, data_ctx);
  162. follow_ctx = ff_dirac_next_ctx[follow_ctx];
  163. }
  164. return ret-1;
  165. }
  166. static inline int dirac_get_arith_int(DiracArith *c, int follow_ctx, int data_ctx)
  167. {
  168. int ret = dirac_get_arith_uint(c, follow_ctx, data_ctx);
  169. if (ret && dirac_get_arith_bit(c, data_ctx+1))
  170. ret = -ret;
  171. return ret;
  172. }
// Defined outside this header.
// NOTE(review): presumably fills the shared lookup tables such as
// ff_dirac_prob_branchless before any decoding — confirm.
void ff_dirac_init_arith_tables(void);
// Defined outside this header.
// NOTE(review): presumably prepares c to decode `length` units of input
// taken from gb — confirm the unit of `length` and which fields are reset.
void ff_dirac_init_arith_decoder(DiracArith *c, GetBitContext *gb, int length);
  175. #endif /* AVCODEC_DIRAC_ARITH_H */