You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

199 lines
5.0KB

  1. /*
  2. * Copyright (C) 2007 Marco Gerards <marco@gnu.org>
  3. * Copyright (C) 2009 David Conrad
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * Arithmetic decoder for Dirac
  24. * @author Marco Gerards <marco@gnu.org>
  25. */
  26. #ifndef AVCODEC_DIRAC_ARITH_H
  27. #define AVCODEC_DIRAC_ARITH_H
  28. #include "libavutil/x86/asm.h"
  29. #include "bytestream.h"
  30. #include "get_bits.h"
  31. enum dirac_arith_contexts {
  32. CTX_ZPZN_F1,
  33. CTX_ZPNN_F1,
  34. CTX_NPZN_F1,
  35. CTX_NPNN_F1,
  36. CTX_ZP_F2,
  37. CTX_ZP_F3,
  38. CTX_ZP_F4,
  39. CTX_ZP_F5,
  40. CTX_ZP_F6,
  41. CTX_NP_F2,
  42. CTX_NP_F3,
  43. CTX_NP_F4,
  44. CTX_NP_F5,
  45. CTX_NP_F6,
  46. CTX_COEFF_DATA,
  47. CTX_SIGN_NEG,
  48. CTX_SIGN_ZERO,
  49. CTX_SIGN_POS,
  50. CTX_ZERO_BLOCK,
  51. CTX_DELTA_Q_F,
  52. CTX_DELTA_Q_DATA,
  53. CTX_DELTA_Q_SIGN,
  54. DIRAC_CTX_COUNT
  55. };
  56. // Dirac resets the arith decoder between decoding various types of data,
  57. // so many contexts are never used simultaneously. Thus, we can reduce
  58. // the number of contexts needed by reusing them.
  59. #define CTX_SB_F1 CTX_ZP_F5
  60. #define CTX_SB_DATA 0
  61. #define CTX_PMODE_REF1 0
  62. #define CTX_PMODE_REF2 1
  63. #define CTX_GLOBAL_BLOCK 2
  64. #define CTX_MV_F1 CTX_ZP_F2
  65. #define CTX_MV_DATA 0
  66. #define CTX_DC_F1 CTX_ZP_F5
  67. #define CTX_DC_DATA 0
  68. typedef struct {
  69. unsigned low;
  70. uint16_t range;
  71. int16_t counter;
  72. const uint8_t *bytestream;
  73. const uint8_t *bytestream_end;
  74. uint16_t contexts[DIRAC_CTX_COUNT];
  75. int error;
  76. } DiracArith;
  77. extern const uint8_t ff_dirac_next_ctx[DIRAC_CTX_COUNT];
  78. extern const uint16_t ff_dirac_prob[256];
  79. extern int16_t ff_dirac_prob_branchless[256][2];
  80. static inline void renorm(DiracArith *c)
  81. {
  82. #if HAVE_FAST_CLZ
  83. int shift = 14 - av_log2_16bit(c->range-1) + ((c->range-1)>>15);
  84. c->low <<= shift;
  85. c->range <<= shift;
  86. c->counter += shift;
  87. #else
  88. while (c->range <= 0x4000) {
  89. c->low <<= 1;
  90. c->range <<= 1;
  91. c->counter++;
  92. }
  93. #endif
  94. }
  95. static inline void refill(DiracArith *c)
  96. {
  97. int counter = c->counter;
  98. if (counter >= 0) {
  99. int new = bytestream_get_be16(&c->bytestream);
  100. // the spec defines overread bits to be 1, and streams rely on this
  101. if (c->bytestream > c->bytestream_end) {
  102. new |= 0xff;
  103. if (c->bytestream > c->bytestream_end+1)
  104. new |= 0xff00;
  105. c->bytestream = c->bytestream_end;
  106. }
  107. c->low += new << counter;
  108. counter -= 16;
  109. }
  110. c->counter = counter;
  111. }
  112. static inline int dirac_get_arith_bit(DiracArith *c, int ctx)
  113. {
  114. int prob_zero = c->contexts[ctx];
  115. int range_times_prob, bit;
  116. unsigned low = c->low;
  117. int range = c->range;
  118. range_times_prob = (c->range * prob_zero) >> 16;
  119. #if ARCH_X86 && HAVE_FAST_CMOV && HAVE_INLINE_ASM && HAVE_6REGS
  120. low -= range_times_prob << 16;
  121. range -= range_times_prob;
  122. bit = 0;
  123. __asm__(
  124. "cmpl %5, %4 \n\t"
  125. "setae %b0 \n\t"
  126. "cmovb %3, %2 \n\t"
  127. "cmovb %5, %1 \n\t"
  128. : "+q"(bit), "+r"(range), "+r"(low)
  129. : "r"(c->low), "r"(c->low>>16),
  130. "r"(range_times_prob)
  131. );
  132. #else
  133. bit = (low >> 16) >= range_times_prob;
  134. if (bit) {
  135. low -= range_times_prob << 16;
  136. range -= range_times_prob;
  137. } else {
  138. range = range_times_prob;
  139. }
  140. #endif
  141. c->contexts[ctx] += ff_dirac_prob_branchless[prob_zero>>8][bit];
  142. c->low = low;
  143. c->range = range;
  144. renorm(c);
  145. refill(c);
  146. return bit;
  147. }
  148. static inline int dirac_get_arith_uint(DiracArith *c, int follow_ctx, int data_ctx)
  149. {
  150. int ret = 1;
  151. while (!dirac_get_arith_bit(c, follow_ctx)) {
  152. if (ret >= 0x40000000) {
  153. av_log(NULL, AV_LOG_ERROR, "dirac_get_arith_uint overflow\n");
  154. c->error = AVERROR_INVALIDDATA;
  155. return -1;
  156. }
  157. ret <<= 1;
  158. ret += dirac_get_arith_bit(c, data_ctx);
  159. follow_ctx = ff_dirac_next_ctx[follow_ctx];
  160. }
  161. return ret-1;
  162. }
  163. static inline int dirac_get_arith_int(DiracArith *c, int follow_ctx, int data_ctx)
  164. {
  165. int ret = dirac_get_arith_uint(c, follow_ctx, data_ctx);
  166. if (ret && dirac_get_arith_bit(c, data_ctx+1))
  167. ret = -ret;
  168. return ret;
  169. }
  170. void ff_dirac_init_arith_tables(void);
  171. void ff_dirac_init_arith_decoder(DiracArith *c, GetBitContext *gb, int length);
  172. #endif /* AVCODEC_DIRAC_ARITH_H */