You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

829 lines
26KB

  1. /*
  2. * This file is part of FFmpeg.
  3. *
  4. * FFmpeg is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * FFmpeg is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with FFmpeg; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. /**
  19. * @file
  20. * @brief IntraX8 (J-Frame) subdecoder, used by WMV2 and VC-1
  21. */
  22. #include "libavutil/avassert.h"
  23. #include "libavutil/thread.h"
  24. #include "avcodec.h"
  25. #include "get_bits.h"
  26. #include "idctdsp.h"
  27. #include "msmpeg4data.h"
  28. #include "intrax8huf.h"
  29. #include "intrax8.h"
  30. #include "intrax8dsp.h"
  31. #include "mpegutils.h"
  32. #define MAX_TABLE_DEPTH(table_bits, max_bits) \
  33. ((max_bits + table_bits - 1) / table_bits)
  34. #define DC_VLC_BITS 9
  35. #define AC_VLC_BITS 9
  36. #define OR_VLC_BITS 7
  37. #define DC_VLC_MTD MAX_TABLE_DEPTH(DC_VLC_BITS, MAX_DC_VLC_BITS)
  38. #define AC_VLC_MTD MAX_TABLE_DEPTH(AC_VLC_BITS, MAX_AC_VLC_BITS)
  39. #define OR_VLC_MTD MAX_TABLE_DEPTH(OR_VLC_BITS, MAX_OR_VLC_BITS)
  40. static VLC j_ac_vlc[2][2][8]; // [quant < 13], [intra / inter], [select]
  41. static VLC j_dc_vlc[2][8]; // [quant], [select]
  42. static VLC j_orient_vlc[2][4]; // [quant], [select]
  43. static av_cold void x8_vlc_init(void)
  44. {
  45. int i;
  46. int offset = 0;
  47. static VLC_TYPE table[28150][2];
  48. // set ac tables
  49. #define init_ac_vlc(dst, src) \
  50. do { \
  51. dst.table = &table[offset]; \
  52. dst.table_allocated = FF_ARRAY_ELEMS(table) - offset; \
  53. init_vlc(&dst, AC_VLC_BITS, 77, &src[1], 4, 2, &src[0], 4, 2, \
  54. INIT_VLC_STATIC_OVERLONG); \
  55. offset += dst.table_size; \
  56. } while(0)
  57. for (i = 0; i < 8; i++) {
  58. init_ac_vlc(j_ac_vlc[0][0][i], x8_ac0_highquant_table[i][0]);
  59. init_ac_vlc(j_ac_vlc[0][1][i], x8_ac1_highquant_table[i][0]);
  60. init_ac_vlc(j_ac_vlc[1][0][i], x8_ac0_lowquant_table[i][0]);
  61. init_ac_vlc(j_ac_vlc[1][1][i], x8_ac1_lowquant_table[i][0]);
  62. }
  63. #undef init_ac_vlc
  64. // set dc tables
  65. #define init_dc_vlc(dst, src) \
  66. do { \
  67. dst.table = &table[offset]; \
  68. dst.table_allocated = FF_ARRAY_ELEMS(table) - offset; \
  69. init_vlc(&dst, DC_VLC_BITS, 34, &src[1], 4, 2, &src[0], 4, 2, \
  70. INIT_VLC_STATIC_OVERLONG); \
  71. offset += dst.table_size; \
  72. } while(0)
  73. for (i = 0; i < 8; i++) {
  74. init_dc_vlc(j_dc_vlc[0][i], x8_dc_highquant_table[i][0]);
  75. init_dc_vlc(j_dc_vlc[1][i], x8_dc_lowquant_table[i][0]);
  76. }
  77. #undef init_dc_vlc
  78. // set orient tables
  79. #define init_or_vlc(dst, src) \
  80. do { \
  81. dst.table = &table[offset]; \
  82. dst.table_allocated = FF_ARRAY_ELEMS(table) - offset; \
  83. init_vlc(&dst, OR_VLC_BITS, 12, &src[1], 4, 2, &src[0], 4, 2, \
  84. INIT_VLC_STATIC_OVERLONG); \
  85. offset += dst.table_size; \
  86. } while(0)
  87. for (i = 0; i < 2; i++)
  88. init_or_vlc(j_orient_vlc[0][i], x8_orient_highquant_table[i][0]);
  89. for (i = 0; i < 4; i++)
  90. init_or_vlc(j_orient_vlc[1][i], x8_orient_lowquant_table[i][0]);
  91. #undef init_or_vlc
  92. av_assert2(offset == FF_ARRAY_ELEMS(table));
  93. }
  94. static void x8_reset_vlc_tables(IntraX8Context *w)
  95. {
  96. memset(w->j_dc_vlc, 0, sizeof(w->j_dc_vlc));
  97. memset(w->j_ac_vlc, 0, sizeof(w->j_ac_vlc));
  98. w->j_orient_vlc = NULL;
  99. }
  100. static inline void x8_select_ac_table(IntraX8Context *const w, int mode)
  101. {
  102. int table_index;
  103. av_assert2(mode < 4);
  104. if (w->j_ac_vlc[mode])
  105. return;
  106. table_index = get_bits(w->gb, 3);
  107. // 2 modes use same tables
  108. w->j_ac_vlc[mode] = &j_ac_vlc[w->quant < 13][mode >> 1][table_index];
  109. av_assert2(w->j_ac_vlc[mode]);
  110. }
  111. static inline int x8_get_orient_vlc(IntraX8Context *w)
  112. {
  113. if (!w->j_orient_vlc) {
  114. int table_index = get_bits(w->gb, 1 + (w->quant < 13));
  115. w->j_orient_vlc = &j_orient_vlc[w->quant < 13][table_index];
  116. }
  117. return get_vlc2(w->gb, w->j_orient_vlc->table, OR_VLC_BITS, OR_VLC_MTD);
  118. }
  119. #define extra_bits(eb) (eb) // 3 bits
  120. #define extra_run (0xFF << 8) // 1 bit
  121. #define extra_level (0x00 << 8) // 1 bit
  122. #define run_offset(r) ((r) << 16) // 6 bits
  123. #define level_offset(l) ((l) << 24) // 5 bits
  124. static const uint32_t ac_decode_table[] = {
  125. /* 46 */ extra_bits(3) | extra_run | run_offset(16) | level_offset(0),
  126. /* 47 */ extra_bits(3) | extra_run | run_offset(24) | level_offset(0),
  127. /* 48 */ extra_bits(2) | extra_run | run_offset(4) | level_offset(1),
  128. /* 49 */ extra_bits(3) | extra_run | run_offset(8) | level_offset(1),
  129. /* 50 */ extra_bits(5) | extra_run | run_offset(32) | level_offset(0),
  130. /* 51 */ extra_bits(4) | extra_run | run_offset(16) | level_offset(1),
  131. /* 52 */ extra_bits(2) | extra_level | run_offset(0) | level_offset(4),
  132. /* 53 */ extra_bits(2) | extra_level | run_offset(0) | level_offset(8),
  133. /* 54 */ extra_bits(2) | extra_level | run_offset(0) | level_offset(12),
  134. /* 55 */ extra_bits(3) | extra_level | run_offset(0) | level_offset(16),
  135. /* 56 */ extra_bits(3) | extra_level | run_offset(0) | level_offset(24),
  136. /* 57 */ extra_bits(2) | extra_level | run_offset(1) | level_offset(3),
  137. /* 58 */ extra_bits(3) | extra_level | run_offset(1) | level_offset(7),
  138. /* 59 */ extra_bits(2) | extra_run | run_offset(16) | level_offset(0),
  139. /* 60 */ extra_bits(2) | extra_run | run_offset(20) | level_offset(0),
  140. /* 61 */ extra_bits(2) | extra_run | run_offset(24) | level_offset(0),
  141. /* 62 */ extra_bits(2) | extra_run | run_offset(28) | level_offset(0),
  142. /* 63 */ extra_bits(4) | extra_run | run_offset(32) | level_offset(0),
  143. /* 64 */ extra_bits(4) | extra_run | run_offset(48) | level_offset(0),
  144. /* 65 */ extra_bits(2) | extra_run | run_offset(4) | level_offset(1),
  145. /* 66 */ extra_bits(3) | extra_run | run_offset(8) | level_offset(1),
  146. /* 67 */ extra_bits(4) | extra_run | run_offset(16) | level_offset(1),
  147. /* 68 */ extra_bits(2) | extra_level | run_offset(0) | level_offset(4),
  148. /* 69 */ extra_bits(3) | extra_level | run_offset(0) | level_offset(8),
  149. /* 70 */ extra_bits(4) | extra_level | run_offset(0) | level_offset(16),
  150. /* 71 */ extra_bits(2) | extra_level | run_offset(1) | level_offset(3),
  151. /* 72 */ extra_bits(3) | extra_level | run_offset(1) | level_offset(7),
  152. };
  153. #undef extra_bits
  154. #undef extra_run
  155. #undef extra_level
  156. #undef run_offset
  157. #undef level_offset
  158. static void x8_get_ac_rlf(IntraX8Context *const w, const int mode,
  159. int *const run, int *const level, int *const final)
  160. {
  161. int i, e;
  162. // x8_select_ac_table(w, mode);
  163. i = get_vlc2(w->gb, w->j_ac_vlc[mode]->table, AC_VLC_BITS, AC_VLC_MTD);
  164. if (i < 46) { // [0-45]
  165. int t, l;
  166. if (i < 0) {
  167. *level =
  168. *final = // prevent 'may be used uninitialized'
  169. *run = 64; // this would cause error exit in the ac loop
  170. return;
  171. }
  172. /*
  173. * i == 0-15 r = 0-15 l = 0; r = i & %01111
  174. * i == 16-19 r = 0-3 l = 1; r = i & %00011
  175. * i == 20-21 r = 0-1 l = 2; r = i & %00001
  176. * i == 22 r = 0 l = 3; r = i & %00000
  177. */
  178. *final =
  179. t = i > 22;
  180. i -= 23 * t;
  181. /* l = lut_l[i / 2] = { 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 2, 3 }[i >> 1];
  182. * 11 10'01 01'00 00'00 00'00 00'00 00 => 0xE50000 */
  183. l = (0xE50000 >> (i & 0x1E)) & 3; // 0x1E or ~1 or (i >> 1 << 1)
  184. /* t = lut_mask[l] = { 0x0f, 0x03, 0x01, 0x00 }[l];
  185. * as i < 256 the higher bits do not matter */
  186. t = 0x01030F >> (l << 3);
  187. *run = i & t;
  188. *level = l;
  189. } else if (i < 73) { // [46-72]
  190. uint32_t sm;
  191. uint32_t mask;
  192. i -= 46;
  193. sm = ac_decode_table[i];
  194. e = get_bits(w->gb, sm & 0xF);
  195. sm >>= 8; // 3 bits
  196. mask = sm & 0xff;
  197. sm >>= 8; // 1 bit
  198. *run = (sm & 0xff) + (e & mask); // 6 bits
  199. *level = (sm >> 8) + (e & ~mask); // 5 bits
  200. *final = i > (58 - 46);
  201. } else if (i < 75) { // [73-74]
  202. static const uint8_t crazy_mix_runlevel[32] = {
  203. 0x22, 0x32, 0x33, 0x53, 0x23, 0x42, 0x43, 0x63,
  204. 0x24, 0x52, 0x34, 0x73, 0x25, 0x62, 0x44, 0x83,
  205. 0x26, 0x72, 0x35, 0x54, 0x27, 0x82, 0x45, 0x64,
  206. 0x28, 0x92, 0x36, 0x74, 0x29, 0xa2, 0x46, 0x84,
  207. };
  208. *final = !(i & 1);
  209. e = get_bits(w->gb, 5); // get the extra bits
  210. *run = crazy_mix_runlevel[e] >> 4;
  211. *level = crazy_mix_runlevel[e] & 0x0F;
  212. } else {
  213. *level = get_bits(w->gb, 7 - 3 * (i & 1));
  214. *run = get_bits(w->gb, 6);
  215. *final = get_bits1(w->gb);
  216. }
  217. return;
  218. }
  219. /* static const uint8_t dc_extra_sbits[] = {
  220. * 0, 1, 1, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7,
  221. * }; */
  222. static const uint8_t dc_index_offset[] = {
  223. 0, 1, 2, 3, 4, 5, 7, 9, 13, 17, 25, 33, 49, 65, 97, 129, 193,
  224. };
  225. static int x8_get_dc_rlf(IntraX8Context *const w, const int mode,
  226. int *const level, int *const final)
  227. {
  228. int i, e, c;
  229. av_assert2(mode < 3);
  230. if (!w->j_dc_vlc[mode]) {
  231. int table_index = get_bits(w->gb, 3);
  232. // 4 modes, same table
  233. w->j_dc_vlc[mode] = &j_dc_vlc[w->quant < 13][table_index];
  234. }
  235. i = get_vlc2(w->gb, w->j_dc_vlc[mode]->table, DC_VLC_BITS, DC_VLC_MTD);
  236. /* (i >= 17) { i -= 17; final =1; } */
  237. c = i > 16;
  238. *final = c;
  239. i -= 17 * c;
  240. if (i <= 0) {
  241. *level = 0;
  242. return -i;
  243. }
  244. c = (i + 1) >> 1; // hackish way to calculate dc_extra_sbits[]
  245. c -= c > 1;
  246. e = get_bits(w->gb, c); // get the extra bits
  247. i = dc_index_offset[i] + (e >> 1);
  248. e = -(e & 1); // 0, 0xffffff
  249. *level = (i ^ e) - e; // (i ^ 0) - 0, (i ^ 0xff) - (-1)
  250. return 0;
  251. }
  252. // end of huffman
  253. static int x8_setup_spatial_predictor(IntraX8Context *const w, const int chroma)
  254. {
  255. int range;
  256. int sum;
  257. int quant;
  258. w->dsp.setup_spatial_compensation(w->dest[chroma], w->scratchpad,
  259. w->frame->linesize[chroma > 0],
  260. &range, &sum, w->edges);
  261. if (chroma) {
  262. w->orient = w->chroma_orient;
  263. quant = w->quant_dc_chroma;
  264. } else {
  265. quant = w->quant;
  266. }
  267. w->flat_dc = 0;
  268. if (range < quant || range < 3) {
  269. w->orient = 0;
  270. // yep you read right, a +-1 idct error may break decoding!
  271. if (range < 3) {
  272. w->flat_dc = 1;
  273. sum += 9;
  274. // ((1 << 17) + 9) / (8 + 8 + 1 + 2) = 6899
  275. w->predicted_dc = sum * 6899 >> 17;
  276. }
  277. }
  278. if (chroma)
  279. return 0;
  280. av_assert2(w->orient < 3);
  281. if (range < 2 * w->quant) {
  282. if ((w->edges & 3) == 0) {
  283. if (w->orient == 1)
  284. w->orient = 11;
  285. if (w->orient == 2)
  286. w->orient = 10;
  287. } else {
  288. w->orient = 0;
  289. }
  290. w->raw_orient = 0;
  291. } else {
  292. static const uint8_t prediction_table[3][12] = {
  293. { 0, 8, 4, 10, 11, 2, 6, 9, 1, 3, 5, 7 },
  294. { 4, 0, 8, 11, 10, 3, 5, 2, 6, 9, 1, 7 },
  295. { 8, 0, 4, 10, 11, 1, 7, 2, 6, 9, 3, 5 },
  296. };
  297. w->raw_orient = x8_get_orient_vlc(w);
  298. if (w->raw_orient < 0)
  299. return -1;
  300. av_assert2(w->raw_orient < 12);
  301. av_assert2(w->orient < 3);
  302. w->orient=prediction_table[w->orient][w->raw_orient];
  303. }
  304. return 0;
  305. }
  306. static void x8_update_predictions(IntraX8Context *const w, const int orient,
  307. const int est_run)
  308. {
  309. w->prediction_table[w->mb_x * 2 + (w->mb_y & 1)] = (est_run << 2) + 1 * (orient == 4) + 2 * (orient == 8);
  310. /*
  311. * y = 2n + 0 -> // 0 2 4
  312. * y = 2n + 1 -> // 1 3 5
  313. */
  314. }
  315. static void x8_get_prediction_chroma(IntraX8Context *const w)
  316. {
  317. w->edges = 1 * !(w->mb_x >> 1);
  318. w->edges |= 2 * !(w->mb_y >> 1);
  319. w->edges |= 4 * (w->mb_x >= (2 * w->mb_width - 1)); // mb_x for chroma would always be odd
  320. w->raw_orient = 0;
  321. // lut_co[8] = {inv,4,8,8, inv,4,8,8} <- => {1,1,0,0;1,1,0,0} => 0xCC
  322. if (w->edges & 3) {
  323. w->chroma_orient = 4 << ((0xCC >> w->edges) & 1);
  324. return;
  325. }
  326. // block[x - 1][y | 1 - 1)]
  327. w->chroma_orient = (w->prediction_table[2 * w->mb_x - 2] & 0x03) << 2;
  328. }
  329. static void x8_get_prediction(IntraX8Context *const w)
  330. {
  331. int a, b, c, i;
  332. w->edges = 1 * !w->mb_x;
  333. w->edges |= 2 * !w->mb_y;
  334. w->edges |= 4 * (w->mb_x >= (2 * w->mb_width - 1));
  335. switch (w->edges & 3) {
  336. case 0:
  337. break;
  338. case 1:
  339. // take the one from the above block[0][y - 1]
  340. w->est_run = w->prediction_table[!(w->mb_y & 1)] >> 2;
  341. w->orient = 1;
  342. return;
  343. case 2:
  344. // take the one from the previous block[x - 1][0]
  345. w->est_run = w->prediction_table[2 * w->mb_x - 2] >> 2;
  346. w->orient = 2;
  347. return;
  348. case 3:
  349. w->est_run = 16;
  350. w->orient = 0;
  351. return;
  352. }
  353. // no edge cases
  354. b = w->prediction_table[2 * w->mb_x + !(w->mb_y & 1)]; // block[x ][y - 1]
  355. a = w->prediction_table[2 * w->mb_x - 2 + (w->mb_y & 1)]; // block[x - 1][y ]
  356. c = w->prediction_table[2 * w->mb_x - 2 + !(w->mb_y & 1)]; // block[x - 1][y - 1]
  357. w->est_run = FFMIN(b, a);
  358. /* This condition has nothing to do with w->edges, even if it looks
  359. * similar it would trigger if e.g. x = 3; y = 2;
  360. * I guess somebody wrote something wrong and it became standard. */
  361. if ((w->mb_x & w->mb_y) != 0)
  362. w->est_run = FFMIN(c, w->est_run);
  363. w->est_run >>= 2;
  364. a &= 3;
  365. b &= 3;
  366. c &= 3;
  367. i = (0xFFEAF4C4 >> (2 * b + 8 * a)) & 3;
  368. if (i != 3)
  369. w->orient = i;
  370. else
  371. w->orient = (0xFFEAD8 >> (2 * c + 8 * (w->quant > 12))) & 3;
  372. /*
  373. * lut1[b][a] = {
  374. * ->{ 0, 1, 0, pad },
  375. * { 0, 1, X, pad },
  376. * { 2, 2, 2, pad }
  377. * }
  378. * pad 2 2 2;
  379. * pad X 1 0;
  380. * pad 0 1 0 <-
  381. * -> 11 10 '10 10 '11 11'01 00 '11 00'01 00 => 0xEAF4C4
  382. *
  383. * lut2[q>12][c] = {
  384. * ->{ 0, 2, 1, pad},
  385. * { 2, 2, 2, pad}
  386. * }
  387. * pad 2 2 2;
  388. * pad 1 2 0 <-
  389. * -> 11 10'10 10 '11 01'10 00 => 0xEAD8
  390. */
  391. }
  392. static void x8_ac_compensation(IntraX8Context *const w, const int direction,
  393. const int dc_level)
  394. {
  395. int t;
  396. #define B(x,y) w->block[0][w->idct_permutation[(x) + (y) * 8]]
  397. #define T(x) ((x) * dc_level + 0x8000) >> 16;
  398. switch (direction) {
  399. case 0:
  400. t = T(3811); // h
  401. B(1, 0) -= t;
  402. B(0, 1) -= t;
  403. t = T(487); // e
  404. B(2, 0) -= t;
  405. B(0, 2) -= t;
  406. t = T(506); // f
  407. B(3, 0) -= t;
  408. B(0, 3) -= t;
  409. t = T(135); // c
  410. B(4, 0) -= t;
  411. B(0, 4) -= t;
  412. B(2, 1) += t;
  413. B(1, 2) += t;
  414. B(3, 1) += t;
  415. B(1, 3) += t;
  416. t = T(173); // d
  417. B(5, 0) -= t;
  418. B(0, 5) -= t;
  419. t = T(61); // b
  420. B(6, 0) -= t;
  421. B(0, 6) -= t;
  422. B(5, 1) += t;
  423. B(1, 5) += t;
  424. t = T(42); // a
  425. B(7, 0) -= t;
  426. B(0, 7) -= t;
  427. B(4, 1) += t;
  428. B(1, 4) += t;
  429. B(4, 4) += t;
  430. t = T(1084); // g
  431. B(1, 1) += t;
  432. w->block_last_index[0] = FFMAX(w->block_last_index[0], 7 * 8);
  433. break;
  434. case 1:
  435. B(0, 1) -= T(6269);
  436. B(0, 3) -= T(708);
  437. B(0, 5) -= T(172);
  438. B(0, 7) -= T(73);
  439. w->block_last_index[0] = FFMAX(w->block_last_index[0], 7 * 8);
  440. break;
  441. case 2:
  442. B(1, 0) -= T(6269);
  443. B(3, 0) -= T(708);
  444. B(5, 0) -= T(172);
  445. B(7, 0) -= T(73);
  446. w->block_last_index[0] = FFMAX(w->block_last_index[0], 7);
  447. break;
  448. }
  449. #undef B
  450. #undef T
  451. }
  452. static void dsp_x8_put_solidcolor(const uint8_t pix, uint8_t *dst,
  453. const ptrdiff_t linesize)
  454. {
  455. int k;
  456. for (k = 0; k < 8; k++) {
  457. memset(dst, pix, 8);
  458. dst += linesize;
  459. }
  460. }
  461. static const int16_t quant_table[64] = {
  462. 256, 256, 256, 256, 256, 256, 259, 262,
  463. 265, 269, 272, 275, 278, 282, 285, 288,
  464. 292, 295, 299, 303, 306, 310, 314, 317,
  465. 321, 325, 329, 333, 337, 341, 345, 349,
  466. 353, 358, 362, 366, 371, 375, 379, 384,
  467. 389, 393, 398, 403, 408, 413, 417, 422,
  468. 428, 433, 438, 443, 448, 454, 459, 465,
  469. 470, 476, 482, 488, 493, 499, 505, 511,
  470. };
  471. static int x8_decode_intra_mb(IntraX8Context *const w, const int chroma)
  472. {
  473. uint8_t *scantable;
  474. int final, run, level;
  475. int ac_mode, dc_mode, est_run, dc_level;
  476. int pos, n;
  477. int zeros_only;
  478. int use_quant_matrix;
  479. int sign;
  480. av_assert2(w->orient < 12);
  481. w->bdsp.clear_block(w->block[0]);
  482. if (chroma)
  483. dc_mode = 2;
  484. else
  485. dc_mode = !!w->est_run; // 0, 1
  486. if (x8_get_dc_rlf(w, dc_mode, &dc_level, &final))
  487. return -1;
  488. n = 0;
  489. zeros_only = 0;
  490. if (!final) { // decode ac
  491. use_quant_matrix = w->use_quant_matrix;
  492. if (chroma) {
  493. ac_mode = 1;
  494. est_run = 64; // not used
  495. } else {
  496. if (w->raw_orient < 3)
  497. use_quant_matrix = 0;
  498. if (w->raw_orient > 4) {
  499. ac_mode = 0;
  500. est_run = 64;
  501. } else {
  502. if (w->est_run > 1) {
  503. ac_mode = 2;
  504. est_run = w->est_run;
  505. } else {
  506. ac_mode = 3;
  507. est_run = 64;
  508. }
  509. }
  510. }
  511. x8_select_ac_table(w, ac_mode);
  512. /* scantable_selector[12] = { 0, 2, 0, 1, 1, 1, 0, 2, 2, 0, 1, 2 }; <-
  513. * -> 10'01' 00'10' 10'00' 01'01' 01'00' 10'00 => 0x928548 */
  514. scantable = w->scantable[(0x928548 >> (2 * w->orient)) & 3].permutated;
  515. pos = 0;
  516. do {
  517. n++;
  518. if (n >= est_run) {
  519. ac_mode = 3;
  520. x8_select_ac_table(w, 3);
  521. }
  522. x8_get_ac_rlf(w, ac_mode, &run, &level, &final);
  523. pos += run + 1;
  524. if (pos > 63) {
  525. // this also handles vlc error in x8_get_ac_rlf
  526. return -1;
  527. }
  528. level = (level + 1) * w->dquant;
  529. level += w->qsum;
  530. sign = -get_bits1(w->gb);
  531. level = (level ^ sign) - sign;
  532. if (use_quant_matrix)
  533. level = (level * quant_table[pos]) >> 8;
  534. w->block[0][scantable[pos]] = level;
  535. } while (!final);
  536. w->block_last_index[0] = pos;
  537. } else { // DC only
  538. w->block_last_index[0] = 0;
  539. if (w->flat_dc && ((unsigned) (dc_level + 1)) < 3) { // [-1; 1]
  540. int32_t divide_quant = !chroma ? w->divide_quant_dc_luma
  541. : w->divide_quant_dc_chroma;
  542. int32_t dc_quant = !chroma ? w->quant
  543. : w->quant_dc_chroma;
  544. // original intent dc_level += predicted_dc/quant;
  545. // but it got lost somewhere in the rounding
  546. dc_level += (w->predicted_dc * divide_quant + (1 << 12)) >> 13;
  547. dsp_x8_put_solidcolor(av_clip_uint8((dc_level * dc_quant + 4) >> 3),
  548. w->dest[chroma],
  549. w->frame->linesize[!!chroma]);
  550. goto block_placed;
  551. }
  552. zeros_only = dc_level == 0;
  553. }
  554. if (!chroma)
  555. w->block[0][0] = dc_level * w->quant;
  556. else
  557. w->block[0][0] = dc_level * w->quant_dc_chroma;
  558. // there is !zero_only check in the original, but dc_level check is enough
  559. if ((unsigned int) (dc_level + 1) >= 3 && (w->edges & 3) != 3) {
  560. int direction;
  561. /* ac_comp_direction[orient] = { 0, 3, 3, 1, 1, 0, 0, 0, 2, 2, 2, 1 }; <-
  562. * -> 01'10' 10'10' 00'00' 00'01' 01'11' 11'00 => 0x6A017C */
  563. direction = (0x6A017C >> (w->orient * 2)) & 3;
  564. if (direction != 3) {
  565. // modify block_last[]
  566. x8_ac_compensation(w, direction, w->block[0][0]);
  567. }
  568. }
  569. if (w->flat_dc) {
  570. dsp_x8_put_solidcolor(w->predicted_dc, w->dest[chroma],
  571. w->frame->linesize[!!chroma]);
  572. } else {
  573. w->dsp.spatial_compensation[w->orient](w->scratchpad,
  574. w->dest[chroma],
  575. w->frame->linesize[!!chroma]);
  576. }
  577. if (!zeros_only)
  578. w->wdsp.idct_add(w->dest[chroma],
  579. w->frame->linesize[!!chroma],
  580. w->block[0]);
  581. block_placed:
  582. if (!chroma)
  583. x8_update_predictions(w, w->orient, n);
  584. if (w->loopfilter) {
  585. uint8_t *ptr = w->dest[chroma];
  586. ptrdiff_t linesize = w->frame->linesize[!!chroma];
  587. if (!((w->edges & 2) || (zeros_only && (w->orient | 4) == 4)))
  588. w->dsp.h_loop_filter(ptr, linesize, w->quant);
  589. if (!((w->edges & 1) || (zeros_only && (w->orient | 8) == 8)))
  590. w->dsp.v_loop_filter(ptr, linesize, w->quant);
  591. }
  592. return 0;
  593. }
  594. // FIXME maybe merge with ff_*
  595. static void x8_init_block_index(IntraX8Context *w, AVFrame *frame)
  596. {
  597. // not parent codec linesize as this would be wrong for field pics
  598. // not that IntraX8 has interlacing support ;)
  599. const ptrdiff_t linesize = frame->linesize[0];
  600. const ptrdiff_t uvlinesize = frame->linesize[1];
  601. w->dest[0] = frame->data[0];
  602. w->dest[1] = frame->data[1];
  603. w->dest[2] = frame->data[2];
  604. w->dest[0] += w->mb_y * linesize << 3;
  605. // chroma blocks are on add rows
  606. w->dest[1] += (w->mb_y & ~1) * uvlinesize << 2;
  607. w->dest[2] += (w->mb_y & ~1) * uvlinesize << 2;
  608. }
  609. av_cold int ff_intrax8_common_init(AVCodecContext *avctx,
  610. IntraX8Context *w, IDCTDSPContext *idsp,
  611. int16_t (*block)[64],
  612. int block_last_index[12],
  613. int mb_width, int mb_height)
  614. {
  615. static AVOnce init_static_once = AV_ONCE_INIT;
  616. w->avctx = avctx;
  617. w->idsp = *idsp;
  618. w->mb_width = mb_width;
  619. w->mb_height = mb_height;
  620. w->block = block;
  621. w->block_last_index = block_last_index;
  622. // two rows, 2 blocks per cannon mb
  623. w->prediction_table = av_mallocz(w->mb_width * 2 * 2);
  624. if (!w->prediction_table)
  625. return AVERROR(ENOMEM);
  626. ff_wmv2dsp_init(&w->wdsp);
  627. ff_init_scantable_permutation(w->idct_permutation,
  628. w->wdsp.idct_perm);
  629. ff_init_scantable(w->idct_permutation, &w->scantable[0],
  630. ff_wmv1_scantable[0]);
  631. ff_init_scantable(w->idct_permutation, &w->scantable[1],
  632. ff_wmv1_scantable[2]);
  633. ff_init_scantable(w->idct_permutation, &w->scantable[2],
  634. ff_wmv1_scantable[3]);
  635. ff_intrax8dsp_init(&w->dsp);
  636. ff_blockdsp_init(&w->bdsp, avctx);
  637. ff_thread_once(&init_static_once, x8_vlc_init);
  638. return 0;
  639. }
  640. av_cold void ff_intrax8_common_end(IntraX8Context *w)
  641. {
  642. av_freep(&w->prediction_table);
  643. }
  644. int ff_intrax8_decode_picture(IntraX8Context *w, Picture *pict,
  645. GetBitContext *gb, int *mb_x, int *mb_y,
  646. int dquant, int quant_offset,
  647. int loopfilter, int lowdelay)
  648. {
  649. int mb_xy;
  650. w->gb = gb;
  651. w->dquant = dquant;
  652. w->quant = dquant >> 1;
  653. w->qsum = quant_offset;
  654. w->frame = pict->f;
  655. w->loopfilter = loopfilter;
  656. w->use_quant_matrix = get_bits1(w->gb);
  657. w->mb_x = *mb_x;
  658. w->mb_y = *mb_y;
  659. w->divide_quant_dc_luma = ((1 << 16) + (w->quant >> 1)) / w->quant;
  660. if (w->quant < 5) {
  661. w->quant_dc_chroma = w->quant;
  662. w->divide_quant_dc_chroma = w->divide_quant_dc_luma;
  663. } else {
  664. w->quant_dc_chroma = w->quant + ((w->quant + 3) >> 3);
  665. w->divide_quant_dc_chroma = ((1 << 16) + (w->quant_dc_chroma >> 1)) / w->quant_dc_chroma;
  666. }
  667. x8_reset_vlc_tables(w);
  668. for (w->mb_y = 0; w->mb_y < w->mb_height * 2; w->mb_y++) {
  669. x8_init_block_index(w, w->frame);
  670. mb_xy = (w->mb_y >> 1) * (w->mb_width + 1);
  671. if (get_bits_left(gb) < 1)
  672. goto error;
  673. for (w->mb_x = 0; w->mb_x < w->mb_width * 2; w->mb_x++) {
  674. x8_get_prediction(w);
  675. if (x8_setup_spatial_predictor(w, 0))
  676. goto error;
  677. if (x8_decode_intra_mb(w, 0))
  678. goto error;
  679. if (w->mb_x & w->mb_y & 1) {
  680. x8_get_prediction_chroma(w);
  681. /* when setting up chroma, no vlc is read,
  682. * so no error condition can be reached */
  683. x8_setup_spatial_predictor(w, 1);
  684. if (x8_decode_intra_mb(w, 1))
  685. goto error;
  686. x8_setup_spatial_predictor(w, 2);
  687. if (x8_decode_intra_mb(w, 2))
  688. goto error;
  689. w->dest[1] += 8;
  690. w->dest[2] += 8;
  691. pict->qscale_table[mb_xy] = w->quant;
  692. mb_xy++;
  693. }
  694. w->dest[0] += 8;
  695. }
  696. if (w->mb_y & 1)
  697. ff_draw_horiz_band(w->avctx, w->frame, w->frame,
  698. (w->mb_y - 1) * 8, 16,
  699. PICT_FRAME, 0, lowdelay);
  700. }
  701. error:
  702. *mb_x = w->mb_x;
  703. *mb_y = w->mb_y;
  704. return 0;
  705. }