You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1419 lines
42KB

  1. /*
  2. * HEVC CABAC decoding
  3. *
  4. * Copyright (C) 2012 - 2013 Guillaume Martres
  5. * Copyright (C) 2012 - 2013 Gildas Cocherel
  6. *
  7. * This file is part of FFmpeg.
  8. *
  9. * FFmpeg is free software; you can redistribute it and/or
  10. * modify it under the terms of the GNU Lesser General Public
  11. * License as published by the Free Software Foundation; either
  12. * version 2.1 of the License, or (at your option) any later version.
  13. *
  14. * FFmpeg is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  17. * Lesser General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU Lesser General Public
  20. * License along with FFmpeg; if not, write to the Free Software
  21. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  22. */
  23. #include "libavutil/attributes.h"
  24. #include "libavutil/common.h"
  25. #include "cabac_functions.h"
  26. #include "hevc.h"
  27. #define CABAC_MAX_BIN 100
  28. /**
  29. * number of bin by SyntaxElement.
  30. */
  31. static const int8_t num_bins_in_se[] = {
  32. 1, // sao_merge_flag
  33. 1, // sao_type_idx
  34. 0, // sao_eo_class
  35. 0, // sao_band_position
  36. 0, // sao_offset_abs
  37. 0, // sao_offset_sign
  38. 0, // end_of_slice_flag
  39. 3, // split_coding_unit_flag
  40. 1, // cu_transquant_bypass_flag
  41. 3, // skip_flag
  42. 3, // cu_qp_delta
  43. 1, // pred_mode
  44. 4, // part_mode
  45. 0, // pcm_flag
  46. 1, // prev_intra_luma_pred_mode
  47. 0, // mpm_idx
  48. 0, // rem_intra_luma_pred_mode
  49. 2, // intra_chroma_pred_mode
  50. 1, // merge_flag
  51. 1, // merge_idx
  52. 5, // inter_pred_idc
  53. 2, // ref_idx_l0
  54. 2, // ref_idx_l1
  55. 2, // abs_mvd_greater0_flag
  56. 2, // abs_mvd_greater1_flag
  57. 0, // abs_mvd_minus2
  58. 0, // mvd_sign_flag
  59. 1, // mvp_lx_flag
  60. 1, // no_residual_data_flag
  61. 3, // split_transform_flag
  62. 2, // cbf_luma
  63. 4, // cbf_cb, cbf_cr
  64. 2, // transform_skip_flag[][]
  65. 18, // last_significant_coeff_x_prefix
  66. 18, // last_significant_coeff_y_prefix
  67. 0, // last_significant_coeff_x_suffix
  68. 0, // last_significant_coeff_y_suffix
  69. 4, // significant_coeff_group_flag
  70. 42, // significant_coeff_flag
  71. 24, // coeff_abs_level_greater1_flag
  72. 6, // coeff_abs_level_greater2_flag
  73. 0, // coeff_abs_level_remaining
  74. 0, // coeff_sign_flag
  75. };
  76. /**
  77. * Offset to ctxIdx 0 in init_values and states, indexed by SyntaxElement.
  78. */
  79. static const int elem_offset[sizeof(num_bins_in_se)] = {
  80. 0,
  81. 1,
  82. 2,
  83. 2,
  84. 2,
  85. 2,
  86. 2,
  87. 2,
  88. 5,
  89. 6,
  90. 9,
  91. 12,
  92. 13,
  93. 17,
  94. 17,
  95. 18,
  96. 18,
  97. 18,
  98. 20,
  99. 21,
  100. 22,
  101. 27,
  102. 29,
  103. 31,
  104. 33,
  105. 35,
  106. 35,
  107. 35,
  108. 36,
  109. 37,
  110. 40,
  111. 42,
  112. 46,
  113. 48,
  114. 66,
  115. 84,
  116. 84,
  117. 84,
  118. 88,
  119. 130,
  120. 154,
  121. 160,
  122. 160,
  123. };
  124. #define CNU 154
  125. /**
  126. * Indexed by init_type
  127. */
  128. static const uint8_t init_values[3][HEVC_CONTEXTS] = {
  129. {
  130. // sao_merge_flag
  131. 153,
  132. // sao_type_idx
  133. 200,
  134. // split_coding_unit_flag
  135. 139, 141, 157,
  136. // cu_transquant_bypass_flag
  137. 154,
  138. // skip_flag
  139. CNU, CNU, CNU,
  140. // cu_qp_delta
  141. 154, 154, 154,
  142. // pred_mode
  143. CNU,
  144. // part_mode
  145. 184, CNU, CNU, CNU,
  146. // prev_intra_luma_pred_mode
  147. 184,
  148. // intra_chroma_pred_mode
  149. 63, 139,
  150. // merge_flag
  151. CNU,
  152. // merge_idx
  153. CNU,
  154. // inter_pred_idc
  155. CNU, CNU, CNU, CNU, CNU,
  156. // ref_idx_l0
  157. CNU, CNU,
  158. // ref_idx_l1
  159. CNU, CNU,
  160. // abs_mvd_greater1_flag
  161. CNU, CNU,
  162. // abs_mvd_greater1_flag
  163. CNU, CNU,
  164. // mvp_lx_flag
  165. CNU,
  166. // no_residual_data_flag
  167. CNU,
  168. // split_transform_flag
  169. 153, 138, 138,
  170. // cbf_luma
  171. 111, 141,
  172. // cbf_cb, cbf_cr
  173. 94, 138, 182, 154,
  174. // transform_skip_flag
  175. 139, 139,
  176. // last_significant_coeff_x_prefix
  177. 110, 110, 124, 125, 140, 153, 125, 127, 140, 109, 111, 143, 127, 111,
  178. 79, 108, 123, 63,
  179. // last_significant_coeff_y_prefix
  180. 110, 110, 124, 125, 140, 153, 125, 127, 140, 109, 111, 143, 127, 111,
  181. 79, 108, 123, 63,
  182. // significant_coeff_group_flag
  183. 91, 171, 134, 141,
  184. // significant_coeff_flag
  185. 111, 111, 125, 110, 110, 94, 124, 108, 124, 107, 125, 141, 179, 153,
  186. 125, 107, 125, 141, 179, 153, 125, 107, 125, 141, 179, 153, 125, 140,
  187. 139, 182, 182, 152, 136, 152, 136, 153, 136, 139, 111, 136, 139, 111,
  188. // coeff_abs_level_greater1_flag
  189. 140, 92, 137, 138, 140, 152, 138, 139, 153, 74, 149, 92, 139, 107,
  190. 122, 152, 140, 179, 166, 182, 140, 227, 122, 197,
  191. // coeff_abs_level_greater2_flag
  192. 138, 153, 136, 167, 152, 152,
  193. },
  194. {
  195. // sao_merge_flag
  196. 153,
  197. // sao_type_idx
  198. 185,
  199. // split_coding_unit_flag
  200. 107, 139, 126,
  201. // cu_transquant_bypass_flag
  202. 154,
  203. // skip_flag
  204. 197, 185, 201,
  205. // cu_qp_delta
  206. 154, 154, 154,
  207. // pred_mode
  208. 149,
  209. // part_mode
  210. 154, 139, 154, 154,
  211. // prev_intra_luma_pred_mode
  212. 154,
  213. // intra_chroma_pred_mode
  214. 152, 139,
  215. // merge_flag
  216. 110,
  217. // merge_idx
  218. 122,
  219. // inter_pred_idc
  220. 95, 79, 63, 31, 31,
  221. // ref_idx_l0
  222. 153, 153,
  223. // ref_idx_l1
  224. 153, 153,
  225. // abs_mvd_greater1_flag
  226. 140, 198,
  227. // abs_mvd_greater1_flag
  228. 140, 198,
  229. // mvp_lx_flag
  230. 168,
  231. // no_residual_data_flag
  232. 79,
  233. // split_transform_flag
  234. 124, 138, 94,
  235. // cbf_luma
  236. 153, 111,
  237. // cbf_cb, cbf_cr
  238. 149, 107, 167, 154,
  239. // transform_skip_flag
  240. 139, 139,
  241. // last_significant_coeff_x_prefix
  242. 125, 110, 94, 110, 95, 79, 125, 111, 110, 78, 110, 111, 111, 95,
  243. 94, 108, 123, 108,
  244. // last_significant_coeff_y_prefix
  245. 125, 110, 94, 110, 95, 79, 125, 111, 110, 78, 110, 111, 111, 95,
  246. 94, 108, 123, 108,
  247. // significant_coeff_group_flag
  248. 121, 140, 61, 154,
  249. // significant_coeff_flag
  250. 155, 154, 139, 153, 139, 123, 123, 63, 153, 166, 183, 140, 136, 153,
  251. 154, 166, 183, 140, 136, 153, 154, 166, 183, 140, 136, 153, 154, 170,
  252. 153, 123, 123, 107, 121, 107, 121, 167, 151, 183, 140, 151, 183, 140,
  253. // coeff_abs_level_greater1_flag
  254. 154, 196, 196, 167, 154, 152, 167, 182, 182, 134, 149, 136, 153, 121,
  255. 136, 137, 169, 194, 166, 167, 154, 167, 137, 182,
  256. // coeff_abs_level_greater2_flag
  257. 107, 167, 91, 122, 107, 167,
  258. },
  259. {
  260. // sao_merge_flag
  261. 153,
  262. // sao_type_idx
  263. 160,
  264. // split_coding_unit_flag
  265. 107, 139, 126,
  266. // cu_transquant_bypass_flag
  267. 154,
  268. // skip_flag
  269. 197, 185, 201,
  270. // cu_qp_delta
  271. 154, 154, 154,
  272. // pred_mode
  273. 134,
  274. // part_mode
  275. 154, 139, 154, 154,
  276. // prev_intra_luma_pred_mode
  277. 183,
  278. // intra_chroma_pred_mode
  279. 152, 139,
  280. // merge_flag
  281. 154,
  282. // merge_idx
  283. 137,
  284. // inter_pred_idc
  285. 95, 79, 63, 31, 31,
  286. // ref_idx_l0
  287. 153, 153,
  288. // ref_idx_l1
  289. 153, 153,
  290. // abs_mvd_greater1_flag
  291. 169, 198,
  292. // abs_mvd_greater1_flag
  293. 169, 198,
  294. // mvp_lx_flag
  295. 168,
  296. // no_residual_data_flag
  297. 79,
  298. // split_transform_flag
  299. 224, 167, 122,
  300. // cbf_luma
  301. 153, 111,
  302. // cbf_cb, cbf_cr
  303. 149, 92, 167, 154,
  304. // transform_skip_flag
  305. 139, 139,
  306. // last_significant_coeff_x_prefix
  307. 125, 110, 124, 110, 95, 94, 125, 111, 111, 79, 125, 126, 111, 111,
  308. 79, 108, 123, 93,
  309. // last_significant_coeff_y_prefix
  310. 125, 110, 124, 110, 95, 94, 125, 111, 111, 79, 125, 126, 111, 111,
  311. 79, 108, 123, 93,
  312. // significant_coeff_group_flag
  313. 121, 140, 61, 154,
  314. // significant_coeff_flag
  315. 170, 154, 139, 153, 139, 123, 123, 63, 124, 166, 183, 140, 136, 153,
  316. 154, 166, 183, 140, 136, 153, 154, 166, 183, 140, 136, 153, 154, 170,
  317. 153, 138, 138, 122, 121, 122, 121, 167, 151, 183, 140, 151, 183, 140,
  318. // coeff_abs_level_greater1_flag
  319. 154, 196, 167, 167, 154, 152, 167, 182, 182, 134, 149, 136, 153, 121,
  320. 136, 122, 169, 208, 166, 167, 154, 152, 167, 182,
  321. // coeff_abs_level_greater2_flag
  322. 107, 167, 91, 107, 107, 167,
  323. },
  324. };
  325. static const uint8_t scan_1x1[1] = {
  326. 0,
  327. };
  328. static const uint8_t horiz_scan2x2_x[4] = {
  329. 0, 1, 0, 1,
  330. };
  331. static const uint8_t horiz_scan2x2_y[4] = {
  332. 0, 0, 1, 1
  333. };
  334. static const uint8_t horiz_scan4x4_x[16] = {
  335. 0, 1, 2, 3,
  336. 0, 1, 2, 3,
  337. 0, 1, 2, 3,
  338. 0, 1, 2, 3,
  339. };
  340. static const uint8_t horiz_scan4x4_y[16] = {
  341. 0, 0, 0, 0,
  342. 1, 1, 1, 1,
  343. 2, 2, 2, 2,
  344. 3, 3, 3, 3,
  345. };
  346. static const uint8_t horiz_scan8x8_inv[8][8] = {
  347. { 0, 1, 2, 3, 16, 17, 18, 19, },
  348. { 4, 5, 6, 7, 20, 21, 22, 23, },
  349. { 8, 9, 10, 11, 24, 25, 26, 27, },
  350. { 12, 13, 14, 15, 28, 29, 30, 31, },
  351. { 32, 33, 34, 35, 48, 49, 50, 51, },
  352. { 36, 37, 38, 39, 52, 53, 54, 55, },
  353. { 40, 41, 42, 43, 56, 57, 58, 59, },
  354. { 44, 45, 46, 47, 60, 61, 62, 63, },
  355. };
  356. static const uint8_t diag_scan4x1_x[4] = {
  357. 0, 1, 2, 3,
  358. };
  359. static const uint8_t diag_scan1x4_y[4] = {
  360. 0, 1, 2, 3,
  361. };
  362. static const uint8_t diag_scan2x2_x[4] = {
  363. 0, 0, 1, 1,
  364. };
  365. static const uint8_t diag_scan2x2_y[4] = {
  366. 0, 1, 0, 1,
  367. };
  368. static const uint8_t diag_scan2x2_inv[2][2] = {
  369. { 0, 2, },
  370. { 1, 3, },
  371. };
  372. static const uint8_t diag_scan8x2_x[16] = {
  373. 0, 0, 1, 1,
  374. 2, 2, 3, 3,
  375. 4, 4, 5, 5,
  376. 6, 6, 7, 7,
  377. };
  378. static const uint8_t diag_scan8x2_y[16] = {
  379. 0, 1, 0, 1,
  380. 0, 1, 0, 1,
  381. 0, 1, 0, 1,
  382. 0, 1, 0, 1,
  383. };
  384. static const uint8_t diag_scan8x2_inv[2][8] = {
  385. { 0, 2, 4, 6, 8, 10, 12, 14, },
  386. { 1, 3, 5, 7, 9, 11, 13, 15, },
  387. };
  388. static const uint8_t diag_scan2x8_x[16] = {
  389. 0, 0, 1, 0,
  390. 1, 0, 1, 0,
  391. 1, 0, 1, 0,
  392. 1, 0, 1, 1,
  393. };
  394. static const uint8_t diag_scan2x8_y[16] = {
  395. 0, 1, 0, 2,
  396. 1, 3, 2, 4,
  397. 3, 5, 4, 6,
  398. 5, 7, 6, 7,
  399. };
  400. static const uint8_t diag_scan2x8_inv[8][2] = {
  401. { 0, 2, },
  402. { 1, 4, },
  403. { 3, 6, },
  404. { 5, 8, },
  405. { 7, 10, },
  406. { 9, 12, },
  407. { 11, 14, },
  408. { 13, 15, },
  409. };
  410. const uint8_t ff_hevc_diag_scan4x4_x[16] = {
  411. 0, 0, 1, 0,
  412. 1, 2, 0, 1,
  413. 2, 3, 1, 2,
  414. 3, 2, 3, 3,
  415. };
  416. const uint8_t ff_hevc_diag_scan4x4_y[16] = {
  417. 0, 1, 0, 2,
  418. 1, 0, 3, 2,
  419. 1, 0, 3, 2,
  420. 1, 3, 2, 3,
  421. };
  422. static const uint8_t diag_scan4x4_inv[4][4] = {
  423. { 0, 2, 5, 9, },
  424. { 1, 4, 8, 12, },
  425. { 3, 7, 11, 14, },
  426. { 6, 10, 13, 15, },
  427. };
  428. const uint8_t ff_hevc_diag_scan8x8_x[64] = {
  429. 0, 0, 1, 0,
  430. 1, 2, 0, 1,
  431. 2, 3, 0, 1,
  432. 2, 3, 4, 0,
  433. 1, 2, 3, 4,
  434. 5, 0, 1, 2,
  435. 3, 4, 5, 6,
  436. 0, 1, 2, 3,
  437. 4, 5, 6, 7,
  438. 1, 2, 3, 4,
  439. 5, 6, 7, 2,
  440. 3, 4, 5, 6,
  441. 7, 3, 4, 5,
  442. 6, 7, 4, 5,
  443. 6, 7, 5, 6,
  444. 7, 6, 7, 7,
  445. };
  446. const uint8_t ff_hevc_diag_scan8x8_y[64] = {
  447. 0, 1, 0, 2,
  448. 1, 0, 3, 2,
  449. 1, 0, 4, 3,
  450. 2, 1, 0, 5,
  451. 4, 3, 2, 1,
  452. 0, 6, 5, 4,
  453. 3, 2, 1, 0,
  454. 7, 6, 5, 4,
  455. 3, 2, 1, 0,
  456. 7, 6, 5, 4,
  457. 3, 2, 1, 7,
  458. 6, 5, 4, 3,
  459. 2, 7, 6, 5,
  460. 4, 3, 7, 6,
  461. 5, 4, 7, 6,
  462. 5, 7, 6, 7,
  463. };
  464. static const uint8_t diag_scan8x8_inv[8][8] = {
  465. { 0, 2, 5, 9, 14, 20, 27, 35, },
  466. { 1, 4, 8, 13, 19, 26, 34, 42, },
  467. { 3, 7, 12, 18, 25, 33, 41, 48, },
  468. { 6, 11, 17, 24, 32, 40, 47, 53, },
  469. { 10, 16, 23, 31, 39, 46, 52, 57, },
  470. { 15, 22, 30, 38, 45, 51, 56, 60, },
  471. { 21, 29, 37, 44, 50, 55, 59, 62, },
  472. { 28, 36, 43, 49, 54, 58, 61, 63, },
  473. };
  474. void ff_hevc_save_states(HEVCContext *s, int ctb_addr_ts)
  475. {
  476. if (s->pps->entropy_coding_sync_enabled_flag &&
  477. ((ctb_addr_ts % s->sps->ctb_width) == 2 ||
  478. (s->sps->ctb_width == 2 &&
  479. (ctb_addr_ts % s->sps->ctb_width) == 0))) {
  480. memcpy(s->cabac_state, s->HEVClc.cabac_state, HEVC_CONTEXTS);
  481. }
  482. }
  483. static void load_states(HEVCContext *s)
  484. {
  485. memcpy(s->HEVClc.cabac_state, s->cabac_state, HEVC_CONTEXTS);
  486. }
  487. static void cabac_reinit(HEVCLocalContext *lc)
  488. {
  489. skip_bytes(&lc->cc, 0);
  490. }
  491. static void cabac_init_decoder(HEVCContext *s)
  492. {
  493. GetBitContext *gb = &s->HEVClc.gb;
  494. skip_bits(gb, 1);
  495. align_get_bits(gb);
  496. ff_init_cabac_decoder(&s->HEVClc.cc,
  497. gb->buffer + get_bits_count(gb) / 8,
  498. (get_bits_left(gb) + 7) / 8);
  499. }
  500. static void cabac_init_state(HEVCContext *s)
  501. {
  502. int init_type = 2 - s->sh.slice_type;
  503. int i;
  504. if (s->sh.cabac_init_flag && s->sh.slice_type != I_SLICE)
  505. init_type ^= 3;
  506. for (i = 0; i < HEVC_CONTEXTS; i++) {
  507. int init_value = init_values[init_type][i];
  508. int m = (init_value >> 4) * 5 - 45;
  509. int n = ((init_value & 15) << 3) - 16;
  510. int pre = 2 * (((m * av_clip_c(s->sh.slice_qp, 0, 51)) >> 4) + n) - 127;
  511. pre ^= pre >> 31;
  512. if (pre > 124)
  513. pre = 124 + (pre & 1);
  514. s->HEVClc.cabac_state[i] = pre;
  515. }
  516. }
  517. void ff_hevc_cabac_init(HEVCContext *s, int ctb_addr_ts)
  518. {
  519. if (ctb_addr_ts == s->pps->ctb_addr_rs_to_ts[s->sh.slice_ctb_addr_rs]) {
  520. cabac_init_decoder(s);
  521. if ((s->sh.dependent_slice_segment_flag == 0) ||
  522. (s->pps->tiles_enabled_flag &&
  523. (s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[ctb_addr_ts - 1])))
  524. cabac_init_state(s);
  525. if (!s->sh.first_slice_in_pic_flag && s->pps->entropy_coding_sync_enabled_flag) {
  526. if ((ctb_addr_ts % s->sps->ctb_width) == 0) {
  527. if (s->sps->ctb_width == 1)
  528. cabac_init_state(s);
  529. else if (s->sh.dependent_slice_segment_flag == 1)
  530. load_states(s);
  531. }
  532. }
  533. } else {
  534. if (s->pps->tiles_enabled_flag &&
  535. (s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[ctb_addr_ts - 1])) {
  536. cabac_reinit(&s->HEVClc);
  537. cabac_init_state(s);
  538. }
  539. if (s->pps->entropy_coding_sync_enabled_flag) {
  540. if ((ctb_addr_ts % s->sps->ctb_width) == 0) {
  541. get_cabac_terminate(&s->HEVClc.cc);
  542. cabac_reinit(&s->HEVClc);
  543. if (s->sps->ctb_width == 1)
  544. cabac_init_state(s);
  545. else
  546. load_states(s);
  547. }
  548. }
  549. }
  550. }
  551. #define GET_CABAC(ctx) get_cabac(&s->HEVClc.cc, &s->HEVClc.cabac_state[ctx])
  552. int ff_hevc_sao_merge_flag_decode(HEVCContext *s)
  553. {
  554. return GET_CABAC(elem_offset[SAO_MERGE_FLAG]);
  555. }
  556. int ff_hevc_sao_type_idx_decode(HEVCContext *s)
  557. {
  558. if (!GET_CABAC(elem_offset[SAO_TYPE_IDX]))
  559. return 0;
  560. if (!get_cabac_bypass(&s->HEVClc.cc))
  561. return SAO_BAND;
  562. return SAO_EDGE;
  563. }
  564. int ff_hevc_sao_band_position_decode(HEVCContext *s)
  565. {
  566. int i;
  567. int value = get_cabac_bypass(&s->HEVClc.cc);
  568. for (i = 0; i < 4; i++)
  569. value = (value << 1) | get_cabac_bypass(&s->HEVClc.cc);
  570. return value;
  571. }
  572. int ff_hevc_sao_offset_abs_decode(HEVCContext *s)
  573. {
  574. int i = 0;
  575. int length = (1 << (FFMIN(s->sps->bit_depth, 10) - 5)) - 1;
  576. while (i < length && get_cabac_bypass(&s->HEVClc.cc))
  577. i++;
  578. return i;
  579. }
  580. int ff_hevc_sao_offset_sign_decode(HEVCContext *s)
  581. {
  582. return get_cabac_bypass(&s->HEVClc.cc);
  583. }
  584. int ff_hevc_sao_eo_class_decode(HEVCContext *s)
  585. {
  586. int ret = (get_cabac_bypass(&s->HEVClc.cc) << 1);
  587. ret |= get_cabac_bypass(&s->HEVClc.cc);
  588. return ret;
  589. }
  590. int ff_hevc_end_of_slice_flag_decode(HEVCContext *s)
  591. {
  592. return get_cabac_terminate(&s->HEVClc.cc);
  593. }
  594. int ff_hevc_cu_transquant_bypass_flag_decode(HEVCContext *s)
  595. {
  596. return GET_CABAC(elem_offset[CU_TRANSQUANT_BYPASS_FLAG]);
  597. }
  598. int ff_hevc_skip_flag_decode(HEVCContext *s, int x0, int y0, int x_cb, int y_cb)
  599. {
  600. int pic_width_in_ctb = s->sps->width >> s->sps->log2_min_coding_block_size;
  601. int inc = 0;
  602. int x0b = x0 & ((1 << s->sps->log2_ctb_size) - 1);
  603. int y0b = y0 & ((1 << s->sps->log2_ctb_size) - 1);
  604. if (s->HEVClc.ctb_left_flag || x0b)
  605. inc = SAMPLE_CTB(s->skip_flag, x_cb-1, y_cb);
  606. if (s->HEVClc.ctb_up_flag || y0b)
  607. inc += SAMPLE_CTB(s->skip_flag, x_cb, y_cb-1);
  608. return GET_CABAC(elem_offset[SKIP_FLAG] + inc);
  609. }
  610. int ff_hevc_cu_qp_delta_abs(HEVCContext *s)
  611. {
  612. int prefix_val = 0;
  613. int suffix_val = 0;
  614. int inc = 0;
  615. while (prefix_val < 5 && GET_CABAC(elem_offset[CU_QP_DELTA] + inc)) {
  616. prefix_val++;
  617. inc = 1;
  618. }
  619. if (prefix_val >= 5) {
  620. int k = 0;
  621. while (k < CABAC_MAX_BIN && get_cabac_bypass(&s->HEVClc.cc)) {
  622. suffix_val += 1 << k;
  623. k++;
  624. }
  625. if (k == CABAC_MAX_BIN)
  626. av_log(s->avctx, AV_LOG_ERROR, "CABAC_MAX_BIN : %d\n", k);
  627. while (k--)
  628. suffix_val += get_cabac_bypass(&s->HEVClc.cc) << k;
  629. }
  630. return prefix_val + suffix_val;
  631. }
  632. int ff_hevc_cu_qp_delta_sign_flag(HEVCContext *s)
  633. {
  634. return get_cabac_bypass(&s->HEVClc.cc);
  635. }
  636. int ff_hevc_pred_mode_decode(HEVCContext *s)
  637. {
  638. return GET_CABAC(elem_offset[PRED_MODE_FLAG]);
  639. }
  640. int ff_hevc_split_coding_unit_flag_decode(HEVCContext *s, int ct_depth, int x0, int y0)
  641. {
  642. int inc = 0, depth_left = 0, depth_top = 0;
  643. int x0b = x0 & ((1 << s->sps->log2_ctb_size) - 1);
  644. int y0b = y0 & ((1 << s->sps->log2_ctb_size) - 1);
  645. int x_cb = x0 >> s->sps->log2_min_coding_block_size;
  646. int y_cb = y0 >> s->sps->log2_min_coding_block_size;
  647. if (s->HEVClc.ctb_left_flag || x0b)
  648. depth_left = s->tab_ct_depth[(y_cb)*s->sps->min_cb_width + x_cb-1];
  649. if (s->HEVClc.ctb_up_flag || y0b)
  650. depth_top = s->tab_ct_depth[(y_cb-1)*s->sps->min_cb_width + x_cb];
  651. inc += (depth_left > ct_depth);
  652. inc += (depth_top > ct_depth);
  653. return GET_CABAC(elem_offset[SPLIT_CODING_UNIT_FLAG] + inc);
  654. }
  655. int ff_hevc_part_mode_decode(HEVCContext *s, int log2_cb_size)
  656. {
  657. if (GET_CABAC(elem_offset[PART_MODE])) // 1
  658. return PART_2Nx2N;
  659. if (log2_cb_size == s->sps->log2_min_coding_block_size) {
  660. if (s->HEVClc.cu.pred_mode == MODE_INTRA) // 0
  661. return PART_NxN;
  662. if (GET_CABAC(elem_offset[PART_MODE] + 1)) // 01
  663. return PART_2NxN;
  664. if (log2_cb_size == 3) // 00
  665. return PART_Nx2N;
  666. if (GET_CABAC(elem_offset[PART_MODE] + 2)) // 001
  667. return PART_Nx2N;
  668. return PART_NxN; // 000
  669. }
  670. if (!s->sps->amp_enabled_flag) {
  671. if (GET_CABAC(elem_offset[PART_MODE] + 1)) // 01
  672. return PART_2NxN;
  673. return PART_Nx2N;
  674. }
  675. if (GET_CABAC(elem_offset[PART_MODE] + 1)) { // 01X, 01XX
  676. if (GET_CABAC(elem_offset[PART_MODE] + 3)) // 011
  677. return PART_2NxN;
  678. if (get_cabac_bypass(&s->HEVClc.cc)) // 0101
  679. return PART_2NxnD;
  680. return PART_2NxnU; // 0100
  681. }
  682. if (GET_CABAC(elem_offset[PART_MODE] + 3)) // 001
  683. return PART_Nx2N;
  684. if (get_cabac_bypass(&s->HEVClc.cc)) // 0001
  685. return PART_nRx2N;
  686. return PART_nLx2N; // 0000
  687. }
  688. int ff_hevc_pcm_flag_decode(HEVCContext *s)
  689. {
  690. return get_cabac_terminate(&s->HEVClc.cc);
  691. }
  692. int ff_hevc_prev_intra_luma_pred_flag_decode(HEVCContext *s)
  693. {
  694. return GET_CABAC(elem_offset[PREV_INTRA_LUMA_PRED_FLAG]);
  695. }
  696. int ff_hevc_mpm_idx_decode(HEVCContext *s)
  697. {
  698. int i = 0;
  699. while (i < 2 && get_cabac_bypass(&s->HEVClc.cc))
  700. i++;
  701. return i;
  702. }
  703. int ff_hevc_rem_intra_luma_pred_mode_decode(HEVCContext *s)
  704. {
  705. int i;
  706. int value = get_cabac_bypass(&s->HEVClc.cc);
  707. for (i = 0; i < 4; i++)
  708. value = (value << 1) | get_cabac_bypass(&s->HEVClc.cc);
  709. return value;
  710. }
  711. int ff_hevc_intra_chroma_pred_mode_decode(HEVCContext *s)
  712. {
  713. int ret;
  714. if (!GET_CABAC(elem_offset[INTRA_CHROMA_PRED_MODE]))
  715. return 4;
  716. ret = (get_cabac_bypass(&s->HEVClc.cc) << 1);
  717. ret |= get_cabac_bypass(&s->HEVClc.cc);
  718. return ret;
  719. }
  720. int ff_hevc_merge_idx_decode(HEVCContext *s)
  721. {
  722. int i = GET_CABAC(elem_offset[MERGE_IDX]);
  723. if (i != 0) {
  724. while (i < s->sh.max_num_merge_cand-1 && get_cabac_bypass(&s->HEVClc.cc))
  725. i++;
  726. }
  727. return i;
  728. }
  729. int ff_hevc_merge_flag_decode(HEVCContext *s)
  730. {
  731. return GET_CABAC(elem_offset[MERGE_FLAG]);
  732. }
  733. int ff_hevc_inter_pred_idc_decode(HEVCContext *s, int nPbW, int nPbH)
  734. {
  735. if (nPbW + nPbH == 12)
  736. return GET_CABAC(elem_offset[INTER_PRED_IDC] + 4);
  737. if (GET_CABAC(elem_offset[INTER_PRED_IDC] + s->HEVClc.ct.depth))
  738. return PRED_BI;
  739. return GET_CABAC(elem_offset[INTER_PRED_IDC] + 4);
  740. }
  741. int ff_hevc_ref_idx_lx_decode(HEVCContext *s, int num_ref_idx_lx)
  742. {
  743. int i = 0;
  744. int max = num_ref_idx_lx - 1;
  745. int max_ctx = FFMIN(max, 2);
  746. while (i < max_ctx && GET_CABAC(elem_offset[REF_IDX_L0] + i))
  747. i++;
  748. if (i == 2) {
  749. while (i < max && get_cabac_bypass(&s->HEVClc.cc))
  750. i++;
  751. }
  752. return i;
  753. }
  754. int ff_hevc_mvp_lx_flag_decode(HEVCContext *s)
  755. {
  756. return GET_CABAC(elem_offset[MVP_LX_FLAG]);
  757. }
  758. int ff_hevc_no_residual_syntax_flag_decode(HEVCContext *s)
  759. {
  760. return GET_CABAC(elem_offset[NO_RESIDUAL_DATA_FLAG]);
  761. }
  762. static av_always_inline int abs_mvd_greater0_flag_decode(HEVCContext *s)
  763. {
  764. return GET_CABAC(elem_offset[ABS_MVD_GREATER0_FLAG]);
  765. }
  766. static av_always_inline int abs_mvd_greater1_flag_decode(HEVCContext *s)
  767. {
  768. return GET_CABAC(elem_offset[ABS_MVD_GREATER1_FLAG] + 1);
  769. }
  770. static av_always_inline int mvd_decode(HEVCContext *s)
  771. {
  772. int ret = 2;
  773. int k = 1;
  774. while (k < CABAC_MAX_BIN && get_cabac_bypass(&s->HEVClc.cc)) {
  775. ret += 1 << k;
  776. k++;
  777. }
  778. if (k == CABAC_MAX_BIN)
  779. av_log(s->avctx, AV_LOG_ERROR, "CABAC_MAX_BIN : %d\n", k);
  780. while (k--)
  781. ret += get_cabac_bypass(&s->HEVClc.cc) << k;
  782. return get_cabac_bypass_sign(&s->HEVClc.cc, -ret);
  783. }
  784. static av_always_inline int mvd_sign_flag_decode(HEVCContext *s)
  785. {
  786. return get_cabac_bypass_sign(&s->HEVClc.cc, -1);
  787. }
  788. int ff_hevc_split_transform_flag_decode(HEVCContext *s, int log2_trafo_size)
  789. {
  790. return GET_CABAC(elem_offset[SPLIT_TRANSFORM_FLAG] + 5 - log2_trafo_size);
  791. }
  792. int ff_hevc_cbf_cb_cr_decode(HEVCContext *s, int trafo_depth)
  793. {
  794. return GET_CABAC(elem_offset[CBF_CB_CR] + trafo_depth);
  795. }
  796. int ff_hevc_cbf_luma_decode(HEVCContext *s, int trafo_depth)
  797. {
  798. return GET_CABAC(elem_offset[CBF_LUMA] + !trafo_depth);
  799. }
  800. int ff_hevc_transform_skip_flag_decode(HEVCContext *s, int c_idx)
  801. {
  802. return GET_CABAC(elem_offset[TRANSFORM_SKIP_FLAG] + !!c_idx);
  803. }
  804. #define LAST_SIG_COEFF(elem) \
  805. int i = 0; \
  806. int max = (log2_size << 1) - 1; \
  807. int ctx_offset, ctx_shift; \
  808. \
  809. if (c_idx == 0) { \
  810. ctx_offset = 3 * (log2_size - 2) + ((log2_size - 1) >> 2); \
  811. ctx_shift = (log2_size + 1) >> 2; \
  812. } else { \
  813. ctx_offset = 15; \
  814. ctx_shift = log2_size - 2; \
  815. } \
  816. while (i < max && \
  817. GET_CABAC(elem_offset[elem] + (i >> ctx_shift) + ctx_offset)) \
  818. i++; \
  819. return i;
  820. static av_always_inline int last_significant_coeff_x_prefix_decode(HEVCContext *s, int c_idx,
  821. int log2_size)
  822. {
  823. LAST_SIG_COEFF(LAST_SIGNIFICANT_COEFF_X_PREFIX)
  824. }
  825. static av_always_inline int last_significant_coeff_y_prefix_decode(HEVCContext *s, int c_idx,
  826. int log2_size)
  827. {
  828. LAST_SIG_COEFF(LAST_SIGNIFICANT_COEFF_Y_PREFIX)
  829. }
  830. static av_always_inline int last_significant_coeff_suffix_decode(HEVCContext *s,
  831. int last_significant_coeff_prefix)
  832. {
  833. int i;
  834. int length = (last_significant_coeff_prefix >> 1) - 1;
  835. int value = get_cabac_bypass(&s->HEVClc.cc);
  836. for (i = 1; i < length; i++)
  837. value = (value << 1) | get_cabac_bypass(&s->HEVClc.cc);
  838. return value;
  839. }
  840. static av_always_inline int significant_coeff_group_flag_decode(HEVCContext *s, int c_idx, int ctx_cg)
  841. {
  842. int inc;
  843. inc = FFMIN(ctx_cg, 1) + (c_idx>0 ? 2 : 0);
  844. return GET_CABAC(elem_offset[SIGNIFICANT_COEFF_GROUP_FLAG] + inc);
  845. }
  846. static av_always_inline int significant_coeff_flag_decode(HEVCContext *s, int c_idx, int x_c, int y_c,
  847. int log2_trafo_size, int scan_idx, int prev_sig)
  848. {
  849. static const uint8_t ctx_idx_map[] = {
  850. 0, 1, 4, 5, 2, 3, 4, 5, 6, 6, 8, 8, 7, 7, 8, 8
  851. };
  852. int x_cg = x_c >> 2;
  853. int y_cg = y_c >> 2;
  854. int sig_ctx;
  855. int inc;
  856. if (x_c + y_c == 0) {
  857. sig_ctx = 0;
  858. } else if (log2_trafo_size == 2) {
  859. sig_ctx = ctx_idx_map[(y_c << 2) + x_c];
  860. } else {
  861. switch (prev_sig) {
  862. case 0: {
  863. int x_off = x_c & 3;
  864. int y_off = y_c & 3;
  865. sig_ctx = ((x_off + y_off) == 0) ? 2 : ((x_off + y_off) <= 2) ? 1 : 0;
  866. }
  867. break;
  868. case 1:
  869. sig_ctx = 2 - FFMIN(y_c & 3, 2);
  870. break;
  871. case 2:
  872. sig_ctx = 2 - FFMIN(x_c & 3, 2);
  873. break;
  874. default:
  875. sig_ctx = 2;
  876. }
  877. if (c_idx == 0 && (x_cg > 0 || y_cg > 0))
  878. sig_ctx += 3;
  879. if (log2_trafo_size == 3) {
  880. sig_ctx += (scan_idx == SCAN_DIAG) ? 9 : 15;
  881. } else {
  882. sig_ctx += c_idx ? 12 : 21;
  883. }
  884. }
  885. if (c_idx == 0) {
  886. inc = sig_ctx;
  887. } else {
  888. inc = sig_ctx + 27;
  889. }
  890. return GET_CABAC(elem_offset[SIGNIFICANT_COEFF_FLAG] + inc);
  891. }
  892. static av_always_inline int coeff_abs_level_greater1_flag_decode(HEVCContext *s, int c_idx, int inc)
  893. {
  894. if (c_idx > 0)
  895. inc += 16;
  896. return GET_CABAC(elem_offset[COEFF_ABS_LEVEL_GREATER1_FLAG] + inc);
  897. }
  898. static av_always_inline int coeff_abs_level_greater2_flag_decode(HEVCContext *s, int c_idx, int inc)
  899. {
  900. if (c_idx > 0)
  901. inc += 4;
  902. return GET_CABAC(elem_offset[COEFF_ABS_LEVEL_GREATER2_FLAG] + inc);
  903. }
  904. static av_always_inline int coeff_abs_level_remaining_decode(HEVCContext *s, int base_level, int rc_rice_param)
  905. {
  906. int prefix = 0;
  907. int suffix = 0;
  908. int last_coeff_abs_level_remaining;
  909. int i;
  910. while (prefix < CABAC_MAX_BIN && get_cabac_bypass(&s->HEVClc.cc))
  911. prefix++;
  912. if (prefix == CABAC_MAX_BIN)
  913. av_log(s->avctx, AV_LOG_ERROR, "CABAC_MAX_BIN : %d\n", prefix);
  914. if (prefix < 3) {
  915. for (i = 0; i < rc_rice_param; i++)
  916. suffix = (suffix << 1) | get_cabac_bypass(&s->HEVClc.cc);
  917. last_coeff_abs_level_remaining = (prefix << rc_rice_param) + suffix;
  918. } else {
  919. int prefix_minus3 = prefix - 3;
  920. for (i = 0; i < prefix_minus3 + rc_rice_param; i++)
  921. suffix = (suffix << 1) | get_cabac_bypass(&s->HEVClc.cc);
  922. last_coeff_abs_level_remaining = (((1 << prefix_minus3) + 3 - 1)
  923. << rc_rice_param) + suffix;
  924. }
  925. return last_coeff_abs_level_remaining;
  926. }
  927. static av_always_inline int coeff_sign_flag_decode(HEVCContext *s, uint8_t nb)
  928. {
  929. int i;
  930. int ret = 0;
  931. for (i = 0; i < nb; i++)
  932. ret = (ret << 1) | get_cabac_bypass(&s->HEVClc.cc);
  933. return ret;
  934. }
  935. void ff_hevc_hls_residual_coding(HEVCContext *s, int x0, int y0,
  936. int log2_trafo_size, enum ScanType scan_idx,
  937. int c_idx)
  938. {
  939. #define GET_COORD(offset, n) \
  940. do { \
  941. x_c = (scan_x_cg[offset >> 4] << 2) + scan_x_off[n]; \
  942. y_c = (scan_y_cg[offset >> 4] << 2) + scan_y_off[n]; \
  943. } while (0)
  944. HEVCLocalContext *lc = &s->HEVClc;
  945. int transform_skip_flag = 0;
  946. int last_significant_coeff_x, last_significant_coeff_y;
  947. int last_scan_pos;
  948. int n_end;
  949. int num_coeff = 0;
  950. int greater1_ctx = 1;
  951. int num_last_subset;
  952. int x_cg_last_sig, y_cg_last_sig;
  953. const uint8_t *scan_x_cg, *scan_y_cg, *scan_x_off, *scan_y_off;
  954. ptrdiff_t stride = s->frame->linesize[c_idx];
  955. int hshift = s->sps->hshift[c_idx];
  956. int vshift = s->sps->vshift[c_idx];
  957. uint8_t *dst = &s->frame->data[c_idx][(y0 >> vshift) * stride +
  958. ((x0 >> hshift) << s->sps->pixel_shift)];
  959. DECLARE_ALIGNED(16, int16_t, coeffs[MAX_TB_SIZE * MAX_TB_SIZE]) = {0};
  960. DECLARE_ALIGNED(8, uint8_t, significant_coeff_group_flag[8][8]) = {{0}};
  961. int trafo_size = 1 << log2_trafo_size;
  962. int i;
  963. int qp,shift,add,scale,scale_m;
  964. const uint8_t level_scale[] = { 40, 45, 51, 57, 64, 72 };
  965. const uint8_t *scale_matrix;
  966. uint8_t dc_scale;
  967. // Derive QP for dequant
  968. if (!lc->cu.cu_transquant_bypass_flag) {
  969. static const int qp_c[] = { 29, 30, 31, 32, 33, 33, 34, 34, 35, 35, 36, 36, 37, 37 };
  970. static const uint8_t rem6[51 + 2 * 6 + 1] = {
  971. 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2,
  972. 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5,
  973. 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3, 4, 5, 0, 1, 2, 3,
  974. };
  975. static const uint8_t div6[51 + 2 * 6 + 1] = {
  976. 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 3, 3, 3,
  977. 3, 3, 3, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 6, 6, 6, 6, 6, 6,
  978. 7, 7, 7, 7, 7, 7, 8, 8, 8, 8, 8, 8, 9, 9, 9, 9, 9, 9, 10, 10, 10, 10,
  979. };
  980. int qp_y = lc->qp_y;
  981. if (c_idx == 0) {
  982. qp = qp_y + s->sps->qp_bd_offset;
  983. } else {
  984. int qp_i, offset;
  985. if (c_idx == 1)
  986. offset = s->pps->cb_qp_offset + s->sh.slice_cb_qp_offset;
  987. else
  988. offset = s->pps->cr_qp_offset + s->sh.slice_cr_qp_offset;
  989. qp_i = av_clip_c(qp_y + offset, - s->sps->qp_bd_offset, 57);
  990. if (qp_i < 30)
  991. qp = qp_i;
  992. else if (qp_i > 43)
  993. qp = qp_i - 6;
  994. else
  995. qp = qp_c[qp_i - 30];
  996. qp += s->sps->qp_bd_offset;
  997. }
  998. shift = s->sps->bit_depth + log2_trafo_size - 5;
  999. add = 1 << (shift-1);
  1000. scale = level_scale[rem6[qp]] << (div6[qp]);
  1001. scale_m = 16; // default when no custom scaling lists.
  1002. dc_scale = 16;
  1003. if (s->sps->scaling_list_enable_flag) {
  1004. const ScalingList *sl = s->pps->pps_scaling_list_data_present_flag ?
  1005. &s->pps->scaling_list : &s->sps->scaling_list;
  1006. int matrix_id = lc->cu.pred_mode != MODE_INTRA;
  1007. if (log2_trafo_size != 5)
  1008. matrix_id = 3 * matrix_id + c_idx;
  1009. scale_matrix = sl->sl[log2_trafo_size - 2][matrix_id];
  1010. if (log2_trafo_size >= 4)
  1011. dc_scale = sl->sl_dc[log2_trafo_size - 4][matrix_id];
  1012. }
  1013. }
  1014. if (s->pps->transform_skip_enabled_flag && !lc->cu.cu_transquant_bypass_flag &&
  1015. log2_trafo_size == 2) {
  1016. transform_skip_flag = ff_hevc_transform_skip_flag_decode(s, c_idx);
  1017. }
  1018. last_significant_coeff_x =
  1019. last_significant_coeff_x_prefix_decode(s, c_idx, log2_trafo_size);
  1020. last_significant_coeff_y =
  1021. last_significant_coeff_y_prefix_decode(s, c_idx, log2_trafo_size);
  1022. if (last_significant_coeff_x > 3) {
  1023. int suffix = last_significant_coeff_suffix_decode(s, last_significant_coeff_x);
  1024. last_significant_coeff_x = (1 << ((last_significant_coeff_x >> 1) - 1)) *
  1025. (2 + (last_significant_coeff_x & 1)) +
  1026. suffix;
  1027. }
  1028. if (last_significant_coeff_y > 3) {
  1029. int suffix = last_significant_coeff_suffix_decode(s, last_significant_coeff_y);
  1030. last_significant_coeff_y = (1 << ((last_significant_coeff_y >> 1) - 1)) *
  1031. (2 + (last_significant_coeff_y & 1)) +
  1032. suffix;
  1033. }
  1034. if (scan_idx == SCAN_VERT)
  1035. FFSWAP(int, last_significant_coeff_x, last_significant_coeff_y);
  1036. x_cg_last_sig = last_significant_coeff_x >> 2;
  1037. y_cg_last_sig = last_significant_coeff_y >> 2;
  1038. switch (scan_idx) {
  1039. case SCAN_DIAG: {
  1040. int last_x_c = last_significant_coeff_x & 3;
  1041. int last_y_c = last_significant_coeff_y & 3;
  1042. scan_x_off = ff_hevc_diag_scan4x4_x;
  1043. scan_y_off = ff_hevc_diag_scan4x4_y;
  1044. num_coeff = diag_scan4x4_inv[last_y_c][last_x_c];
  1045. if (trafo_size == 4) {
  1046. scan_x_cg = scan_1x1;
  1047. scan_y_cg = scan_1x1;
  1048. } else if (trafo_size == 8) {
  1049. num_coeff += diag_scan2x2_inv[y_cg_last_sig][x_cg_last_sig] << 4;
  1050. scan_x_cg = diag_scan2x2_x;
  1051. scan_y_cg = diag_scan2x2_y;
  1052. } else if (trafo_size == 16) {
  1053. num_coeff += diag_scan4x4_inv[y_cg_last_sig][x_cg_last_sig] << 4;
  1054. scan_x_cg = ff_hevc_diag_scan4x4_x;
  1055. scan_y_cg = ff_hevc_diag_scan4x4_y;
  1056. } else { // trafo_size == 32
  1057. num_coeff += diag_scan8x8_inv[y_cg_last_sig][x_cg_last_sig] << 4;
  1058. scan_x_cg = ff_hevc_diag_scan8x8_x;
  1059. scan_y_cg = ff_hevc_diag_scan8x8_y;
  1060. }
  1061. break;
  1062. }
  1063. case SCAN_HORIZ:
  1064. scan_x_cg = horiz_scan2x2_x;
  1065. scan_y_cg = horiz_scan2x2_y;
  1066. scan_x_off = horiz_scan4x4_x;
  1067. scan_y_off = horiz_scan4x4_y;
  1068. num_coeff = horiz_scan8x8_inv[last_significant_coeff_y][last_significant_coeff_x];
  1069. break;
  1070. default: //SCAN_VERT
  1071. scan_x_cg = horiz_scan2x2_y;
  1072. scan_y_cg = horiz_scan2x2_x;
  1073. scan_x_off = horiz_scan4x4_y;
  1074. scan_y_off = horiz_scan4x4_x;
  1075. num_coeff = horiz_scan8x8_inv[last_significant_coeff_x][last_significant_coeff_y];
  1076. break;
  1077. }
  1078. num_coeff++;
  1079. num_last_subset = (num_coeff - 1) >> 4;
  1080. for (i = num_last_subset; i >= 0; i--) {
  1081. int n, m;
  1082. int x_cg, y_cg, x_c, y_c, pos;
  1083. int implicit_non_zero_coeff = 0;
  1084. int64_t trans_coeff_level;
  1085. int prev_sig = 0;
  1086. int offset = i << 4;
  1087. uint8_t significant_coeff_flag_idx[16];
  1088. uint8_t nb_significant_coeff_flag = 0;
  1089. x_cg = scan_x_cg[i];
  1090. y_cg = scan_y_cg[i];
  1091. if ((i < num_last_subset) && (i > 0)) {
  1092. int ctx_cg = 0;
  1093. if (x_cg < (1 << (log2_trafo_size - 2)) - 1)
  1094. ctx_cg += significant_coeff_group_flag[x_cg + 1][y_cg];
  1095. if (y_cg < (1 << (log2_trafo_size - 2)) - 1)
  1096. ctx_cg += significant_coeff_group_flag[x_cg][y_cg + 1];
  1097. significant_coeff_group_flag[x_cg][y_cg] =
  1098. significant_coeff_group_flag_decode(s, c_idx, ctx_cg);
  1099. implicit_non_zero_coeff = 1;
  1100. } else {
  1101. significant_coeff_group_flag[x_cg][y_cg] =
  1102. ((x_cg == x_cg_last_sig && y_cg == y_cg_last_sig) ||
  1103. (x_cg == 0 && y_cg == 0));
  1104. }
  1105. last_scan_pos = num_coeff - offset - 1;
  1106. if (i == num_last_subset) {
  1107. n_end = last_scan_pos - 1;
  1108. significant_coeff_flag_idx[0] = last_scan_pos;
  1109. nb_significant_coeff_flag = 1;
  1110. } else {
  1111. n_end = 15;
  1112. }
  1113. if (x_cg < ((1 << log2_trafo_size) - 1) >> 2)
  1114. prev_sig = significant_coeff_group_flag[x_cg + 1][y_cg];
  1115. if (y_cg < ((1 << log2_trafo_size) - 1) >> 2)
  1116. prev_sig += (significant_coeff_group_flag[x_cg][y_cg + 1] << 1);
  1117. for (n = n_end; n >= 0; n--) {
  1118. GET_COORD(offset, n);
  1119. if (significant_coeff_group_flag[x_cg][y_cg] &&
  1120. (n > 0 || implicit_non_zero_coeff == 0)) {
  1121. if (significant_coeff_flag_decode(s, c_idx, x_c, y_c, log2_trafo_size, scan_idx, prev_sig) == 1) {
  1122. significant_coeff_flag_idx[nb_significant_coeff_flag] = n;
  1123. nb_significant_coeff_flag++;
  1124. implicit_non_zero_coeff = 0;
  1125. }
  1126. } else {
  1127. int last_cg = (x_c == (x_cg << 2) && y_c == (y_cg << 2));
  1128. if (last_cg && implicit_non_zero_coeff && significant_coeff_group_flag[x_cg][y_cg]) {
  1129. significant_coeff_flag_idx[nb_significant_coeff_flag] = n;
  1130. nb_significant_coeff_flag++;
  1131. }
  1132. }
  1133. }
  1134. n_end = nb_significant_coeff_flag;
  1135. if (n_end) {
  1136. int first_nz_pos_in_cg = 16;
  1137. int last_nz_pos_in_cg = -1;
  1138. int c_rice_param = 0;
  1139. int first_greater1_coeff_idx = -1;
  1140. uint8_t coeff_abs_level_greater1_flag[16] = {0};
  1141. uint16_t coeff_sign_flag;
  1142. int sum_abs = 0;
  1143. int sign_hidden = 0;
  1144. // initialize first elem of coeff_bas_level_greater1_flag
  1145. int ctx_set = (i > 0 && c_idx == 0) ? 2 : 0;
  1146. if (!(i == num_last_subset) && greater1_ctx == 0)
  1147. ctx_set++;
  1148. greater1_ctx = 1;
  1149. last_nz_pos_in_cg = significant_coeff_flag_idx[0];
  1150. for (m = 0; m < (n_end > 8 ? 8 : n_end); m++) {
  1151. int n_idx = significant_coeff_flag_idx[m];
  1152. int inc = (ctx_set << 2) + greater1_ctx;
  1153. coeff_abs_level_greater1_flag[n_idx] =
  1154. coeff_abs_level_greater1_flag_decode(s, c_idx, inc);
  1155. if (coeff_abs_level_greater1_flag[n_idx]) {
  1156. greater1_ctx = 0;
  1157. } else if (greater1_ctx > 0 && greater1_ctx < 3) {
  1158. greater1_ctx++;
  1159. }
  1160. if (coeff_abs_level_greater1_flag[n_idx] &&
  1161. first_greater1_coeff_idx == -1)
  1162. first_greater1_coeff_idx = n_idx;
  1163. }
  1164. first_nz_pos_in_cg = significant_coeff_flag_idx[n_end - 1];
  1165. sign_hidden = (last_nz_pos_in_cg - first_nz_pos_in_cg >= 4 &&
  1166. !lc->cu.cu_transquant_bypass_flag);
  1167. if (first_greater1_coeff_idx != -1) {
  1168. coeff_abs_level_greater1_flag[first_greater1_coeff_idx] += coeff_abs_level_greater2_flag_decode(s, c_idx, ctx_set);
  1169. }
  1170. if (!s->pps->sign_data_hiding_flag || !sign_hidden ) {
  1171. coeff_sign_flag = coeff_sign_flag_decode(s, nb_significant_coeff_flag) << (16 - nb_significant_coeff_flag);
  1172. } else {
  1173. coeff_sign_flag = coeff_sign_flag_decode(s, nb_significant_coeff_flag - 1) << (16 - (nb_significant_coeff_flag - 1));
  1174. }
  1175. for (m = 0; m < n_end; m++) {
  1176. n = significant_coeff_flag_idx[m];
  1177. GET_COORD(offset, n);
  1178. trans_coeff_level = 1 + coeff_abs_level_greater1_flag[n];
  1179. if (trans_coeff_level == ((m < 8) ?
  1180. ((n == first_greater1_coeff_idx) ? 3 : 2) : 1)) {
  1181. int last_coeff_abs_level_remaining = coeff_abs_level_remaining_decode(s, trans_coeff_level, c_rice_param);
  1182. trans_coeff_level += last_coeff_abs_level_remaining;
  1183. if (trans_coeff_level > (3 << c_rice_param))
  1184. c_rice_param = FFMIN(c_rice_param + 1, 4);
  1185. }
  1186. if (s->pps->sign_data_hiding_flag && sign_hidden) {
  1187. sum_abs += trans_coeff_level;
  1188. if (n == first_nz_pos_in_cg && (sum_abs&1))
  1189. trans_coeff_level = -trans_coeff_level;
  1190. }
  1191. if (coeff_sign_flag >> 15)
  1192. trans_coeff_level = -trans_coeff_level;
  1193. coeff_sign_flag <<= 1;
  1194. if(!lc->cu.cu_transquant_bypass_flag) {
  1195. if(s->sps->scaling_list_enable_flag) {
  1196. if(y_c || x_c || log2_trafo_size < 4) {
  1197. switch(log2_trafo_size) {
  1198. case 3: pos = (y_c << 3) + x_c; break;
  1199. case 4: pos = ((y_c >> 1) << 3) + (x_c >> 1); break;
  1200. case 5: pos = ((y_c >> 2) << 3) + (x_c >> 2); break;
  1201. default: pos = (y_c << 2) + x_c;
  1202. }
  1203. scale_m = scale_matrix[pos];
  1204. } else {
  1205. scale_m = dc_scale;
  1206. }
  1207. }
  1208. trans_coeff_level = (trans_coeff_level * (int64_t)scale * (int64_t)scale_m + add) >> shift;
  1209. if(trans_coeff_level < 0) {
  1210. if((~trans_coeff_level) & 0xFffffffffff8000)
  1211. trans_coeff_level = -32768;
  1212. } else {
  1213. if(trans_coeff_level & 0xffffffffffff8000)
  1214. trans_coeff_level = 32767;
  1215. }
  1216. }
  1217. coeffs[y_c * trafo_size + x_c] = trans_coeff_level;
  1218. }
  1219. }
  1220. }
  1221. if (lc->cu.cu_transquant_bypass_flag) {
  1222. s->hevcdsp.transquant_bypass[log2_trafo_size-2](dst, coeffs, stride);
  1223. } else {
  1224. if (transform_skip_flag)
  1225. s->hevcdsp.transform_skip(dst, coeffs, stride);
  1226. else if (lc->cu.pred_mode == MODE_INTRA && c_idx == 0 && log2_trafo_size == 2)
  1227. s->hevcdsp.transform_4x4_luma_add(dst, coeffs, stride);
  1228. else
  1229. s->hevcdsp.transform_add[log2_trafo_size-2](dst, coeffs, stride);
  1230. }
  1231. }
  1232. void ff_hevc_hls_mvd_coding(HEVCContext *s, int x0, int y0, int log2_cb_size)
  1233. {
  1234. HEVCLocalContext *lc = &s->HEVClc;
  1235. int x = abs_mvd_greater0_flag_decode(s);
  1236. int y = abs_mvd_greater0_flag_decode(s);
  1237. if (x)
  1238. x += abs_mvd_greater1_flag_decode(s);
  1239. if (y)
  1240. y += abs_mvd_greater1_flag_decode(s);
  1241. switch (x) {
  1242. case 2: lc->pu.mvd.x = mvd_decode(s); break;
  1243. case 1: lc->pu.mvd.x = mvd_sign_flag_decode(s); break;
  1244. case 0: lc->pu.mvd.x = 0; break;
  1245. }
  1246. switch (y) {
  1247. case 2: lc->pu.mvd.y = mvd_decode(s); break;
  1248. case 1: lc->pu.mvd.y = mvd_sign_flag_decode(s); break;
  1249. case 0: lc->pu.mvd.y = 0; break;
  1250. }
  1251. }