You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1460 lines
55KB

  1. /*
  2. * HEVC Parameter Set decoding
  3. *
  4. * Copyright (C) 2012 - 2013 Guillaume Martres
  5. * Copyright (C) 2012 - 2013 Mickael Raulet
  6. * Copyright (C) 2012 - 2013 Gildas Cocherel
  7. * Copyright (C) 2013 Vittorio Giovara
  8. *
  9. * This file is part of FFmpeg.
  10. *
  11. * FFmpeg is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * FFmpeg is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with FFmpeg; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include "libavutil/imgutils.h"
  26. #include "golomb.h"
  27. #include "hevc.h"
  28. static const uint8_t default_scaling_list_intra[] = {
  29. 16, 16, 16, 16, 17, 18, 21, 24,
  30. 16, 16, 16, 16, 17, 19, 22, 25,
  31. 16, 16, 17, 18, 20, 22, 25, 29,
  32. 16, 16, 18, 21, 24, 27, 31, 36,
  33. 17, 17, 20, 24, 30, 35, 41, 47,
  34. 18, 19, 22, 27, 35, 44, 54, 65,
  35. 21, 22, 25, 31, 41, 54, 70, 88,
  36. 24, 25, 29, 36, 47, 65, 88, 115
  37. };
  38. static const uint8_t default_scaling_list_inter[] = {
  39. 16, 16, 16, 16, 17, 18, 20, 24,
  40. 16, 16, 16, 17, 18, 20, 24, 25,
  41. 16, 16, 17, 18, 20, 24, 25, 28,
  42. 16, 17, 18, 20, 24, 25, 28, 33,
  43. 17, 18, 20, 24, 25, 28, 33, 41,
  44. 18, 20, 24, 25, 28, 33, 41, 54,
  45. 20, 24, 25, 28, 33, 41, 54, 71,
  46. 24, 25, 28, 33, 41, 54, 71, 91
  47. };
  48. static const AVRational vui_sar[] = {
  49. { 0, 1 },
  50. { 1, 1 },
  51. { 12, 11 },
  52. { 10, 11 },
  53. { 16, 11 },
  54. { 40, 33 },
  55. { 24, 11 },
  56. { 20, 11 },
  57. { 32, 11 },
  58. { 80, 33 },
  59. { 18, 11 },
  60. { 15, 11 },
  61. { 64, 33 },
  62. { 160, 99 },
  63. { 4, 3 },
  64. { 3, 2 },
  65. { 2, 1 },
  66. };
  67. int ff_hevc_decode_short_term_rps(HEVCContext *s, ShortTermRPS *rps,
  68. const HEVCSPS *sps, int is_slice_header)
  69. {
  70. HEVCLocalContext *lc = s->HEVClc;
  71. uint8_t rps_predict = 0;
  72. int delta_poc;
  73. int k0 = 0;
  74. int k1 = 0;
  75. int k = 0;
  76. int i;
  77. GetBitContext *gb = &lc->gb;
  78. if (rps != sps->st_rps && sps->nb_st_rps)
  79. rps_predict = get_bits1(gb);
  80. if (rps_predict) {
  81. const ShortTermRPS *rps_ridx;
  82. int delta_rps;
  83. unsigned abs_delta_rps;
  84. uint8_t use_delta_flag = 0;
  85. uint8_t delta_rps_sign;
  86. if (is_slice_header) {
  87. unsigned int delta_idx = get_ue_golomb_long(gb) + 1;
  88. if (delta_idx > sps->nb_st_rps) {
  89. av_log(s->avctx, AV_LOG_ERROR,
  90. "Invalid value of delta_idx in slice header RPS: %d > %d.\n",
  91. delta_idx, sps->nb_st_rps);
  92. return AVERROR_INVALIDDATA;
  93. }
  94. rps_ridx = &sps->st_rps[sps->nb_st_rps - delta_idx];
  95. } else
  96. rps_ridx = &sps->st_rps[rps - sps->st_rps - 1];
  97. delta_rps_sign = get_bits1(gb);
  98. abs_delta_rps = get_ue_golomb_long(gb) + 1;
  99. if (abs_delta_rps < 1 || abs_delta_rps > 32768) {
  100. av_log(s->avctx, AV_LOG_ERROR,
  101. "Invalid value of abs_delta_rps: %d\n",
  102. abs_delta_rps);
  103. return AVERROR_INVALIDDATA;
  104. }
  105. delta_rps = (1 - (delta_rps_sign << 1)) * abs_delta_rps;
  106. for (i = 0; i <= rps_ridx->num_delta_pocs; i++) {
  107. int used = rps->used[k] = get_bits1(gb);
  108. if (!used)
  109. use_delta_flag = get_bits1(gb);
  110. if (used || use_delta_flag) {
  111. if (i < rps_ridx->num_delta_pocs)
  112. delta_poc = delta_rps + rps_ridx->delta_poc[i];
  113. else
  114. delta_poc = delta_rps;
  115. rps->delta_poc[k] = delta_poc;
  116. if (delta_poc < 0)
  117. k0++;
  118. else
  119. k1++;
  120. k++;
  121. }
  122. }
  123. rps->num_delta_pocs = k;
  124. rps->num_negative_pics = k0;
  125. // sort in increasing order (smallest first)
  126. if (rps->num_delta_pocs != 0) {
  127. int used, tmp;
  128. for (i = 1; i < rps->num_delta_pocs; i++) {
  129. delta_poc = rps->delta_poc[i];
  130. used = rps->used[i];
  131. for (k = i - 1; k >= 0; k--) {
  132. tmp = rps->delta_poc[k];
  133. if (delta_poc < tmp) {
  134. rps->delta_poc[k + 1] = tmp;
  135. rps->used[k + 1] = rps->used[k];
  136. rps->delta_poc[k] = delta_poc;
  137. rps->used[k] = used;
  138. }
  139. }
  140. }
  141. }
  142. if ((rps->num_negative_pics >> 1) != 0) {
  143. int used;
  144. k = rps->num_negative_pics - 1;
  145. // flip the negative values to largest first
  146. for (i = 0; i < rps->num_negative_pics >> 1; i++) {
  147. delta_poc = rps->delta_poc[i];
  148. used = rps->used[i];
  149. rps->delta_poc[i] = rps->delta_poc[k];
  150. rps->used[i] = rps->used[k];
  151. rps->delta_poc[k] = delta_poc;
  152. rps->used[k] = used;
  153. k--;
  154. }
  155. }
  156. } else {
  157. unsigned int prev, nb_positive_pics;
  158. rps->num_negative_pics = get_ue_golomb_long(gb);
  159. nb_positive_pics = get_ue_golomb_long(gb);
  160. if (rps->num_negative_pics >= MAX_REFS ||
  161. nb_positive_pics >= MAX_REFS) {
  162. av_log(s->avctx, AV_LOG_ERROR, "Too many refs in a short term RPS.\n");
  163. return AVERROR_INVALIDDATA;
  164. }
  165. rps->num_delta_pocs = rps->num_negative_pics + nb_positive_pics;
  166. if (rps->num_delta_pocs) {
  167. prev = 0;
  168. for (i = 0; i < rps->num_negative_pics; i++) {
  169. delta_poc = get_ue_golomb_long(gb) + 1;
  170. prev -= delta_poc;
  171. rps->delta_poc[i] = prev;
  172. rps->used[i] = get_bits1(gb);
  173. }
  174. prev = 0;
  175. for (i = 0; i < nb_positive_pics; i++) {
  176. delta_poc = get_ue_golomb_long(gb) + 1;
  177. prev += delta_poc;
  178. rps->delta_poc[rps->num_negative_pics + i] = prev;
  179. rps->used[rps->num_negative_pics + i] = get_bits1(gb);
  180. }
  181. }
  182. }
  183. return 0;
  184. }
  185. static void decode_profile_tier_level(HEVCContext *s, PTLCommon *ptl)
  186. {
  187. int i;
  188. HEVCLocalContext *lc = s->HEVClc;
  189. GetBitContext *gb = &lc->gb;
  190. ptl->profile_space = get_bits(gb, 2);
  191. ptl->tier_flag = get_bits1(gb);
  192. ptl->profile_idc = get_bits(gb, 5);
  193. if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN)
  194. av_log(s->avctx, AV_LOG_DEBUG, "Main profile bitstream\n");
  195. else if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN_10)
  196. av_log(s->avctx, AV_LOG_DEBUG, "Main 10 profile bitstream\n");
  197. else if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN_STILL_PICTURE)
  198. av_log(s->avctx, AV_LOG_DEBUG, "Main Still Picture profile bitstream\n");
  199. else if (ptl->profile_idc == FF_PROFILE_HEVC_REXT)
  200. av_log(s->avctx, AV_LOG_DEBUG, "Range Extension profile bitstream\n");
  201. else
  202. av_log(s->avctx, AV_LOG_WARNING, "Unknown HEVC profile: %d\n", ptl->profile_idc);
  203. for (i = 0; i < 32; i++)
  204. ptl->profile_compatibility_flag[i] = get_bits1(gb);
  205. ptl->progressive_source_flag = get_bits1(gb);
  206. ptl->interlaced_source_flag = get_bits1(gb);
  207. ptl->non_packed_constraint_flag = get_bits1(gb);
  208. ptl->frame_only_constraint_flag = get_bits1(gb);
  209. skip_bits(gb, 16); // XXX_reserved_zero_44bits[0..15]
  210. skip_bits(gb, 16); // XXX_reserved_zero_44bits[16..31]
  211. skip_bits(gb, 12); // XXX_reserved_zero_44bits[32..43]
  212. }
  213. static void parse_ptl(HEVCContext *s, PTL *ptl, int max_num_sub_layers)
  214. {
  215. int i;
  216. HEVCLocalContext *lc = s->HEVClc;
  217. GetBitContext *gb = &lc->gb;
  218. decode_profile_tier_level(s, &ptl->general_ptl);
  219. ptl->general_ptl.level_idc = get_bits(gb, 8);
  220. for (i = 0; i < max_num_sub_layers - 1; i++) {
  221. ptl->sub_layer_profile_present_flag[i] = get_bits1(gb);
  222. ptl->sub_layer_level_present_flag[i] = get_bits1(gb);
  223. }
  224. if (max_num_sub_layers - 1> 0)
  225. for (i = max_num_sub_layers - 1; i < 8; i++)
  226. skip_bits(gb, 2); // reserved_zero_2bits[i]
  227. for (i = 0; i < max_num_sub_layers - 1; i++) {
  228. if (ptl->sub_layer_profile_present_flag[i])
  229. decode_profile_tier_level(s, &ptl->sub_layer_ptl[i]);
  230. if (ptl->sub_layer_level_present_flag[i])
  231. ptl->sub_layer_ptl[i].level_idc = get_bits(gb, 8);
  232. }
  233. }
  234. static void decode_sublayer_hrd(HEVCContext *s, unsigned int nb_cpb,
  235. int subpic_params_present)
  236. {
  237. GetBitContext *gb = &s->HEVClc->gb;
  238. int i;
  239. for (i = 0; i < nb_cpb; i++) {
  240. get_ue_golomb_long(gb); // bit_rate_value_minus1
  241. get_ue_golomb_long(gb); // cpb_size_value_minus1
  242. if (subpic_params_present) {
  243. get_ue_golomb_long(gb); // cpb_size_du_value_minus1
  244. get_ue_golomb_long(gb); // bit_rate_du_value_minus1
  245. }
  246. skip_bits1(gb); // cbr_flag
  247. }
  248. }
  249. static int decode_hrd(HEVCContext *s, int common_inf_present,
  250. int max_sublayers)
  251. {
  252. GetBitContext *gb = &s->HEVClc->gb;
  253. int nal_params_present = 0, vcl_params_present = 0;
  254. int subpic_params_present = 0;
  255. int i;
  256. if (common_inf_present) {
  257. nal_params_present = get_bits1(gb);
  258. vcl_params_present = get_bits1(gb);
  259. if (nal_params_present || vcl_params_present) {
  260. subpic_params_present = get_bits1(gb);
  261. if (subpic_params_present) {
  262. skip_bits(gb, 8); // tick_divisor_minus2
  263. skip_bits(gb, 5); // du_cpb_removal_delay_increment_length_minus1
  264. skip_bits(gb, 1); // sub_pic_cpb_params_in_pic_timing_sei_flag
  265. skip_bits(gb, 5); // dpb_output_delay_du_length_minus1
  266. }
  267. skip_bits(gb, 4); // bit_rate_scale
  268. skip_bits(gb, 4); // cpb_size_scale
  269. if (subpic_params_present)
  270. skip_bits(gb, 4); // cpb_size_du_scale
  271. skip_bits(gb, 5); // initial_cpb_removal_delay_length_minus1
  272. skip_bits(gb, 5); // au_cpb_removal_delay_length_minus1
  273. skip_bits(gb, 5); // dpb_output_delay_length_minus1
  274. }
  275. }
  276. for (i = 0; i < max_sublayers; i++) {
  277. int low_delay = 0;
  278. unsigned int nb_cpb = 1;
  279. int fixed_rate = get_bits1(gb);
  280. if (!fixed_rate)
  281. fixed_rate = get_bits1(gb);
  282. if (fixed_rate)
  283. get_ue_golomb_long(gb); // elemental_duration_in_tc_minus1
  284. else
  285. low_delay = get_bits1(gb);
  286. if (!low_delay) {
  287. nb_cpb = get_ue_golomb_long(gb) + 1;
  288. if (nb_cpb < 1 || nb_cpb > 32) {
  289. av_log(s->avctx, AV_LOG_ERROR, "nb_cpb %d invalid\n", nb_cpb);
  290. return AVERROR_INVALIDDATA;
  291. }
  292. }
  293. if (nal_params_present)
  294. decode_sublayer_hrd(s, nb_cpb, subpic_params_present);
  295. if (vcl_params_present)
  296. decode_sublayer_hrd(s, nb_cpb, subpic_params_present);
  297. }
  298. return 0;
  299. }
  300. int ff_hevc_decode_nal_vps(HEVCContext *s)
  301. {
  302. int i,j;
  303. GetBitContext *gb = &s->HEVClc->gb;
  304. int vps_id = 0;
  305. HEVCVPS *vps;
  306. AVBufferRef *vps_buf = av_buffer_allocz(sizeof(*vps));
  307. if (!vps_buf)
  308. return AVERROR(ENOMEM);
  309. vps = (HEVCVPS*)vps_buf->data;
  310. av_log(s->avctx, AV_LOG_DEBUG, "Decoding VPS\n");
  311. vps_id = get_bits(gb, 4);
  312. if (vps_id >= MAX_VPS_COUNT) {
  313. av_log(s->avctx, AV_LOG_ERROR, "VPS id out of range: %d\n", vps_id);
  314. goto err;
  315. }
  316. if (get_bits(gb, 2) != 3) { // vps_reserved_three_2bits
  317. av_log(s->avctx, AV_LOG_ERROR, "vps_reserved_three_2bits is not three\n");
  318. goto err;
  319. }
  320. vps->vps_max_layers = get_bits(gb, 6) + 1;
  321. vps->vps_max_sub_layers = get_bits(gb, 3) + 1;
  322. vps->vps_temporal_id_nesting_flag = get_bits1(gb);
  323. if (get_bits(gb, 16) != 0xffff) { // vps_reserved_ffff_16bits
  324. av_log(s->avctx, AV_LOG_ERROR, "vps_reserved_ffff_16bits is not 0xffff\n");
  325. goto err;
  326. }
  327. if (vps->vps_max_sub_layers > MAX_SUB_LAYERS) {
  328. av_log(s->avctx, AV_LOG_ERROR, "vps_max_sub_layers out of range: %d\n",
  329. vps->vps_max_sub_layers);
  330. goto err;
  331. }
  332. parse_ptl(s, &vps->ptl, vps->vps_max_sub_layers);
  333. vps->vps_sub_layer_ordering_info_present_flag = get_bits1(gb);
  334. i = vps->vps_sub_layer_ordering_info_present_flag ? 0 : vps->vps_max_sub_layers - 1;
  335. for (; i < vps->vps_max_sub_layers; i++) {
  336. vps->vps_max_dec_pic_buffering[i] = get_ue_golomb_long(gb) + 1;
  337. vps->vps_num_reorder_pics[i] = get_ue_golomb_long(gb);
  338. vps->vps_max_latency_increase[i] = get_ue_golomb_long(gb) - 1;
  339. if (vps->vps_max_dec_pic_buffering[i] > MAX_DPB_SIZE || !vps->vps_max_dec_pic_buffering[i]) {
  340. av_log(s->avctx, AV_LOG_ERROR, "vps_max_dec_pic_buffering_minus1 out of range: %d\n",
  341. vps->vps_max_dec_pic_buffering[i] - 1);
  342. goto err;
  343. }
  344. if (vps->vps_num_reorder_pics[i] > vps->vps_max_dec_pic_buffering[i] - 1) {
  345. av_log(s->avctx, AV_LOG_WARNING, "vps_max_num_reorder_pics out of range: %d\n",
  346. vps->vps_num_reorder_pics[i]);
  347. if (s->avctx->err_recognition & AV_EF_EXPLODE)
  348. goto err;
  349. }
  350. }
  351. vps->vps_max_layer_id = get_bits(gb, 6);
  352. vps->vps_num_layer_sets = get_ue_golomb_long(gb) + 1;
  353. if ((vps->vps_num_layer_sets - 1LL) * (vps->vps_max_layer_id + 1LL) > get_bits_left(gb)) {
  354. av_log(s->avctx, AV_LOG_ERROR, "too many layer_id_included_flags\n");
  355. goto err;
  356. }
  357. for (i = 1; i < vps->vps_num_layer_sets; i++)
  358. for (j = 0; j <= vps->vps_max_layer_id; j++)
  359. skip_bits(gb, 1); // layer_id_included_flag[i][j]
  360. vps->vps_timing_info_present_flag = get_bits1(gb);
  361. if (vps->vps_timing_info_present_flag) {
  362. vps->vps_num_units_in_tick = get_bits_long(gb, 32);
  363. vps->vps_time_scale = get_bits_long(gb, 32);
  364. vps->vps_poc_proportional_to_timing_flag = get_bits1(gb);
  365. if (vps->vps_poc_proportional_to_timing_flag)
  366. vps->vps_num_ticks_poc_diff_one = get_ue_golomb_long(gb) + 1;
  367. vps->vps_num_hrd_parameters = get_ue_golomb_long(gb);
  368. for (i = 0; i < vps->vps_num_hrd_parameters; i++) {
  369. int common_inf_present = 1;
  370. get_ue_golomb_long(gb); // hrd_layer_set_idx
  371. if (i)
  372. common_inf_present = get_bits1(gb);
  373. decode_hrd(s, common_inf_present, vps->vps_max_sub_layers);
  374. }
  375. }
  376. get_bits1(gb); /* vps_extension_flag */
  377. av_buffer_unref(&s->vps_list[vps_id]);
  378. s->vps_list[vps_id] = vps_buf;
  379. return 0;
  380. err:
  381. av_buffer_unref(&vps_buf);
  382. return AVERROR_INVALIDDATA;
  383. }
  384. static void decode_vui(HEVCContext *s, HEVCSPS *sps)
  385. {
  386. VUI *vui = &sps->vui;
  387. GetBitContext *gb = &s->HEVClc->gb;
  388. int sar_present;
  389. av_log(s->avctx, AV_LOG_DEBUG, "Decoding VUI\n");
  390. sar_present = get_bits1(gb);
  391. if (sar_present) {
  392. uint8_t sar_idx = get_bits(gb, 8);
  393. if (sar_idx < FF_ARRAY_ELEMS(vui_sar))
  394. vui->sar = vui_sar[sar_idx];
  395. else if (sar_idx == 255) {
  396. vui->sar.num = get_bits(gb, 16);
  397. vui->sar.den = get_bits(gb, 16);
  398. } else
  399. av_log(s->avctx, AV_LOG_WARNING,
  400. "Unknown SAR index: %u.\n", sar_idx);
  401. }
  402. vui->overscan_info_present_flag = get_bits1(gb);
  403. if (vui->overscan_info_present_flag)
  404. vui->overscan_appropriate_flag = get_bits1(gb);
  405. vui->video_signal_type_present_flag = get_bits1(gb);
  406. if (vui->video_signal_type_present_flag) {
  407. vui->video_format = get_bits(gb, 3);
  408. vui->video_full_range_flag = get_bits1(gb);
  409. vui->colour_description_present_flag = get_bits1(gb);
  410. if (vui->video_full_range_flag && sps->pix_fmt == AV_PIX_FMT_YUV420P)
  411. sps->pix_fmt = AV_PIX_FMT_YUVJ420P;
  412. if (vui->colour_description_present_flag) {
  413. vui->colour_primaries = get_bits(gb, 8);
  414. vui->transfer_characteristic = get_bits(gb, 8);
  415. vui->matrix_coeffs = get_bits(gb, 8);
  416. // Set invalid values to "unspecified"
  417. if (vui->colour_primaries >= AVCOL_PRI_NB)
  418. vui->colour_primaries = AVCOL_PRI_UNSPECIFIED;
  419. if (vui->transfer_characteristic >= AVCOL_TRC_NB)
  420. vui->transfer_characteristic = AVCOL_TRC_UNSPECIFIED;
  421. if (vui->matrix_coeffs >= AVCOL_SPC_NB)
  422. vui->matrix_coeffs = AVCOL_SPC_UNSPECIFIED;
  423. }
  424. }
  425. vui->chroma_loc_info_present_flag = get_bits1(gb);
  426. if (vui->chroma_loc_info_present_flag) {
  427. vui->chroma_sample_loc_type_top_field = get_ue_golomb_long(gb);
  428. vui->chroma_sample_loc_type_bottom_field = get_ue_golomb_long(gb);
  429. }
  430. vui->neutra_chroma_indication_flag = get_bits1(gb);
  431. vui->field_seq_flag = get_bits1(gb);
  432. vui->frame_field_info_present_flag = get_bits1(gb);
  433. vui->default_display_window_flag = get_bits1(gb);
  434. if (vui->default_display_window_flag) {
  435. //TODO: * 2 is only valid for 420
  436. vui->def_disp_win.left_offset = get_ue_golomb_long(gb) * 2;
  437. vui->def_disp_win.right_offset = get_ue_golomb_long(gb) * 2;
  438. vui->def_disp_win.top_offset = get_ue_golomb_long(gb) * 2;
  439. vui->def_disp_win.bottom_offset = get_ue_golomb_long(gb) * 2;
  440. if (s->apply_defdispwin &&
  441. s->avctx->flags2 & CODEC_FLAG2_IGNORE_CROP) {
  442. av_log(s->avctx, AV_LOG_DEBUG,
  443. "discarding vui default display window, "
  444. "original values are l:%u r:%u t:%u b:%u\n",
  445. vui->def_disp_win.left_offset,
  446. vui->def_disp_win.right_offset,
  447. vui->def_disp_win.top_offset,
  448. vui->def_disp_win.bottom_offset);
  449. vui->def_disp_win.left_offset =
  450. vui->def_disp_win.right_offset =
  451. vui->def_disp_win.top_offset =
  452. vui->def_disp_win.bottom_offset = 0;
  453. }
  454. }
  455. vui->vui_timing_info_present_flag = get_bits1(gb);
  456. if (vui->vui_timing_info_present_flag) {
  457. vui->vui_num_units_in_tick = get_bits_long(gb, 32);
  458. vui->vui_time_scale = get_bits_long(gb, 32);
  459. vui->vui_poc_proportional_to_timing_flag = get_bits1(gb);
  460. if (vui->vui_poc_proportional_to_timing_flag)
  461. vui->vui_num_ticks_poc_diff_one_minus1 = get_ue_golomb_long(gb);
  462. vui->vui_hrd_parameters_present_flag = get_bits1(gb);
  463. if (vui->vui_hrd_parameters_present_flag)
  464. decode_hrd(s, 1, sps->max_sub_layers);
  465. }
  466. vui->bitstream_restriction_flag = get_bits1(gb);
  467. if (vui->bitstream_restriction_flag) {
  468. vui->tiles_fixed_structure_flag = get_bits1(gb);
  469. vui->motion_vectors_over_pic_boundaries_flag = get_bits1(gb);
  470. vui->restricted_ref_pic_lists_flag = get_bits1(gb);
  471. vui->min_spatial_segmentation_idc = get_ue_golomb_long(gb);
  472. vui->max_bytes_per_pic_denom = get_ue_golomb_long(gb);
  473. vui->max_bits_per_min_cu_denom = get_ue_golomb_long(gb);
  474. vui->log2_max_mv_length_horizontal = get_ue_golomb_long(gb);
  475. vui->log2_max_mv_length_vertical = get_ue_golomb_long(gb);
  476. }
  477. }
  478. static void set_default_scaling_list_data(ScalingList *sl)
  479. {
  480. int matrixId;
  481. for (matrixId = 0; matrixId < 6; matrixId++) {
  482. // 4x4 default is 16
  483. memset(sl->sl[0][matrixId], 16, 16);
  484. sl->sl_dc[0][matrixId] = 16; // default for 16x16
  485. sl->sl_dc[1][matrixId] = 16; // default for 32x32
  486. }
  487. memcpy(sl->sl[1][0], default_scaling_list_intra, 64);
  488. memcpy(sl->sl[1][1], default_scaling_list_intra, 64);
  489. memcpy(sl->sl[1][2], default_scaling_list_intra, 64);
  490. memcpy(sl->sl[1][3], default_scaling_list_inter, 64);
  491. memcpy(sl->sl[1][4], default_scaling_list_inter, 64);
  492. memcpy(sl->sl[1][5], default_scaling_list_inter, 64);
  493. memcpy(sl->sl[2][0], default_scaling_list_intra, 64);
  494. memcpy(sl->sl[2][1], default_scaling_list_intra, 64);
  495. memcpy(sl->sl[2][2], default_scaling_list_intra, 64);
  496. memcpy(sl->sl[2][3], default_scaling_list_inter, 64);
  497. memcpy(sl->sl[2][4], default_scaling_list_inter, 64);
  498. memcpy(sl->sl[2][5], default_scaling_list_inter, 64);
  499. memcpy(sl->sl[3][0], default_scaling_list_intra, 64);
  500. memcpy(sl->sl[3][1], default_scaling_list_intra, 64);
  501. memcpy(sl->sl[3][2], default_scaling_list_intra, 64);
  502. memcpy(sl->sl[3][3], default_scaling_list_inter, 64);
  503. memcpy(sl->sl[3][4], default_scaling_list_inter, 64);
  504. memcpy(sl->sl[3][5], default_scaling_list_inter, 64);
  505. }
  506. static int scaling_list_data(HEVCContext *s, ScalingList *sl, HEVCSPS *sps)
  507. {
  508. GetBitContext *gb = &s->HEVClc->gb;
  509. uint8_t scaling_list_pred_mode_flag;
  510. int32_t scaling_list_dc_coef[2][6];
  511. int size_id, matrix_id, pos;
  512. int i;
  513. for (size_id = 0; size_id < 4; size_id++)
  514. for (matrix_id = 0; matrix_id < 6; matrix_id += ((size_id == 3) ? 3 : 1)) {
  515. scaling_list_pred_mode_flag = get_bits1(gb);
  516. if (!scaling_list_pred_mode_flag) {
  517. unsigned int delta = get_ue_golomb_long(gb);
  518. /* Only need to handle non-zero delta. Zero means default,
  519. * which should already be in the arrays. */
  520. if (delta) {
  521. // Copy from previous array.
  522. if (matrix_id < delta) {
  523. av_log(s->avctx, AV_LOG_ERROR,
  524. "Invalid delta in scaling list data: %d.\n", delta);
  525. return AVERROR_INVALIDDATA;
  526. }
  527. memcpy(sl->sl[size_id][matrix_id],
  528. sl->sl[size_id][matrix_id - delta],
  529. size_id > 0 ? 64 : 16);
  530. if (size_id > 1)
  531. sl->sl_dc[size_id - 2][matrix_id] = sl->sl_dc[size_id - 2][matrix_id - delta];
  532. }
  533. } else {
  534. int next_coef, coef_num;
  535. int32_t scaling_list_delta_coef;
  536. next_coef = 8;
  537. coef_num = FFMIN(64, 1 << (4 + (size_id << 1)));
  538. if (size_id > 1) {
  539. scaling_list_dc_coef[size_id - 2][matrix_id] = get_se_golomb(gb) + 8;
  540. next_coef = scaling_list_dc_coef[size_id - 2][matrix_id];
  541. sl->sl_dc[size_id - 2][matrix_id] = next_coef;
  542. }
  543. for (i = 0; i < coef_num; i++) {
  544. if (size_id == 0)
  545. pos = 4 * ff_hevc_diag_scan4x4_y[i] +
  546. ff_hevc_diag_scan4x4_x[i];
  547. else
  548. pos = 8 * ff_hevc_diag_scan8x8_y[i] +
  549. ff_hevc_diag_scan8x8_x[i];
  550. scaling_list_delta_coef = get_se_golomb(gb);
  551. next_coef = (next_coef + scaling_list_delta_coef + 256) % 256;
  552. sl->sl[size_id][matrix_id][pos] = next_coef;
  553. }
  554. }
  555. }
  556. if (sps->chroma_format_idc == 3) {
  557. for (i = 0; i < 64; i++) {
  558. sl->sl[3][1][i] = sl->sl[2][1][i];
  559. sl->sl[3][2][i] = sl->sl[2][2][i];
  560. sl->sl[3][4][i] = sl->sl[2][4][i];
  561. sl->sl[3][5][i] = sl->sl[2][5][i];
  562. }
  563. sl->sl_dc[1][1] = sl->sl_dc[0][1];
  564. sl->sl_dc[1][2] = sl->sl_dc[0][2];
  565. sl->sl_dc[1][4] = sl->sl_dc[0][4];
  566. sl->sl_dc[1][5] = sl->sl_dc[0][5];
  567. }
  568. return 0;
  569. }
  570. int ff_hevc_decode_nal_sps(HEVCContext *s)
  571. {
  572. const AVPixFmtDescriptor *desc;
  573. GetBitContext *gb = &s->HEVClc->gb;
  574. int ret = 0;
  575. unsigned int sps_id = 0;
  576. int log2_diff_max_min_transform_block_size;
  577. int bit_depth_chroma, start, vui_present, sublayer_ordering_info;
  578. int i;
  579. HEVCSPS *sps;
  580. AVBufferRef *sps_buf = av_buffer_allocz(sizeof(*sps));
  581. if (!sps_buf)
  582. return AVERROR(ENOMEM);
  583. sps = (HEVCSPS*)sps_buf->data;
  584. av_log(s->avctx, AV_LOG_DEBUG, "Decoding SPS\n");
  585. // Coded parameters
  586. sps->vps_id = get_bits(gb, 4);
  587. if (sps->vps_id >= MAX_VPS_COUNT) {
  588. av_log(s->avctx, AV_LOG_ERROR, "VPS id out of range: %d\n", sps->vps_id);
  589. ret = AVERROR_INVALIDDATA;
  590. goto err;
  591. }
  592. if (!s->vps_list[sps->vps_id]) {
  593. av_log(s->avctx, AV_LOG_ERROR, "VPS %d does not exist\n",
  594. sps->vps_id);
  595. ret = AVERROR_INVALIDDATA;
  596. goto err;
  597. }
  598. sps->max_sub_layers = get_bits(gb, 3) + 1;
  599. if (sps->max_sub_layers > MAX_SUB_LAYERS) {
  600. av_log(s->avctx, AV_LOG_ERROR, "sps_max_sub_layers out of range: %d\n",
  601. sps->max_sub_layers);
  602. ret = AVERROR_INVALIDDATA;
  603. goto err;
  604. }
  605. skip_bits1(gb); // temporal_id_nesting_flag
  606. parse_ptl(s, &sps->ptl, sps->max_sub_layers);
  607. sps_id = get_ue_golomb_long(gb);
  608. if (sps_id >= MAX_SPS_COUNT) {
  609. av_log(s->avctx, AV_LOG_ERROR, "SPS id out of range: %d\n", sps_id);
  610. ret = AVERROR_INVALIDDATA;
  611. goto err;
  612. }
  613. sps->chroma_format_idc = get_ue_golomb_long(gb);
  614. if (!(sps->chroma_format_idc == 1 || sps->chroma_format_idc == 2 || sps->chroma_format_idc == 3)) {
  615. avpriv_report_missing_feature(s->avctx, "chroma_format_idc != {1, 2, 3}\n");
  616. ret = AVERROR_PATCHWELCOME;
  617. goto err;
  618. }
  619. if (sps->chroma_format_idc == 3)
  620. sps->separate_colour_plane_flag = get_bits1(gb);
  621. if (sps->separate_colour_plane_flag)
  622. sps->chroma_format_idc = 0;
  623. sps->width = get_ue_golomb_long(gb);
  624. sps->height = get_ue_golomb_long(gb);
  625. if ((ret = av_image_check_size(sps->width,
  626. sps->height, 0, s->avctx)) < 0)
  627. goto err;
  628. if (get_bits1(gb)) { // pic_conformance_flag
  629. //TODO: * 2 is only valid for 420
  630. sps->pic_conf_win.left_offset = get_ue_golomb_long(gb) * 2;
  631. sps->pic_conf_win.right_offset = get_ue_golomb_long(gb) * 2;
  632. sps->pic_conf_win.top_offset = get_ue_golomb_long(gb) * 2;
  633. sps->pic_conf_win.bottom_offset = get_ue_golomb_long(gb) * 2;
  634. if (s->avctx->flags2 & CODEC_FLAG2_IGNORE_CROP) {
  635. av_log(s->avctx, AV_LOG_DEBUG,
  636. "discarding sps conformance window, "
  637. "original values are l:%u r:%u t:%u b:%u\n",
  638. sps->pic_conf_win.left_offset,
  639. sps->pic_conf_win.right_offset,
  640. sps->pic_conf_win.top_offset,
  641. sps->pic_conf_win.bottom_offset);
  642. sps->pic_conf_win.left_offset =
  643. sps->pic_conf_win.right_offset =
  644. sps->pic_conf_win.top_offset =
  645. sps->pic_conf_win.bottom_offset = 0;
  646. }
  647. sps->output_window = sps->pic_conf_win;
  648. }
  649. sps->bit_depth = get_ue_golomb_long(gb) + 8;
  650. bit_depth_chroma = get_ue_golomb_long(gb) + 8;
  651. if (bit_depth_chroma != sps->bit_depth) {
  652. av_log(s->avctx, AV_LOG_ERROR,
  653. "Luma bit depth (%d) is different from chroma bit depth (%d), "
  654. "this is unsupported.\n",
  655. sps->bit_depth, bit_depth_chroma);
  656. ret = AVERROR_INVALIDDATA;
  657. goto err;
  658. }
  659. switch (sps->bit_depth) {
  660. case 8:
  661. if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P;
  662. if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P;
  663. if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P;
  664. break;
  665. case 9:
  666. if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P9;
  667. if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P9;
  668. if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P9;
  669. break;
  670. case 10:
  671. if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P10;
  672. if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P10;
  673. if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P10;
  674. break;
  675. case 12:
  676. if (sps->chroma_format_idc == 1) sps->pix_fmt = AV_PIX_FMT_YUV420P12;
  677. if (sps->chroma_format_idc == 2) sps->pix_fmt = AV_PIX_FMT_YUV422P12;
  678. if (sps->chroma_format_idc == 3) sps->pix_fmt = AV_PIX_FMT_YUV444P12;
  679. break;
  680. default:
  681. av_log(s->avctx, AV_LOG_ERROR,
  682. "4:2:0, 4:2:2, 4:4:4 supports are currently specified for 8, 10 and 12 bits.\n");
  683. return AVERROR_PATCHWELCOME;
  684. }
  685. desc = av_pix_fmt_desc_get(sps->pix_fmt);
  686. if (!desc) {
  687. ret = AVERROR(EINVAL);
  688. goto err;
  689. }
  690. sps->hshift[0] = sps->vshift[0] = 0;
  691. sps->hshift[2] = sps->hshift[1] = desc->log2_chroma_w;
  692. sps->vshift[2] = sps->vshift[1] = desc->log2_chroma_h;
  693. sps->pixel_shift = sps->bit_depth > 8;
  694. sps->log2_max_poc_lsb = get_ue_golomb_long(gb) + 4;
  695. if (sps->log2_max_poc_lsb > 16) {
  696. av_log(s->avctx, AV_LOG_ERROR, "log2_max_pic_order_cnt_lsb_minus4 out range: %d\n",
  697. sps->log2_max_poc_lsb - 4);
  698. ret = AVERROR_INVALIDDATA;
  699. goto err;
  700. }
  701. sublayer_ordering_info = get_bits1(gb);
  702. start = sublayer_ordering_info ? 0 : sps->max_sub_layers - 1;
  703. for (i = start; i < sps->max_sub_layers; i++) {
  704. sps->temporal_layer[i].max_dec_pic_buffering = get_ue_golomb_long(gb) + 1;
  705. sps->temporal_layer[i].num_reorder_pics = get_ue_golomb_long(gb);
  706. sps->temporal_layer[i].max_latency_increase = get_ue_golomb_long(gb) - 1;
  707. if (sps->temporal_layer[i].max_dec_pic_buffering > MAX_DPB_SIZE) {
  708. av_log(s->avctx, AV_LOG_ERROR, "sps_max_dec_pic_buffering_minus1 out of range: %d\n",
  709. sps->temporal_layer[i].max_dec_pic_buffering - 1);
  710. ret = AVERROR_INVALIDDATA;
  711. goto err;
  712. }
  713. if (sps->temporal_layer[i].num_reorder_pics > sps->temporal_layer[i].max_dec_pic_buffering - 1) {
  714. av_log(s->avctx, AV_LOG_WARNING, "sps_max_num_reorder_pics out of range: %d\n",
  715. sps->temporal_layer[i].num_reorder_pics);
  716. if (s->avctx->err_recognition & AV_EF_EXPLODE ||
  717. sps->temporal_layer[i].num_reorder_pics > MAX_DPB_SIZE - 1) {
  718. ret = AVERROR_INVALIDDATA;
  719. goto err;
  720. }
  721. sps->temporal_layer[i].max_dec_pic_buffering = sps->temporal_layer[i].num_reorder_pics + 1;
  722. }
  723. }
  724. if (!sublayer_ordering_info) {
  725. for (i = 0; i < start; i++) {
  726. sps->temporal_layer[i].max_dec_pic_buffering = sps->temporal_layer[start].max_dec_pic_buffering;
  727. sps->temporal_layer[i].num_reorder_pics = sps->temporal_layer[start].num_reorder_pics;
  728. sps->temporal_layer[i].max_latency_increase = sps->temporal_layer[start].max_latency_increase;
  729. }
  730. }
  731. sps->log2_min_cb_size = get_ue_golomb_long(gb) + 3;
  732. sps->log2_diff_max_min_coding_block_size = get_ue_golomb_long(gb);
  733. sps->log2_min_tb_size = get_ue_golomb_long(gb) + 2;
  734. log2_diff_max_min_transform_block_size = get_ue_golomb_long(gb);
  735. sps->log2_max_trafo_size = log2_diff_max_min_transform_block_size +
  736. sps->log2_min_tb_size;
  737. if (sps->log2_min_tb_size >= sps->log2_min_cb_size) {
  738. av_log(s->avctx, AV_LOG_ERROR, "Invalid value for log2_min_tb_size");
  739. ret = AVERROR_INVALIDDATA;
  740. goto err;
  741. }
  742. sps->max_transform_hierarchy_depth_inter = get_ue_golomb_long(gb);
  743. sps->max_transform_hierarchy_depth_intra = get_ue_golomb_long(gb);
  744. sps->scaling_list_enable_flag = get_bits1(gb);
  745. if (sps->scaling_list_enable_flag) {
  746. set_default_scaling_list_data(&sps->scaling_list);
  747. if (get_bits1(gb)) {
  748. ret = scaling_list_data(s, &sps->scaling_list, sps);
  749. if (ret < 0)
  750. goto err;
  751. }
  752. }
  753. sps->amp_enabled_flag = get_bits1(gb);
  754. sps->sao_enabled = get_bits1(gb);
  755. sps->pcm_enabled_flag = get_bits1(gb);
  756. if (sps->pcm_enabled_flag) {
  757. sps->pcm.bit_depth = get_bits(gb, 4) + 1;
  758. sps->pcm.bit_depth_chroma = get_bits(gb, 4) + 1;
  759. sps->pcm.log2_min_pcm_cb_size = get_ue_golomb_long(gb) + 3;
  760. sps->pcm.log2_max_pcm_cb_size = sps->pcm.log2_min_pcm_cb_size +
  761. get_ue_golomb_long(gb);
  762. if (sps->pcm.bit_depth > sps->bit_depth) {
  763. av_log(s->avctx, AV_LOG_ERROR,
  764. "PCM bit depth (%d) is greater than normal bit depth (%d)\n",
  765. sps->pcm.bit_depth, sps->bit_depth);
  766. ret = AVERROR_INVALIDDATA;
  767. goto err;
  768. }
  769. sps->pcm.loop_filter_disable_flag = get_bits1(gb);
  770. }
  771. sps->nb_st_rps = get_ue_golomb_long(gb);
  772. if (sps->nb_st_rps > MAX_SHORT_TERM_RPS_COUNT) {
  773. av_log(s->avctx, AV_LOG_ERROR, "Too many short term RPS: %d.\n",
  774. sps->nb_st_rps);
  775. ret = AVERROR_INVALIDDATA;
  776. goto err;
  777. }
  778. for (i = 0; i < sps->nb_st_rps; i++) {
  779. if ((ret = ff_hevc_decode_short_term_rps(s, &sps->st_rps[i],
  780. sps, 0)) < 0)
  781. goto err;
  782. }
  783. sps->long_term_ref_pics_present_flag = get_bits1(gb);
  784. if (sps->long_term_ref_pics_present_flag) {
  785. sps->num_long_term_ref_pics_sps = get_ue_golomb_long(gb);
  786. for (i = 0; i < sps->num_long_term_ref_pics_sps; i++) {
  787. sps->lt_ref_pic_poc_lsb_sps[i] = get_bits(gb, sps->log2_max_poc_lsb);
  788. sps->used_by_curr_pic_lt_sps_flag[i] = get_bits1(gb);
  789. }
  790. }
  791. sps->sps_temporal_mvp_enabled_flag = get_bits1(gb);
  792. sps->sps_strong_intra_smoothing_enable_flag = get_bits1(gb);
  793. sps->vui.sar = (AVRational){0, 1};
  794. vui_present = get_bits1(gb);
  795. if (vui_present)
  796. decode_vui(s, sps);
  797. if (get_bits1(gb)) { // sps_extension_flag
  798. int sps_extension_flag[1];
  799. for (i = 0; i < 1; i++)
  800. sps_extension_flag[i] = get_bits1(gb);
  801. skip_bits(gb, 7); //sps_extension_7bits = get_bits(gb, 7);
  802. if (sps_extension_flag[0]) {
  803. int extended_precision_processing_flag;
  804. int high_precision_offsets_enabled_flag;
  805. int cabac_bypass_alignment_enabled_flag;
  806. sps->transform_skip_rotation_enabled_flag = get_bits1(gb);
  807. sps->transform_skip_context_enabled_flag = get_bits1(gb);
  808. sps->implicit_rdpcm_enabled_flag = get_bits1(gb);
  809. sps->explicit_rdpcm_enabled_flag = get_bits1(gb);
  810. extended_precision_processing_flag = get_bits1(gb);
  811. if (extended_precision_processing_flag)
  812. av_log(s->avctx, AV_LOG_WARNING,
  813. "extended_precision_processing_flag not yet implemented\n");
  814. sps->intra_smoothing_disabled_flag = get_bits1(gb);
  815. high_precision_offsets_enabled_flag = get_bits1(gb);
  816. if (high_precision_offsets_enabled_flag)
  817. av_log(s->avctx, AV_LOG_WARNING,
  818. "high_precision_offsets_enabled_flag not yet implemented\n");
  819. sps->persistent_rice_adaptation_enabled_flag = get_bits1(gb);
  820. cabac_bypass_alignment_enabled_flag = get_bits1(gb);
  821. if (cabac_bypass_alignment_enabled_flag)
  822. av_log(s->avctx, AV_LOG_WARNING,
  823. "cabac_bypass_alignment_enabled_flag not yet implemented\n");
  824. }
  825. }
  826. if (s->apply_defdispwin) {
  827. sps->output_window.left_offset += sps->vui.def_disp_win.left_offset;
  828. sps->output_window.right_offset += sps->vui.def_disp_win.right_offset;
  829. sps->output_window.top_offset += sps->vui.def_disp_win.top_offset;
  830. sps->output_window.bottom_offset += sps->vui.def_disp_win.bottom_offset;
  831. }
  832. if (sps->output_window.left_offset & (0x1F >> (sps->pixel_shift)) &&
  833. !(s->avctx->flags & CODEC_FLAG_UNALIGNED)) {
  834. sps->output_window.left_offset &= ~(0x1F >> (sps->pixel_shift));
  835. av_log(s->avctx, AV_LOG_WARNING, "Reducing left output window to %d "
  836. "chroma samples to preserve alignment.\n",
  837. sps->output_window.left_offset);
  838. }
  839. sps->output_width = sps->width -
  840. (sps->output_window.left_offset + sps->output_window.right_offset);
  841. sps->output_height = sps->height -
  842. (sps->output_window.top_offset + sps->output_window.bottom_offset);
  843. if (sps->output_width <= 0 || sps->output_height <= 0) {
  844. av_log(s->avctx, AV_LOG_WARNING, "Invalid visible frame dimensions: %dx%d.\n",
  845. sps->output_width, sps->output_height);
  846. if (s->avctx->err_recognition & AV_EF_EXPLODE) {
  847. ret = AVERROR_INVALIDDATA;
  848. goto err;
  849. }
  850. av_log(s->avctx, AV_LOG_WARNING,
  851. "Displaying the whole video surface.\n");
  852. sps->pic_conf_win.left_offset =
  853. sps->pic_conf_win.right_offset =
  854. sps->pic_conf_win.top_offset =
  855. sps->pic_conf_win.bottom_offset = 0;
  856. sps->output_width = sps->width;
  857. sps->output_height = sps->height;
  858. }
  859. // Inferred parameters
  860. sps->log2_ctb_size = sps->log2_min_cb_size +
  861. sps->log2_diff_max_min_coding_block_size;
  862. sps->log2_min_pu_size = sps->log2_min_cb_size - 1;
  863. sps->ctb_width = (sps->width + (1 << sps->log2_ctb_size) - 1) >> sps->log2_ctb_size;
  864. sps->ctb_height = (sps->height + (1 << sps->log2_ctb_size) - 1) >> sps->log2_ctb_size;
  865. sps->ctb_size = sps->ctb_width * sps->ctb_height;
  866. sps->min_cb_width = sps->width >> sps->log2_min_cb_size;
  867. sps->min_cb_height = sps->height >> sps->log2_min_cb_size;
  868. sps->min_tb_width = sps->width >> sps->log2_min_tb_size;
  869. sps->min_tb_height = sps->height >> sps->log2_min_tb_size;
  870. sps->min_pu_width = sps->width >> sps->log2_min_pu_size;
  871. sps->min_pu_height = sps->height >> sps->log2_min_pu_size;
  872. sps->tb_mask = (1 << (sps->log2_ctb_size - sps->log2_min_tb_size)) - 1;
  873. sps->qp_bd_offset = 6 * (sps->bit_depth - 8);
  874. if (sps->width & ((1 << sps->log2_min_cb_size) - 1) ||
  875. sps->height & ((1 << sps->log2_min_cb_size) - 1)) {
  876. av_log(s->avctx, AV_LOG_ERROR, "Invalid coded frame dimensions.\n");
  877. goto err;
  878. }
  879. if (sps->log2_ctb_size > MAX_LOG2_CTB_SIZE) {
  880. av_log(s->avctx, AV_LOG_ERROR, "CTB size out of range: 2^%d\n", sps->log2_ctb_size);
  881. goto err;
  882. }
  883. if (sps->max_transform_hierarchy_depth_inter > sps->log2_ctb_size - sps->log2_min_tb_size) {
  884. av_log(s->avctx, AV_LOG_ERROR, "max_transform_hierarchy_depth_inter out of range: %d\n",
  885. sps->max_transform_hierarchy_depth_inter);
  886. goto err;
  887. }
  888. if (sps->max_transform_hierarchy_depth_intra > sps->log2_ctb_size - sps->log2_min_tb_size) {
  889. av_log(s->avctx, AV_LOG_ERROR, "max_transform_hierarchy_depth_intra out of range: %d\n",
  890. sps->max_transform_hierarchy_depth_intra);
  891. goto err;
  892. }
  893. if (sps->log2_max_trafo_size > FFMIN(sps->log2_ctb_size, 5)) {
  894. av_log(s->avctx, AV_LOG_ERROR,
  895. "max transform block size out of range: %d\n",
  896. sps->log2_max_trafo_size);
  897. goto err;
  898. }
  899. if (s->avctx->debug & FF_DEBUG_BITSTREAM) {
  900. av_log(s->avctx, AV_LOG_DEBUG,
  901. "Parsed SPS: id %d; coded wxh: %dx%d; "
  902. "cropped wxh: %dx%d; pix_fmt: %s.\n",
  903. sps_id, sps->width, sps->height,
  904. sps->output_width, sps->output_height,
  905. av_get_pix_fmt_name(sps->pix_fmt));
  906. }
  907. /* check if this is a repeat of an already parsed SPS, then keep the
  908. * original one.
  909. * otherwise drop all PPSes that depend on it */
  910. if (s->sps_list[sps_id] &&
  911. !memcmp(s->sps_list[sps_id]->data, sps_buf->data, sps_buf->size)) {
  912. av_buffer_unref(&sps_buf);
  913. } else {
  914. for (i = 0; i < FF_ARRAY_ELEMS(s->pps_list); i++) {
  915. if (s->pps_list[i] && ((HEVCPPS*)s->pps_list[i]->data)->sps_id == sps_id)
  916. av_buffer_unref(&s->pps_list[i]);
  917. }
  918. if (s->sps_list[sps_id] && s->sps == (HEVCSPS*)s->sps_list[sps_id]->data) {
  919. av_buffer_unref(&s->current_sps);
  920. s->current_sps = av_buffer_ref(s->sps_list[sps_id]);
  921. if (!s->current_sps)
  922. s->sps = NULL;
  923. }
  924. av_buffer_unref(&s->sps_list[sps_id]);
  925. s->sps_list[sps_id] = sps_buf;
  926. }
  927. return 0;
  928. err:
  929. av_buffer_unref(&sps_buf);
  930. return ret;
  931. }
  932. static void hevc_pps_free(void *opaque, uint8_t *data)
  933. {
  934. HEVCPPS *pps = (HEVCPPS*)data;
  935. av_freep(&pps->column_width);
  936. av_freep(&pps->row_height);
  937. av_freep(&pps->col_bd);
  938. av_freep(&pps->row_bd);
  939. av_freep(&pps->col_idxX);
  940. av_freep(&pps->ctb_addr_rs_to_ts);
  941. av_freep(&pps->ctb_addr_ts_to_rs);
  942. av_freep(&pps->tile_pos_rs);
  943. av_freep(&pps->tile_id);
  944. av_freep(&pps->min_tb_addr_zs_tab);
  945. av_freep(&pps);
  946. }
  947. static int pps_range_extensions(HEVCContext *s, HEVCPPS *pps, HEVCSPS *sps) {
  948. GetBitContext *gb = &s->HEVClc->gb;
  949. int i;
  950. if (pps->transform_skip_enabled_flag) {
  951. pps->log2_max_transform_skip_block_size = get_ue_golomb_long(gb) + 2;
  952. }
  953. pps->cross_component_prediction_enabled_flag = get_bits1(gb);
  954. pps->chroma_qp_offset_list_enabled_flag = get_bits1(gb);
  955. if (pps->chroma_qp_offset_list_enabled_flag) {
  956. pps->diff_cu_chroma_qp_offset_depth = get_ue_golomb_long(gb);
  957. pps->chroma_qp_offset_list_len_minus1 = get_ue_golomb_long(gb);
  958. if (pps->chroma_qp_offset_list_len_minus1 && pps->chroma_qp_offset_list_len_minus1 >= 5) {
  959. av_log(s->avctx, AV_LOG_ERROR,
  960. "chroma_qp_offset_list_len_minus1 shall be in the range [0, 5].\n");
  961. return AVERROR_INVALIDDATA;
  962. }
  963. for (i = 0; i <= pps->chroma_qp_offset_list_len_minus1; i++) {
  964. pps->cb_qp_offset_list[i] = get_se_golomb_long(gb);
  965. if (pps->cb_qp_offset_list[i]) {
  966. av_log(s->avctx, AV_LOG_WARNING,
  967. "cb_qp_offset_list not tested yet.\n");
  968. }
  969. pps->cr_qp_offset_list[i] = get_se_golomb_long(gb);
  970. if (pps->cr_qp_offset_list[i]) {
  971. av_log(s->avctx, AV_LOG_WARNING,
  972. "cb_qp_offset_list not tested yet.\n");
  973. }
  974. }
  975. }
  976. pps->log2_sao_offset_scale_luma = get_ue_golomb_long(gb);
  977. pps->log2_sao_offset_scale_chroma = get_ue_golomb_long(gb);
  978. return(0);
  979. }
  980. int ff_hevc_decode_nal_pps(HEVCContext *s)
  981. {
  982. GetBitContext *gb = &s->HEVClc->gb;
  983. HEVCSPS *sps = NULL;
  984. int pic_area_in_ctbs;
  985. int log2_diff_ctb_min_tb_size;
  986. int i, j, x, y, ctb_addr_rs, tile_id;
  987. int ret = 0;
  988. unsigned int pps_id = 0;
  989. AVBufferRef *pps_buf;
  990. HEVCPPS *pps = av_mallocz(sizeof(*pps));
  991. if (!pps)
  992. return AVERROR(ENOMEM);
  993. pps_buf = av_buffer_create((uint8_t *)pps, sizeof(*pps),
  994. hevc_pps_free, NULL, 0);
  995. if (!pps_buf) {
  996. av_freep(&pps);
  997. return AVERROR(ENOMEM);
  998. }
  999. av_log(s->avctx, AV_LOG_DEBUG, "Decoding PPS\n");
  1000. // Default values
  1001. pps->loop_filter_across_tiles_enabled_flag = 1;
  1002. pps->num_tile_columns = 1;
  1003. pps->num_tile_rows = 1;
  1004. pps->uniform_spacing_flag = 1;
  1005. pps->disable_dbf = 0;
  1006. pps->beta_offset = 0;
  1007. pps->tc_offset = 0;
  1008. pps->log2_max_transform_skip_block_size = 2;
  1009. // Coded parameters
  1010. pps_id = get_ue_golomb_long(gb);
  1011. if (pps_id >= MAX_PPS_COUNT) {
  1012. av_log(s->avctx, AV_LOG_ERROR, "PPS id out of range: %d\n", pps_id);
  1013. ret = AVERROR_INVALIDDATA;
  1014. goto err;
  1015. }
  1016. pps->sps_id = get_ue_golomb_long(gb);
  1017. if (pps->sps_id >= MAX_SPS_COUNT) {
  1018. av_log(s->avctx, AV_LOG_ERROR, "SPS id out of range: %d\n", pps->sps_id);
  1019. ret = AVERROR_INVALIDDATA;
  1020. goto err;
  1021. }
  1022. if (!s->sps_list[pps->sps_id]) {
  1023. av_log(s->avctx, AV_LOG_ERROR, "SPS %u does not exist.\n", pps->sps_id);
  1024. ret = AVERROR_INVALIDDATA;
  1025. goto err;
  1026. }
  1027. sps = (HEVCSPS *)s->sps_list[pps->sps_id]->data;
  1028. pps->dependent_slice_segments_enabled_flag = get_bits1(gb);
  1029. pps->output_flag_present_flag = get_bits1(gb);
  1030. pps->num_extra_slice_header_bits = get_bits(gb, 3);
  1031. pps->sign_data_hiding_flag = get_bits1(gb);
  1032. pps->cabac_init_present_flag = get_bits1(gb);
  1033. pps->num_ref_idx_l0_default_active = get_ue_golomb_long(gb) + 1;
  1034. pps->num_ref_idx_l1_default_active = get_ue_golomb_long(gb) + 1;
  1035. pps->pic_init_qp_minus26 = get_se_golomb(gb);
  1036. pps->constrained_intra_pred_flag = get_bits1(gb);
  1037. pps->transform_skip_enabled_flag = get_bits1(gb);
  1038. pps->cu_qp_delta_enabled_flag = get_bits1(gb);
  1039. pps->diff_cu_qp_delta_depth = 0;
  1040. if (pps->cu_qp_delta_enabled_flag)
  1041. pps->diff_cu_qp_delta_depth = get_ue_golomb_long(gb);
  1042. pps->cb_qp_offset = get_se_golomb(gb);
  1043. if (pps->cb_qp_offset < -12 || pps->cb_qp_offset > 12) {
  1044. av_log(s->avctx, AV_LOG_ERROR, "pps_cb_qp_offset out of range: %d\n",
  1045. pps->cb_qp_offset);
  1046. ret = AVERROR_INVALIDDATA;
  1047. goto err;
  1048. }
  1049. pps->cr_qp_offset = get_se_golomb(gb);
  1050. if (pps->cr_qp_offset < -12 || pps->cr_qp_offset > 12) {
  1051. av_log(s->avctx, AV_LOG_ERROR, "pps_cr_qp_offset out of range: %d\n",
  1052. pps->cr_qp_offset);
  1053. ret = AVERROR_INVALIDDATA;
  1054. goto err;
  1055. }
  1056. pps->pic_slice_level_chroma_qp_offsets_present_flag = get_bits1(gb);
  1057. pps->weighted_pred_flag = get_bits1(gb);
  1058. pps->weighted_bipred_flag = get_bits1(gb);
  1059. pps->transquant_bypass_enable_flag = get_bits1(gb);
  1060. pps->tiles_enabled_flag = get_bits1(gb);
  1061. pps->entropy_coding_sync_enabled_flag = get_bits1(gb);
  1062. if (pps->tiles_enabled_flag) {
  1063. pps->num_tile_columns = get_ue_golomb_long(gb) + 1;
  1064. pps->num_tile_rows = get_ue_golomb_long(gb) + 1;
  1065. if (pps->num_tile_columns == 0 ||
  1066. pps->num_tile_columns >= sps->width) {
  1067. av_log(s->avctx, AV_LOG_ERROR, "num_tile_columns_minus1 out of range: %d\n",
  1068. pps->num_tile_columns - 1);
  1069. ret = AVERROR_INVALIDDATA;
  1070. goto err;
  1071. }
  1072. if (pps->num_tile_rows == 0 ||
  1073. pps->num_tile_rows >= sps->height) {
  1074. av_log(s->avctx, AV_LOG_ERROR, "num_tile_rows_minus1 out of range: %d\n",
  1075. pps->num_tile_rows - 1);
  1076. ret = AVERROR_INVALIDDATA;
  1077. goto err;
  1078. }
  1079. pps->column_width = av_malloc_array(pps->num_tile_columns, sizeof(*pps->column_width));
  1080. pps->row_height = av_malloc_array(pps->num_tile_rows, sizeof(*pps->row_height));
  1081. if (!pps->column_width || !pps->row_height) {
  1082. ret = AVERROR(ENOMEM);
  1083. goto err;
  1084. }
  1085. pps->uniform_spacing_flag = get_bits1(gb);
  1086. if (!pps->uniform_spacing_flag) {
  1087. uint64_t sum = 0;
  1088. for (i = 0; i < pps->num_tile_columns - 1; i++) {
  1089. pps->column_width[i] = get_ue_golomb_long(gb) + 1;
  1090. sum += pps->column_width[i];
  1091. }
  1092. if (sum >= sps->ctb_width) {
  1093. av_log(s->avctx, AV_LOG_ERROR, "Invalid tile widths.\n");
  1094. ret = AVERROR_INVALIDDATA;
  1095. goto err;
  1096. }
  1097. pps->column_width[pps->num_tile_columns - 1] = sps->ctb_width - sum;
  1098. sum = 0;
  1099. for (i = 0; i < pps->num_tile_rows - 1; i++) {
  1100. pps->row_height[i] = get_ue_golomb_long(gb) + 1;
  1101. sum += pps->row_height[i];
  1102. }
  1103. if (sum >= sps->ctb_height) {
  1104. av_log(s->avctx, AV_LOG_ERROR, "Invalid tile heights.\n");
  1105. ret = AVERROR_INVALIDDATA;
  1106. goto err;
  1107. }
  1108. pps->row_height[pps->num_tile_rows - 1] = sps->ctb_height - sum;
  1109. }
  1110. pps->loop_filter_across_tiles_enabled_flag = get_bits1(gb);
  1111. }
  1112. pps->seq_loop_filter_across_slices_enabled_flag = get_bits1(gb);
  1113. pps->deblocking_filter_control_present_flag = get_bits1(gb);
  1114. if (pps->deblocking_filter_control_present_flag) {
  1115. pps->deblocking_filter_override_enabled_flag = get_bits1(gb);
  1116. pps->disable_dbf = get_bits1(gb);
  1117. if (!pps->disable_dbf) {
  1118. pps->beta_offset = get_se_golomb(gb) * 2;
  1119. pps->tc_offset = get_se_golomb(gb) * 2;
  1120. if (pps->beta_offset/2 < -6 || pps->beta_offset/2 > 6) {
  1121. av_log(s->avctx, AV_LOG_ERROR, "pps_beta_offset_div2 out of range: %d\n",
  1122. pps->beta_offset/2);
  1123. ret = AVERROR_INVALIDDATA;
  1124. goto err;
  1125. }
  1126. if (pps->tc_offset/2 < -6 || pps->tc_offset/2 > 6) {
  1127. av_log(s->avctx, AV_LOG_ERROR, "pps_tc_offset_div2 out of range: %d\n",
  1128. pps->tc_offset/2);
  1129. ret = AVERROR_INVALIDDATA;
  1130. goto err;
  1131. }
  1132. }
  1133. }
  1134. pps->scaling_list_data_present_flag = get_bits1(gb);
  1135. if (pps->scaling_list_data_present_flag) {
  1136. set_default_scaling_list_data(&pps->scaling_list);
  1137. ret = scaling_list_data(s, &pps->scaling_list, sps);
  1138. if (ret < 0)
  1139. goto err;
  1140. }
  1141. pps->lists_modification_present_flag = get_bits1(gb);
  1142. pps->log2_parallel_merge_level = get_ue_golomb_long(gb) + 2;
  1143. if (pps->log2_parallel_merge_level > sps->log2_ctb_size) {
  1144. av_log(s->avctx, AV_LOG_ERROR, "log2_parallel_merge_level_minus2 out of range: %d\n",
  1145. pps->log2_parallel_merge_level - 2);
  1146. ret = AVERROR_INVALIDDATA;
  1147. goto err;
  1148. }
  1149. pps->slice_header_extension_present_flag = get_bits1(gb);
  1150. if (get_bits1(gb)) { // pps_extension_present_flag
  1151. int pps_range_extensions_flag = get_bits1(gb);
  1152. /* int pps_extension_7bits = */ get_bits(gb, 7);
  1153. if (sps->ptl.general_ptl.profile_idc == FF_PROFILE_HEVC_REXT && pps_range_extensions_flag) {
  1154. pps_range_extensions(s, pps, sps);
  1155. }
  1156. }
  1157. // Inferred parameters
  1158. pps->col_bd = av_malloc_array(pps->num_tile_columns + 1, sizeof(*pps->col_bd));
  1159. pps->row_bd = av_malloc_array(pps->num_tile_rows + 1, sizeof(*pps->row_bd));
  1160. pps->col_idxX = av_malloc_array(sps->ctb_width, sizeof(*pps->col_idxX));
  1161. if (!pps->col_bd || !pps->row_bd || !pps->col_idxX) {
  1162. ret = AVERROR(ENOMEM);
  1163. goto err;
  1164. }
  1165. if (pps->uniform_spacing_flag) {
  1166. if (!pps->column_width) {
  1167. pps->column_width = av_malloc_array(pps->num_tile_columns, sizeof(*pps->column_width));
  1168. pps->row_height = av_malloc_array(pps->num_tile_rows, sizeof(*pps->row_height));
  1169. }
  1170. if (!pps->column_width || !pps->row_height) {
  1171. ret = AVERROR(ENOMEM);
  1172. goto err;
  1173. }
  1174. for (i = 0; i < pps->num_tile_columns; i++) {
  1175. pps->column_width[i] = ((i + 1) * sps->ctb_width) / pps->num_tile_columns -
  1176. (i * sps->ctb_width) / pps->num_tile_columns;
  1177. }
  1178. for (i = 0; i < pps->num_tile_rows; i++) {
  1179. pps->row_height[i] = ((i + 1) * sps->ctb_height) / pps->num_tile_rows -
  1180. (i * sps->ctb_height) / pps->num_tile_rows;
  1181. }
  1182. }
  1183. pps->col_bd[0] = 0;
  1184. for (i = 0; i < pps->num_tile_columns; i++)
  1185. pps->col_bd[i + 1] = pps->col_bd[i] + pps->column_width[i];
  1186. pps->row_bd[0] = 0;
  1187. for (i = 0; i < pps->num_tile_rows; i++)
  1188. pps->row_bd[i + 1] = pps->row_bd[i] + pps->row_height[i];
  1189. for (i = 0, j = 0; i < sps->ctb_width; i++) {
  1190. if (i > pps->col_bd[j])
  1191. j++;
  1192. pps->col_idxX[i] = j;
  1193. }
  1194. /**
  1195. * 6.5
  1196. */
  1197. pic_area_in_ctbs = sps->ctb_width * sps->ctb_height;
  1198. pps->ctb_addr_rs_to_ts = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->ctb_addr_rs_to_ts));
  1199. pps->ctb_addr_ts_to_rs = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->ctb_addr_ts_to_rs));
  1200. pps->tile_id = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->tile_id));
  1201. pps->min_tb_addr_zs_tab = av_malloc_array((sps->tb_mask+2) * (sps->tb_mask+2), sizeof(*pps->min_tb_addr_zs_tab));
  1202. if (!pps->ctb_addr_rs_to_ts || !pps->ctb_addr_ts_to_rs ||
  1203. !pps->tile_id || !pps->min_tb_addr_zs_tab) {
  1204. ret = AVERROR(ENOMEM);
  1205. goto err;
  1206. }
  1207. for (ctb_addr_rs = 0; ctb_addr_rs < pic_area_in_ctbs; ctb_addr_rs++) {
  1208. int tb_x = ctb_addr_rs % sps->ctb_width;
  1209. int tb_y = ctb_addr_rs / sps->ctb_width;
  1210. int tile_x = 0;
  1211. int tile_y = 0;
  1212. int val = 0;
  1213. for (i = 0; i < pps->num_tile_columns; i++) {
  1214. if (tb_x < pps->col_bd[i + 1]) {
  1215. tile_x = i;
  1216. break;
  1217. }
  1218. }
  1219. for (i = 0; i < pps->num_tile_rows; i++) {
  1220. if (tb_y < pps->row_bd[i + 1]) {
  1221. tile_y = i;
  1222. break;
  1223. }
  1224. }
  1225. for (i = 0; i < tile_x; i++)
  1226. val += pps->row_height[tile_y] * pps->column_width[i];
  1227. for (i = 0; i < tile_y; i++)
  1228. val += sps->ctb_width * pps->row_height[i];
  1229. val += (tb_y - pps->row_bd[tile_y]) * pps->column_width[tile_x] +
  1230. tb_x - pps->col_bd[tile_x];
  1231. pps->ctb_addr_rs_to_ts[ctb_addr_rs] = val;
  1232. pps->ctb_addr_ts_to_rs[val] = ctb_addr_rs;
  1233. }
  1234. for (j = 0, tile_id = 0; j < pps->num_tile_rows; j++)
  1235. for (i = 0; i < pps->num_tile_columns; i++, tile_id++)
  1236. for (y = pps->row_bd[j]; y < pps->row_bd[j + 1]; y++)
  1237. for (x = pps->col_bd[i]; x < pps->col_bd[i + 1]; x++)
  1238. pps->tile_id[pps->ctb_addr_rs_to_ts[y * sps->ctb_width + x]] = tile_id;
  1239. pps->tile_pos_rs = av_malloc_array(tile_id, sizeof(*pps->tile_pos_rs));
  1240. if (!pps->tile_pos_rs) {
  1241. ret = AVERROR(ENOMEM);
  1242. goto err;
  1243. }
  1244. for (j = 0; j < pps->num_tile_rows; j++)
  1245. for (i = 0; i < pps->num_tile_columns; i++)
  1246. pps->tile_pos_rs[j * pps->num_tile_columns + i] = pps->row_bd[j] * sps->ctb_width + pps->col_bd[i];
  1247. log2_diff_ctb_min_tb_size = sps->log2_ctb_size - sps->log2_min_tb_size;
  1248. pps->min_tb_addr_zs = &pps->min_tb_addr_zs_tab[1*(sps->tb_mask+2)+1];
  1249. for (y = 0; y < sps->tb_mask+2; y++) {
  1250. pps->min_tb_addr_zs_tab[y*(sps->tb_mask+2)] = -1;
  1251. pps->min_tb_addr_zs_tab[y] = -1;
  1252. }
  1253. for (y = 0; y < sps->tb_mask+1; y++) {
  1254. for (x = 0; x < sps->tb_mask+1; x++) {
  1255. int tb_x = x >> log2_diff_ctb_min_tb_size;
  1256. int tb_y = y >> log2_diff_ctb_min_tb_size;
  1257. int ctb_addr_rs = sps->ctb_width * tb_y + tb_x;
  1258. int val = pps->ctb_addr_rs_to_ts[ctb_addr_rs] <<
  1259. (log2_diff_ctb_min_tb_size * 2);
  1260. for (i = 0; i < log2_diff_ctb_min_tb_size; i++) {
  1261. int m = 1 << i;
  1262. val += (m & x ? m * m : 0) + (m & y ? 2 * m * m : 0);
  1263. }
  1264. pps->min_tb_addr_zs[y * (sps->tb_mask+2) + x] = val;
  1265. }
  1266. }
  1267. av_buffer_unref(&s->pps_list[pps_id]);
  1268. s->pps_list[pps_id] = pps_buf;
  1269. return 0;
  1270. err:
  1271. av_buffer_unref(&pps_buf);
  1272. return ret;
  1273. }