You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1380 lines
51KB

  1. /*
  2. * HEVC Parameter Set decoding
  3. *
  4. * Copyright (C) 2012 - 2013 Guillaume Martres
  5. * Copyright (C) 2012 - 2013 Mickael Raulet
  6. * Copyright (C) 2012 - 2013 Gildas Cocherel
  7. * Copyright (C) 2013 Vittorio Giovara
  8. *
  9. * This file is part of Libav.
  10. *
  11. * Libav is free software; you can redistribute it and/or
  12. * modify it under the terms of the GNU Lesser General Public
  13. * License as published by the Free Software Foundation; either
  14. * version 2.1 of the License, or (at your option) any later version.
  15. *
  16. * Libav is distributed in the hope that it will be useful,
  17. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  19. * Lesser General Public License for more details.
  20. *
  21. * You should have received a copy of the GNU Lesser General Public
  22. * License along with Libav; if not, write to the Free Software
  23. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  24. */
  25. #include "libavutil/imgutils.h"
  26. #include "golomb.h"
  27. #include "hevc.h"
  28. static const uint8_t default_scaling_list_intra[] = {
  29. 16, 16, 16, 16, 17, 18, 21, 24,
  30. 16, 16, 16, 16, 17, 19, 22, 25,
  31. 16, 16, 17, 18, 20, 22, 25, 29,
  32. 16, 16, 18, 21, 24, 27, 31, 36,
  33. 17, 17, 20, 24, 30, 35, 41, 47,
  34. 18, 19, 22, 27, 35, 44, 54, 65,
  35. 21, 22, 25, 31, 41, 54, 70, 88,
  36. 24, 25, 29, 36, 47, 65, 88, 115
  37. };
  38. static const uint8_t default_scaling_list_inter[] = {
  39. 16, 16, 16, 16, 17, 18, 20, 24,
  40. 16, 16, 16, 17, 18, 20, 24, 25,
  41. 16, 16, 17, 18, 20, 24, 25, 28,
  42. 16, 17, 18, 20, 24, 25, 28, 33,
  43. 17, 18, 20, 24, 25, 28, 33, 41,
  44. 18, 20, 24, 25, 28, 33, 41, 54,
  45. 20, 24, 25, 28, 33, 41, 54, 71,
  46. 24, 25, 28, 33, 41, 54, 71, 91
  47. };
  48. static const AVRational vui_sar[] = {
  49. { 0, 1 },
  50. { 1, 1 },
  51. { 12, 11 },
  52. { 10, 11 },
  53. { 16, 11 },
  54. { 40, 33 },
  55. { 24, 11 },
  56. { 20, 11 },
  57. { 32, 11 },
  58. { 80, 33 },
  59. { 18, 11 },
  60. { 15, 11 },
  61. { 64, 33 },
  62. { 160, 99 },
  63. { 4, 3 },
  64. { 3, 2 },
  65. { 2, 1 },
  66. };
  67. static void remove_pps(HEVCParamSets *s, int id)
  68. {
  69. if (s->pps_list[id] && s->pps == (const HEVCPPS*)s->pps_list[id]->data)
  70. s->pps = NULL;
  71. av_buffer_unref(&s->pps_list[id]);
  72. }
  73. static void remove_sps(HEVCParamSets *s, int id)
  74. {
  75. int i;
  76. if (s->sps_list[id]) {
  77. if (s->sps == (const HEVCSPS*)s->sps_list[id]->data)
  78. s->sps = NULL;
  79. /* drop all PPS that depend on this SPS */
  80. for (i = 0; i < FF_ARRAY_ELEMS(s->pps_list); i++)
  81. if (s->pps_list[i] && ((HEVCPPS*)s->pps_list[i]->data)->sps_id == id)
  82. remove_pps(s, i);
  83. }
  84. av_buffer_unref(&s->sps_list[id]);
  85. }
  86. static void remove_vps(HEVCParamSets *s, int id)
  87. {
  88. int i;
  89. if (s->vps_list[id]) {
  90. if (s->vps == (const HEVCVPS*)s->vps_list[id]->data)
  91. s->vps = NULL;
  92. for (i = 0; i < FF_ARRAY_ELEMS(s->sps_list); i++)
  93. if (s->sps_list[i] && ((HEVCSPS*)s->sps_list[i]->data)->vps_id == id)
  94. remove_sps(s, i);
  95. }
  96. av_buffer_unref(&s->vps_list[id]);
  97. }
  98. int ff_hevc_decode_short_term_rps(GetBitContext *gb, AVCodecContext *avctx,
  99. ShortTermRPS *rps, const HEVCSPS *sps, int is_slice_header)
  100. {
  101. uint8_t rps_predict = 0;
  102. int delta_poc;
  103. int k0 = 0;
  104. int k1 = 0;
  105. int k = 0;
  106. int i;
  107. if (rps != sps->st_rps && sps->nb_st_rps)
  108. rps_predict = get_bits1(gb);
  109. if (rps_predict) {
  110. const ShortTermRPS *rps_ridx;
  111. int delta_rps, abs_delta_rps;
  112. uint8_t use_delta_flag = 0;
  113. uint8_t delta_rps_sign;
  114. if (is_slice_header) {
  115. unsigned int delta_idx = get_ue_golomb_long(gb) + 1;
  116. if (delta_idx > sps->nb_st_rps) {
  117. av_log(avctx, AV_LOG_ERROR,
  118. "Invalid value of delta_idx in slice header RPS: %d > %d.\n",
  119. delta_idx, sps->nb_st_rps);
  120. return AVERROR_INVALIDDATA;
  121. }
  122. rps_ridx = &sps->st_rps[sps->nb_st_rps - delta_idx];
  123. rps->rps_idx_num_delta_pocs = rps_ridx->num_delta_pocs;
  124. } else
  125. rps_ridx = &sps->st_rps[rps - sps->st_rps - 1];
  126. delta_rps_sign = get_bits1(gb);
  127. abs_delta_rps = get_ue_golomb_long(gb) + 1;
  128. delta_rps = (1 - (delta_rps_sign << 1)) * abs_delta_rps;
  129. for (i = 0; i <= rps_ridx->num_delta_pocs; i++) {
  130. int used = rps->used[k] = get_bits1(gb);
  131. if (!used)
  132. use_delta_flag = get_bits1(gb);
  133. if (used || use_delta_flag) {
  134. if (i < rps_ridx->num_delta_pocs)
  135. delta_poc = delta_rps + rps_ridx->delta_poc[i];
  136. else
  137. delta_poc = delta_rps;
  138. rps->delta_poc[k] = delta_poc;
  139. if (delta_poc < 0)
  140. k0++;
  141. else
  142. k1++;
  143. k++;
  144. }
  145. }
  146. rps->num_delta_pocs = k;
  147. rps->num_negative_pics = k0;
  148. // sort in increasing order (smallest first)
  149. if (rps->num_delta_pocs != 0) {
  150. int used, tmp;
  151. for (i = 1; i < rps->num_delta_pocs; i++) {
  152. delta_poc = rps->delta_poc[i];
  153. used = rps->used[i];
  154. for (k = i - 1; k >= 0; k--) {
  155. tmp = rps->delta_poc[k];
  156. if (delta_poc < tmp) {
  157. rps->delta_poc[k + 1] = tmp;
  158. rps->used[k + 1] = rps->used[k];
  159. rps->delta_poc[k] = delta_poc;
  160. rps->used[k] = used;
  161. }
  162. }
  163. }
  164. }
  165. if ((rps->num_negative_pics >> 1) != 0) {
  166. int used;
  167. k = rps->num_negative_pics - 1;
  168. // flip the negative values to largest first
  169. for (i = 0; i < rps->num_negative_pics >> 1; i++) {
  170. delta_poc = rps->delta_poc[i];
  171. used = rps->used[i];
  172. rps->delta_poc[i] = rps->delta_poc[k];
  173. rps->used[i] = rps->used[k];
  174. rps->delta_poc[k] = delta_poc;
  175. rps->used[k] = used;
  176. k--;
  177. }
  178. }
  179. } else {
  180. unsigned int prev, nb_positive_pics;
  181. rps->num_negative_pics = get_ue_golomb_long(gb);
  182. nb_positive_pics = get_ue_golomb_long(gb);
  183. if (rps->num_negative_pics >= MAX_REFS ||
  184. nb_positive_pics >= MAX_REFS) {
  185. av_log(avctx, AV_LOG_ERROR, "Too many refs in a short term RPS.\n");
  186. return AVERROR_INVALIDDATA;
  187. }
  188. rps->num_delta_pocs = rps->num_negative_pics + nb_positive_pics;
  189. if (rps->num_delta_pocs) {
  190. prev = 0;
  191. for (i = 0; i < rps->num_negative_pics; i++) {
  192. delta_poc = get_ue_golomb_long(gb) + 1;
  193. prev -= delta_poc;
  194. rps->delta_poc[i] = prev;
  195. rps->used[i] = get_bits1(gb);
  196. }
  197. prev = 0;
  198. for (i = 0; i < nb_positive_pics; i++) {
  199. delta_poc = get_ue_golomb_long(gb) + 1;
  200. prev += delta_poc;
  201. rps->delta_poc[rps->num_negative_pics + i] = prev;
  202. rps->used[rps->num_negative_pics + i] = get_bits1(gb);
  203. }
  204. }
  205. }
  206. return 0;
  207. }
  208. static void decode_profile_tier_level(GetBitContext *gb, AVCodecContext *avctx,
  209. PTLCommon *ptl)
  210. {
  211. int i;
  212. ptl->profile_space = get_bits(gb, 2);
  213. ptl->tier_flag = get_bits1(gb);
  214. ptl->profile_idc = get_bits(gb, 5);
  215. if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN)
  216. av_log(avctx, AV_LOG_DEBUG, "Main profile bitstream\n");
  217. else if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN_10)
  218. av_log(avctx, AV_LOG_DEBUG, "Main 10 profile bitstream\n");
  219. else if (ptl->profile_idc == FF_PROFILE_HEVC_MAIN_STILL_PICTURE)
  220. av_log(avctx, AV_LOG_DEBUG, "Main Still Picture profile bitstream\n");
  221. else
  222. av_log(avctx, AV_LOG_WARNING, "Unknown HEVC profile: %d\n", ptl->profile_idc);
  223. for (i = 0; i < 32; i++) {
  224. ptl->profile_compatibility_flag[i] = get_bits1(gb);
  225. if (ptl->profile_idc == 0 && i > 0 && ptl->profile_compatibility_flag[i])
  226. ptl->profile_idc = i;
  227. }
  228. ptl->progressive_source_flag = get_bits1(gb);
  229. ptl->interlaced_source_flag = get_bits1(gb);
  230. ptl->non_packed_constraint_flag = get_bits1(gb);
  231. ptl->frame_only_constraint_flag = get_bits1(gb);
  232. skip_bits(gb, 16); // XXX_reserved_zero_44bits[0..15]
  233. skip_bits(gb, 16); // XXX_reserved_zero_44bits[16..31]
  234. skip_bits(gb, 12); // XXX_reserved_zero_44bits[32..43]
  235. }
  236. static void parse_ptl(GetBitContext *gb, AVCodecContext *avctx,
  237. PTL *ptl, int max_num_sub_layers)
  238. {
  239. int i;
  240. decode_profile_tier_level(gb, avctx, &ptl->general_ptl);
  241. ptl->general_ptl.level_idc = get_bits(gb, 8);
  242. for (i = 0; i < max_num_sub_layers - 1; i++) {
  243. ptl->sub_layer_profile_present_flag[i] = get_bits1(gb);
  244. ptl->sub_layer_level_present_flag[i] = get_bits1(gb);
  245. }
  246. if (max_num_sub_layers - 1 > 0)
  247. for (i = max_num_sub_layers - 1; i < 8; i++)
  248. skip_bits(gb, 2); // reserved_zero_2bits[i]
  249. for (i = 0; i < max_num_sub_layers - 1; i++) {
  250. if (ptl->sub_layer_profile_present_flag[i])
  251. decode_profile_tier_level(gb, avctx, &ptl->sub_layer_ptl[i]);
  252. if (ptl->sub_layer_level_present_flag[i])
  253. ptl->sub_layer_ptl[i].level_idc = get_bits(gb, 8);
  254. }
  255. }
  256. static void decode_sublayer_hrd(GetBitContext *gb, unsigned int nb_cpb,
  257. int subpic_params_present)
  258. {
  259. int i;
  260. for (i = 0; i < nb_cpb; i++) {
  261. get_ue_golomb_long(gb); // bit_rate_value_minus1
  262. get_ue_golomb_long(gb); // cpb_size_value_minus1
  263. if (subpic_params_present) {
  264. get_ue_golomb_long(gb); // cpb_size_du_value_minus1
  265. get_ue_golomb_long(gb); // bit_rate_du_value_minus1
  266. }
  267. skip_bits1(gb); // cbr_flag
  268. }
  269. }
  270. static void decode_hrd(GetBitContext *gb, int common_inf_present,
  271. int max_sublayers)
  272. {
  273. int nal_params_present = 0, vcl_params_present = 0;
  274. int subpic_params_present = 0;
  275. int i;
  276. if (common_inf_present) {
  277. nal_params_present = get_bits1(gb);
  278. vcl_params_present = get_bits1(gb);
  279. if (nal_params_present || vcl_params_present) {
  280. subpic_params_present = get_bits1(gb);
  281. if (subpic_params_present) {
  282. skip_bits(gb, 8); // tick_divisor_minus2
  283. skip_bits(gb, 5); // du_cpb_removal_delay_increment_length_minus1
  284. skip_bits(gb, 1); // sub_pic_cpb_params_in_pic_timing_sei_flag
  285. skip_bits(gb, 5); // dpb_output_delay_du_length_minus1
  286. }
  287. skip_bits(gb, 4); // bit_rate_scale
  288. skip_bits(gb, 4); // cpb_size_scale
  289. if (subpic_params_present)
  290. skip_bits(gb, 4); // cpb_size_du_scale
  291. skip_bits(gb, 5); // initial_cpb_removal_delay_length_minus1
  292. skip_bits(gb, 5); // au_cpb_removal_delay_length_minus1
  293. skip_bits(gb, 5); // dpb_output_delay_length_minus1
  294. }
  295. }
  296. for (i = 0; i < max_sublayers; i++) {
  297. int low_delay = 0;
  298. unsigned int nb_cpb = 1;
  299. int fixed_rate = get_bits1(gb);
  300. if (!fixed_rate)
  301. fixed_rate = get_bits1(gb);
  302. if (fixed_rate)
  303. get_ue_golomb_long(gb); // elemental_duration_in_tc_minus1
  304. else
  305. low_delay = get_bits1(gb);
  306. if (!low_delay)
  307. nb_cpb = get_ue_golomb_long(gb) + 1;
  308. if (nal_params_present)
  309. decode_sublayer_hrd(gb, nb_cpb, subpic_params_present);
  310. if (vcl_params_present)
  311. decode_sublayer_hrd(gb, nb_cpb, subpic_params_present);
  312. }
  313. }
  314. int ff_hevc_decode_nal_vps(GetBitContext *gb, AVCodecContext *avctx,
  315. HEVCParamSets *ps)
  316. {
  317. int i,j;
  318. int vps_id = 0;
  319. HEVCVPS *vps;
  320. AVBufferRef *vps_buf = av_buffer_allocz(sizeof(*vps));
  321. if (!vps_buf)
  322. return AVERROR(ENOMEM);
  323. vps = (HEVCVPS*)vps_buf->data;
  324. av_log(avctx, AV_LOG_DEBUG, "Decoding VPS\n");
  325. vps_id = get_bits(gb, 4);
  326. if (vps_id >= MAX_VPS_COUNT) {
  327. av_log(avctx, AV_LOG_ERROR, "VPS id out of range: %d\n", vps_id);
  328. goto err;
  329. }
  330. if (get_bits(gb, 2) != 3) { // vps_reserved_three_2bits
  331. av_log(avctx, AV_LOG_ERROR, "vps_reserved_three_2bits is not three\n");
  332. goto err;
  333. }
  334. vps->vps_max_layers = get_bits(gb, 6) + 1;
  335. vps->vps_max_sub_layers = get_bits(gb, 3) + 1;
  336. vps->vps_temporal_id_nesting_flag = get_bits1(gb);
  337. if (get_bits(gb, 16) != 0xffff) { // vps_reserved_ffff_16bits
  338. av_log(avctx, AV_LOG_ERROR, "vps_reserved_ffff_16bits is not 0xffff\n");
  339. goto err;
  340. }
  341. if (vps->vps_max_sub_layers > MAX_SUB_LAYERS) {
  342. av_log(avctx, AV_LOG_ERROR, "vps_max_sub_layers out of range: %d\n",
  343. vps->vps_max_sub_layers);
  344. goto err;
  345. }
  346. parse_ptl(gb, avctx, &vps->ptl, vps->vps_max_sub_layers);
  347. vps->vps_sub_layer_ordering_info_present_flag = get_bits1(gb);
  348. i = vps->vps_sub_layer_ordering_info_present_flag ? 0 : vps->vps_max_sub_layers - 1;
  349. for (; i < vps->vps_max_sub_layers; i++) {
  350. vps->vps_max_dec_pic_buffering[i] = get_ue_golomb_long(gb) + 1;
  351. vps->vps_num_reorder_pics[i] = get_ue_golomb_long(gb);
  352. vps->vps_max_latency_increase[i] = get_ue_golomb_long(gb) - 1;
  353. if (vps->vps_max_dec_pic_buffering[i] > MAX_DPB_SIZE) {
  354. av_log(avctx, AV_LOG_ERROR, "vps_max_dec_pic_buffering_minus1 out of range: %d\n",
  355. vps->vps_max_dec_pic_buffering[i] - 1);
  356. goto err;
  357. }
  358. if (vps->vps_num_reorder_pics[i] > vps->vps_max_dec_pic_buffering[i] - 1) {
  359. av_log(avctx, AV_LOG_WARNING, "vps_max_num_reorder_pics out of range: %d\n",
  360. vps->vps_num_reorder_pics[i]);
  361. if (avctx->err_recognition & AV_EF_EXPLODE)
  362. goto err;
  363. }
  364. }
  365. vps->vps_max_layer_id = get_bits(gb, 6);
  366. vps->vps_num_layer_sets = get_ue_golomb_long(gb) + 1;
  367. for (i = 1; i < vps->vps_num_layer_sets; i++)
  368. for (j = 0; j <= vps->vps_max_layer_id; j++)
  369. skip_bits(gb, 1); // layer_id_included_flag[i][j]
  370. vps->vps_timing_info_present_flag = get_bits1(gb);
  371. if (vps->vps_timing_info_present_flag) {
  372. vps->vps_num_units_in_tick = get_bits_long(gb, 32);
  373. vps->vps_time_scale = get_bits_long(gb, 32);
  374. vps->vps_poc_proportional_to_timing_flag = get_bits1(gb);
  375. if (vps->vps_poc_proportional_to_timing_flag)
  376. vps->vps_num_ticks_poc_diff_one = get_ue_golomb_long(gb) + 1;
  377. vps->vps_num_hrd_parameters = get_ue_golomb_long(gb);
  378. for (i = 0; i < vps->vps_num_hrd_parameters; i++) {
  379. int common_inf_present = 1;
  380. get_ue_golomb_long(gb); // hrd_layer_set_idx
  381. if (i)
  382. common_inf_present = get_bits1(gb);
  383. decode_hrd(gb, common_inf_present, vps->vps_max_sub_layers);
  384. }
  385. }
  386. get_bits1(gb); /* vps_extension_flag */
  387. if (ps->vps_list[vps_id] &&
  388. !memcmp(ps->vps_list[vps_id]->data, vps_buf->data, vps_buf->size)) {
  389. av_buffer_unref(&vps_buf);
  390. } else {
  391. remove_vps(ps, vps_id);
  392. ps->vps_list[vps_id] = vps_buf;
  393. }
  394. return 0;
  395. err:
  396. av_buffer_unref(&vps_buf);
  397. return AVERROR_INVALIDDATA;
  398. }
  399. static void decode_vui(GetBitContext *gb, AVCodecContext *avctx,
  400. int apply_defdispwin, HEVCSPS *sps)
  401. {
  402. VUI *vui = &sps->vui;
  403. int sar_present;
  404. av_log(avctx, AV_LOG_DEBUG, "Decoding VUI\n");
  405. sar_present = get_bits1(gb);
  406. if (sar_present) {
  407. uint8_t sar_idx = get_bits(gb, 8);
  408. if (sar_idx < FF_ARRAY_ELEMS(vui_sar))
  409. vui->sar = vui_sar[sar_idx];
  410. else if (sar_idx == 255) {
  411. vui->sar.num = get_bits(gb, 16);
  412. vui->sar.den = get_bits(gb, 16);
  413. } else
  414. av_log(avctx, AV_LOG_WARNING,
  415. "Unknown SAR index: %u.\n", sar_idx);
  416. }
  417. vui->overscan_info_present_flag = get_bits1(gb);
  418. if (vui->overscan_info_present_flag)
  419. vui->overscan_appropriate_flag = get_bits1(gb);
  420. vui->video_signal_type_present_flag = get_bits1(gb);
  421. if (vui->video_signal_type_present_flag) {
  422. vui->video_format = get_bits(gb, 3);
  423. vui->video_full_range_flag = get_bits1(gb);
  424. vui->colour_description_present_flag = get_bits1(gb);
  425. if (vui->video_full_range_flag && sps->pix_fmt == AV_PIX_FMT_YUV420P)
  426. sps->pix_fmt = AV_PIX_FMT_YUVJ420P;
  427. if (vui->colour_description_present_flag) {
  428. vui->colour_primaries = get_bits(gb, 8);
  429. vui->transfer_characteristic = get_bits(gb, 8);
  430. vui->matrix_coeffs = get_bits(gb, 8);
  431. // Set invalid values to "unspecified"
  432. if (vui->colour_primaries >= AVCOL_PRI_NB)
  433. vui->colour_primaries = AVCOL_PRI_UNSPECIFIED;
  434. if (vui->transfer_characteristic >= AVCOL_TRC_NB)
  435. vui->transfer_characteristic = AVCOL_TRC_UNSPECIFIED;
  436. if (vui->matrix_coeffs >= AVCOL_SPC_NB)
  437. vui->matrix_coeffs = AVCOL_SPC_UNSPECIFIED;
  438. }
  439. }
  440. vui->chroma_loc_info_present_flag = get_bits1(gb);
  441. if (vui->chroma_loc_info_present_flag) {
  442. vui->chroma_sample_loc_type_top_field = get_ue_golomb_long(gb);
  443. vui->chroma_sample_loc_type_bottom_field = get_ue_golomb_long(gb);
  444. }
  445. vui->neutra_chroma_indication_flag = get_bits1(gb);
  446. vui->field_seq_flag = get_bits1(gb);
  447. vui->frame_field_info_present_flag = get_bits1(gb);
  448. vui->default_display_window_flag = get_bits1(gb);
  449. if (vui->default_display_window_flag) {
  450. //TODO: * 2 is only valid for 420
  451. vui->def_disp_win.left_offset = get_ue_golomb_long(gb) * 2;
  452. vui->def_disp_win.right_offset = get_ue_golomb_long(gb) * 2;
  453. vui->def_disp_win.top_offset = get_ue_golomb_long(gb) * 2;
  454. vui->def_disp_win.bottom_offset = get_ue_golomb_long(gb) * 2;
  455. if (apply_defdispwin &&
  456. avctx->flags2 & AV_CODEC_FLAG2_IGNORE_CROP) {
  457. av_log(avctx, AV_LOG_DEBUG,
  458. "discarding vui default display window, "
  459. "original values are l:%u r:%u t:%u b:%u\n",
  460. vui->def_disp_win.left_offset,
  461. vui->def_disp_win.right_offset,
  462. vui->def_disp_win.top_offset,
  463. vui->def_disp_win.bottom_offset);
  464. vui->def_disp_win.left_offset =
  465. vui->def_disp_win.right_offset =
  466. vui->def_disp_win.top_offset =
  467. vui->def_disp_win.bottom_offset = 0;
  468. }
  469. }
  470. vui->vui_timing_info_present_flag = get_bits1(gb);
  471. if (vui->vui_timing_info_present_flag) {
  472. vui->vui_num_units_in_tick = get_bits_long(gb, 32);
  473. vui->vui_time_scale = get_bits_long(gb, 32);
  474. vui->vui_poc_proportional_to_timing_flag = get_bits1(gb);
  475. if (vui->vui_poc_proportional_to_timing_flag)
  476. vui->vui_num_ticks_poc_diff_one_minus1 = get_ue_golomb_long(gb);
  477. vui->vui_hrd_parameters_present_flag = get_bits1(gb);
  478. if (vui->vui_hrd_parameters_present_flag)
  479. decode_hrd(gb, 1, sps->max_sub_layers);
  480. }
  481. vui->bitstream_restriction_flag = get_bits1(gb);
  482. if (vui->bitstream_restriction_flag) {
  483. vui->tiles_fixed_structure_flag = get_bits1(gb);
  484. vui->motion_vectors_over_pic_boundaries_flag = get_bits1(gb);
  485. vui->restricted_ref_pic_lists_flag = get_bits1(gb);
  486. vui->min_spatial_segmentation_idc = get_ue_golomb_long(gb);
  487. vui->max_bytes_per_pic_denom = get_ue_golomb_long(gb);
  488. vui->max_bits_per_min_cu_denom = get_ue_golomb_long(gb);
  489. vui->log2_max_mv_length_horizontal = get_ue_golomb_long(gb);
  490. vui->log2_max_mv_length_vertical = get_ue_golomb_long(gb);
  491. }
  492. }
  493. static void set_default_scaling_list_data(ScalingList *sl)
  494. {
  495. int matrixId;
  496. for (matrixId = 0; matrixId < 6; matrixId++) {
  497. // 4x4 default is 16
  498. memset(sl->sl[0][matrixId], 16, 16);
  499. sl->sl_dc[0][matrixId] = 16; // default for 16x16
  500. sl->sl_dc[1][matrixId] = 16; // default for 32x32
  501. }
  502. memcpy(sl->sl[1][0], default_scaling_list_intra, 64);
  503. memcpy(sl->sl[1][1], default_scaling_list_intra, 64);
  504. memcpy(sl->sl[1][2], default_scaling_list_intra, 64);
  505. memcpy(sl->sl[1][3], default_scaling_list_inter, 64);
  506. memcpy(sl->sl[1][4], default_scaling_list_inter, 64);
  507. memcpy(sl->sl[1][5], default_scaling_list_inter, 64);
  508. memcpy(sl->sl[2][0], default_scaling_list_intra, 64);
  509. memcpy(sl->sl[2][1], default_scaling_list_intra, 64);
  510. memcpy(sl->sl[2][2], default_scaling_list_intra, 64);
  511. memcpy(sl->sl[2][3], default_scaling_list_inter, 64);
  512. memcpy(sl->sl[2][4], default_scaling_list_inter, 64);
  513. memcpy(sl->sl[2][5], default_scaling_list_inter, 64);
  514. memcpy(sl->sl[3][0], default_scaling_list_intra, 64);
  515. memcpy(sl->sl[3][1], default_scaling_list_inter, 64);
  516. }
  517. static int scaling_list_data(GetBitContext *gb, AVCodecContext *avctx, ScalingList *sl)
  518. {
  519. uint8_t scaling_list_pred_mode_flag[4][6];
  520. int32_t scaling_list_dc_coef[2][6];
  521. int size_id, matrix_id, i, pos;
  522. for (size_id = 0; size_id < 4; size_id++)
  523. for (matrix_id = 0; matrix_id < (size_id == 3 ? 2 : 6); matrix_id++) {
  524. scaling_list_pred_mode_flag[size_id][matrix_id] = get_bits1(gb);
  525. if (!scaling_list_pred_mode_flag[size_id][matrix_id]) {
  526. unsigned int delta = get_ue_golomb_long(gb);
  527. /* Only need to handle non-zero delta. Zero means default,
  528. * which should already be in the arrays. */
  529. if (delta) {
  530. // Copy from previous array.
  531. if (matrix_id < delta) {
  532. av_log(avctx, AV_LOG_ERROR,
  533. "Invalid delta in scaling list data: %d.\n", delta);
  534. return AVERROR_INVALIDDATA;
  535. }
  536. memcpy(sl->sl[size_id][matrix_id],
  537. sl->sl[size_id][matrix_id - delta],
  538. size_id > 0 ? 64 : 16);
  539. if (size_id > 1)
  540. sl->sl_dc[size_id - 2][matrix_id] = sl->sl_dc[size_id - 2][matrix_id - delta];
  541. }
  542. } else {
  543. int next_coef, coef_num;
  544. int32_t scaling_list_delta_coef;
  545. next_coef = 8;
  546. coef_num = FFMIN(64, 1 << (4 + (size_id << 1)));
  547. if (size_id > 1) {
  548. scaling_list_dc_coef[size_id - 2][matrix_id] = get_se_golomb(gb) + 8;
  549. next_coef = scaling_list_dc_coef[size_id - 2][matrix_id];
  550. sl->sl_dc[size_id - 2][matrix_id] = next_coef;
  551. }
  552. for (i = 0; i < coef_num; i++) {
  553. if (size_id == 0)
  554. pos = 4 * ff_hevc_diag_scan4x4_y[i] +
  555. ff_hevc_diag_scan4x4_x[i];
  556. else
  557. pos = 8 * ff_hevc_diag_scan8x8_y[i] +
  558. ff_hevc_diag_scan8x8_x[i];
  559. scaling_list_delta_coef = get_se_golomb(gb);
  560. next_coef = (next_coef + scaling_list_delta_coef + 256) % 256;
  561. sl->sl[size_id][matrix_id][pos] = next_coef;
  562. }
  563. }
  564. }
  565. return 0;
  566. }
  567. static int map_pixel_format(AVCodecContext *avctx, HEVCSPS *sps)
  568. {
  569. const AVPixFmtDescriptor *desc;
  570. if (sps->chroma_format_idc == 1) {
  571. switch (sps->bit_depth) {
  572. case 8: sps->pix_fmt = AV_PIX_FMT_YUV420P; break;
  573. case 9: sps->pix_fmt = AV_PIX_FMT_YUV420P9; break;
  574. case 10: sps->pix_fmt = AV_PIX_FMT_YUV420P10; break;
  575. default:
  576. av_log(avctx, AV_LOG_ERROR, "Unsupported bit depth: %d\n",
  577. sps->bit_depth);
  578. return AVERROR_PATCHWELCOME;
  579. }
  580. } else {
  581. av_log(avctx, AV_LOG_ERROR,
  582. "non-4:2:0 support is currently unspecified.\n");
  583. return AVERROR_PATCHWELCOME;
  584. }
  585. desc = av_pix_fmt_desc_get(sps->pix_fmt);
  586. if (!desc)
  587. return AVERROR(EINVAL);
  588. sps->hshift[0] = sps->vshift[0] = 0;
  589. sps->hshift[2] = sps->hshift[1] = desc->log2_chroma_w;
  590. sps->vshift[2] = sps->vshift[1] = desc->log2_chroma_h;
  591. sps->pixel_shift = sps->bit_depth > 8;
  592. return 0;
  593. }
  594. int ff_hevc_parse_sps(HEVCSPS *sps, GetBitContext *gb, unsigned int *sps_id,
  595. int apply_defdispwin, AVBufferRef **vps_list, AVCodecContext *avctx)
  596. {
  597. int ret = 0;
  598. int log2_diff_max_min_transform_block_size;
  599. int bit_depth_chroma, start, vui_present, sublayer_ordering_info;
  600. int i;
  601. // Coded parameters
  602. sps->vps_id = get_bits(gb, 4);
  603. if (sps->vps_id >= MAX_VPS_COUNT) {
  604. av_log(avctx, AV_LOG_ERROR, "VPS id out of range: %d\n", sps->vps_id);
  605. ret = AVERROR_INVALIDDATA;
  606. goto err;
  607. }
  608. if (vps_list && !vps_list[sps->vps_id]) {
  609. av_log(avctx, AV_LOG_ERROR, "VPS %d does not exist\n",
  610. sps->vps_id);
  611. ret = AVERROR_INVALIDDATA;
  612. goto err;
  613. }
  614. sps->max_sub_layers = get_bits(gb, 3) + 1;
  615. if (sps->max_sub_layers > MAX_SUB_LAYERS) {
  616. av_log(avctx, AV_LOG_ERROR, "sps_max_sub_layers out of range: %d\n",
  617. sps->max_sub_layers);
  618. ret = AVERROR_INVALIDDATA;
  619. goto err;
  620. }
  621. skip_bits1(gb); // temporal_id_nesting_flag
  622. parse_ptl(gb, avctx, &sps->ptl, sps->max_sub_layers);
  623. *sps_id = get_ue_golomb_long(gb);
  624. if (*sps_id >= MAX_SPS_COUNT) {
  625. av_log(avctx, AV_LOG_ERROR, "SPS id out of range: %d\n", *sps_id);
  626. ret = AVERROR_INVALIDDATA;
  627. goto err;
  628. }
  629. sps->chroma_format_idc = get_ue_golomb_long(gb);
  630. if (sps->chroma_format_idc != 1) {
  631. avpriv_report_missing_feature(avctx, "chroma_format_idc %d",
  632. sps->chroma_format_idc);
  633. ret = AVERROR_PATCHWELCOME;
  634. goto err;
  635. }
  636. if (sps->chroma_format_idc == 3)
  637. sps->separate_colour_plane_flag = get_bits1(gb);
  638. sps->width = get_ue_golomb_long(gb);
  639. sps->height = get_ue_golomb_long(gb);
  640. if ((ret = av_image_check_size(sps->width,
  641. sps->height, 0, avctx)) < 0)
  642. goto err;
  643. if (get_bits1(gb)) { // pic_conformance_flag
  644. //TODO: * 2 is only valid for 420
  645. sps->pic_conf_win.left_offset = get_ue_golomb_long(gb) * 2;
  646. sps->pic_conf_win.right_offset = get_ue_golomb_long(gb) * 2;
  647. sps->pic_conf_win.top_offset = get_ue_golomb_long(gb) * 2;
  648. sps->pic_conf_win.bottom_offset = get_ue_golomb_long(gb) * 2;
  649. if (avctx->flags2 & AV_CODEC_FLAG2_IGNORE_CROP) {
  650. av_log(avctx, AV_LOG_DEBUG,
  651. "discarding sps conformance window, "
  652. "original values are l:%u r:%u t:%u b:%u\n",
  653. sps->pic_conf_win.left_offset,
  654. sps->pic_conf_win.right_offset,
  655. sps->pic_conf_win.top_offset,
  656. sps->pic_conf_win.bottom_offset);
  657. sps->pic_conf_win.left_offset =
  658. sps->pic_conf_win.right_offset =
  659. sps->pic_conf_win.top_offset =
  660. sps->pic_conf_win.bottom_offset = 0;
  661. }
  662. sps->output_window = sps->pic_conf_win;
  663. }
  664. sps->bit_depth = get_ue_golomb_long(gb) + 8;
  665. bit_depth_chroma = get_ue_golomb_long(gb) + 8;
  666. if (bit_depth_chroma != sps->bit_depth) {
  667. av_log(avctx, AV_LOG_ERROR,
  668. "Luma bit depth (%d) is different from chroma bit depth (%d), "
  669. "this is unsupported.\n",
  670. sps->bit_depth, bit_depth_chroma);
  671. ret = AVERROR_INVALIDDATA;
  672. goto err;
  673. }
  674. ret = map_pixel_format(avctx, sps);
  675. if (ret < 0)
  676. goto err;
  677. sps->log2_max_poc_lsb = get_ue_golomb_long(gb) + 4;
  678. if (sps->log2_max_poc_lsb > 16) {
  679. av_log(avctx, AV_LOG_ERROR, "log2_max_pic_order_cnt_lsb_minus4 out range: %d\n",
  680. sps->log2_max_poc_lsb - 4);
  681. ret = AVERROR_INVALIDDATA;
  682. goto err;
  683. }
  684. sublayer_ordering_info = get_bits1(gb);
  685. start = sublayer_ordering_info ? 0 : sps->max_sub_layers - 1;
  686. for (i = start; i < sps->max_sub_layers; i++) {
  687. sps->temporal_layer[i].max_dec_pic_buffering = get_ue_golomb_long(gb) + 1;
  688. sps->temporal_layer[i].num_reorder_pics = get_ue_golomb_long(gb);
  689. sps->temporal_layer[i].max_latency_increase = get_ue_golomb_long(gb) - 1;
  690. if (sps->temporal_layer[i].max_dec_pic_buffering > MAX_DPB_SIZE) {
  691. av_log(avctx, AV_LOG_ERROR, "sps_max_dec_pic_buffering_minus1 out of range: %d\n",
  692. sps->temporal_layer[i].max_dec_pic_buffering - 1);
  693. ret = AVERROR_INVALIDDATA;
  694. goto err;
  695. }
  696. if (sps->temporal_layer[i].num_reorder_pics > sps->temporal_layer[i].max_dec_pic_buffering - 1) {
  697. av_log(avctx, AV_LOG_WARNING, "sps_max_num_reorder_pics out of range: %d\n",
  698. sps->temporal_layer[i].num_reorder_pics);
  699. if (avctx->err_recognition & AV_EF_EXPLODE ||
  700. sps->temporal_layer[i].num_reorder_pics > MAX_DPB_SIZE - 1) {
  701. ret = AVERROR_INVALIDDATA;
  702. goto err;
  703. }
  704. sps->temporal_layer[i].max_dec_pic_buffering = sps->temporal_layer[i].num_reorder_pics + 1;
  705. }
  706. }
  707. if (!sublayer_ordering_info) {
  708. for (i = 0; i < start; i++) {
  709. sps->temporal_layer[i].max_dec_pic_buffering = sps->temporal_layer[start].max_dec_pic_buffering;
  710. sps->temporal_layer[i].num_reorder_pics = sps->temporal_layer[start].num_reorder_pics;
  711. sps->temporal_layer[i].max_latency_increase = sps->temporal_layer[start].max_latency_increase;
  712. }
  713. }
  714. sps->log2_min_cb_size = get_ue_golomb_long(gb) + 3;
  715. sps->log2_diff_max_min_coding_block_size = get_ue_golomb_long(gb);
  716. sps->log2_min_tb_size = get_ue_golomb_long(gb) + 2;
  717. log2_diff_max_min_transform_block_size = get_ue_golomb_long(gb);
  718. sps->log2_max_trafo_size = log2_diff_max_min_transform_block_size +
  719. sps->log2_min_tb_size;
  720. if (sps->log2_min_tb_size >= sps->log2_min_cb_size) {
  721. av_log(avctx, AV_LOG_ERROR, "Invalid value for log2_min_tb_size");
  722. ret = AVERROR_INVALIDDATA;
  723. goto err;
  724. }
  725. sps->max_transform_hierarchy_depth_inter = get_ue_golomb_long(gb);
  726. sps->max_transform_hierarchy_depth_intra = get_ue_golomb_long(gb);
  727. sps->scaling_list_enable_flag = get_bits1(gb);
  728. if (sps->scaling_list_enable_flag) {
  729. set_default_scaling_list_data(&sps->scaling_list);
  730. if (get_bits1(gb)) {
  731. ret = scaling_list_data(gb, avctx, &sps->scaling_list);
  732. if (ret < 0)
  733. goto err;
  734. }
  735. }
  736. sps->amp_enabled_flag = get_bits1(gb);
  737. sps->sao_enabled = get_bits1(gb);
  738. sps->pcm_enabled_flag = get_bits1(gb);
  739. if (sps->pcm_enabled_flag) {
  740. sps->pcm.bit_depth = get_bits(gb, 4) + 1;
  741. sps->pcm.bit_depth_chroma = get_bits(gb, 4) + 1;
  742. sps->pcm.log2_min_pcm_cb_size = get_ue_golomb_long(gb) + 3;
  743. sps->pcm.log2_max_pcm_cb_size = sps->pcm.log2_min_pcm_cb_size +
  744. get_ue_golomb_long(gb);
  745. if (sps->pcm.bit_depth > sps->bit_depth) {
  746. av_log(avctx, AV_LOG_ERROR,
  747. "PCM bit depth (%d) is greater than normal bit depth (%d)\n",
  748. sps->pcm.bit_depth, sps->bit_depth);
  749. ret = AVERROR_INVALIDDATA;
  750. goto err;
  751. }
  752. sps->pcm.loop_filter_disable_flag = get_bits1(gb);
  753. }
  754. sps->nb_st_rps = get_ue_golomb_long(gb);
  755. if (sps->nb_st_rps > MAX_SHORT_TERM_RPS_COUNT) {
  756. av_log(avctx, AV_LOG_ERROR, "Too many short term RPS: %d.\n",
  757. sps->nb_st_rps);
  758. ret = AVERROR_INVALIDDATA;
  759. goto err;
  760. }
  761. for (i = 0; i < sps->nb_st_rps; i++) {
  762. if ((ret = ff_hevc_decode_short_term_rps(gb, avctx, &sps->st_rps[i],
  763. sps, 0)) < 0)
  764. goto err;
  765. }
  766. sps->long_term_ref_pics_present_flag = get_bits1(gb);
  767. if (sps->long_term_ref_pics_present_flag) {
  768. sps->num_long_term_ref_pics_sps = get_ue_golomb_long(gb);
  769. for (i = 0; i < sps->num_long_term_ref_pics_sps; i++) {
  770. sps->lt_ref_pic_poc_lsb_sps[i] = get_bits(gb, sps->log2_max_poc_lsb);
  771. sps->used_by_curr_pic_lt_sps_flag[i] = get_bits1(gb);
  772. }
  773. }
  774. sps->sps_temporal_mvp_enabled_flag = get_bits1(gb);
  775. sps->sps_strong_intra_smoothing_enable_flag = get_bits1(gb);
  776. sps->vui.sar = (AVRational){0, 1};
  777. vui_present = get_bits1(gb);
  778. if (vui_present)
  779. decode_vui(gb, avctx, apply_defdispwin, sps);
  780. skip_bits1(gb); // sps_extension_flag
  781. if (apply_defdispwin) {
  782. sps->output_window.left_offset += sps->vui.def_disp_win.left_offset;
  783. sps->output_window.right_offset += sps->vui.def_disp_win.right_offset;
  784. sps->output_window.top_offset += sps->vui.def_disp_win.top_offset;
  785. sps->output_window.bottom_offset += sps->vui.def_disp_win.bottom_offset;
  786. }
  787. if (sps->output_window.left_offset & (0x1F >> (sps->pixel_shift)) &&
  788. !(avctx->flags & AV_CODEC_FLAG_UNALIGNED)) {
  789. sps->output_window.left_offset &= ~(0x1F >> (sps->pixel_shift));
  790. av_log(avctx, AV_LOG_WARNING, "Reducing left output window to %d "
  791. "chroma samples to preserve alignment.\n",
  792. sps->output_window.left_offset);
  793. }
  794. sps->output_width = sps->width -
  795. (sps->output_window.left_offset + sps->output_window.right_offset);
  796. sps->output_height = sps->height -
  797. (sps->output_window.top_offset + sps->output_window.bottom_offset);
  798. if (sps->output_width <= 0 || sps->output_height <= 0) {
  799. av_log(avctx, AV_LOG_WARNING, "Invalid visible frame dimensions: %dx%d.\n",
  800. sps->output_width, sps->output_height);
  801. if (avctx->err_recognition & AV_EF_EXPLODE) {
  802. ret = AVERROR_INVALIDDATA;
  803. goto err;
  804. }
  805. av_log(avctx, AV_LOG_WARNING,
  806. "Displaying the whole video surface.\n");
  807. sps->output_window.left_offset =
  808. sps->output_window.right_offset =
  809. sps->output_window.top_offset =
  810. sps->output_window.bottom_offset = 0;
  811. sps->output_width = sps->width;
  812. sps->output_height = sps->height;
  813. }
  814. // Inferred parameters
  815. sps->log2_ctb_size = sps->log2_min_cb_size +
  816. sps->log2_diff_max_min_coding_block_size;
  817. sps->log2_min_pu_size = sps->log2_min_cb_size - 1;
  818. sps->ctb_width = (sps->width + (1 << sps->log2_ctb_size) - 1) >> sps->log2_ctb_size;
  819. sps->ctb_height = (sps->height + (1 << sps->log2_ctb_size) - 1) >> sps->log2_ctb_size;
  820. sps->ctb_size = sps->ctb_width * sps->ctb_height;
  821. sps->min_cb_width = sps->width >> sps->log2_min_cb_size;
  822. sps->min_cb_height = sps->height >> sps->log2_min_cb_size;
  823. sps->min_tb_width = sps->width >> sps->log2_min_tb_size;
  824. sps->min_tb_height = sps->height >> sps->log2_min_tb_size;
  825. sps->min_pu_width = sps->width >> sps->log2_min_pu_size;
  826. sps->min_pu_height = sps->height >> sps->log2_min_pu_size;
  827. sps->qp_bd_offset = 6 * (sps->bit_depth - 8);
  828. if (sps->width & ((1 << sps->log2_min_cb_size) - 1) ||
  829. sps->height & ((1 << sps->log2_min_cb_size) - 1)) {
  830. av_log(avctx, AV_LOG_ERROR, "Invalid coded frame dimensions.\n");
  831. goto err;
  832. }
  833. if (sps->log2_ctb_size > MAX_LOG2_CTB_SIZE) {
  834. av_log(avctx, AV_LOG_ERROR, "CTB size out of range: 2^%d\n", sps->log2_ctb_size);
  835. goto err;
  836. }
  837. if (sps->max_transform_hierarchy_depth_inter > sps->log2_ctb_size - sps->log2_min_tb_size) {
  838. av_log(avctx, AV_LOG_ERROR, "max_transform_hierarchy_depth_inter out of range: %d\n",
  839. sps->max_transform_hierarchy_depth_inter);
  840. goto err;
  841. }
  842. if (sps->max_transform_hierarchy_depth_intra > sps->log2_ctb_size - sps->log2_min_tb_size) {
  843. av_log(avctx, AV_LOG_ERROR, "max_transform_hierarchy_depth_intra out of range: %d\n",
  844. sps->max_transform_hierarchy_depth_intra);
  845. goto err;
  846. }
  847. if (sps->log2_max_trafo_size > FFMIN(sps->log2_ctb_size, 5)) {
  848. av_log(avctx, AV_LOG_ERROR,
  849. "max transform block size out of range: %d\n",
  850. sps->log2_max_trafo_size);
  851. goto err;
  852. }
  853. return 0;
  854. err:
  855. return ret < 0 ? ret : AVERROR_INVALIDDATA;
  856. }
  857. int ff_hevc_decode_nal_sps(GetBitContext *gb, AVCodecContext *avctx,
  858. HEVCParamSets *ps, int apply_defdispwin)
  859. {
  860. HEVCSPS *sps;
  861. AVBufferRef *sps_buf = av_buffer_allocz(sizeof(*sps));
  862. unsigned int sps_id;
  863. int ret;
  864. if (!sps_buf)
  865. return AVERROR(ENOMEM);
  866. sps = (HEVCSPS*)sps_buf->data;
  867. av_log(avctx, AV_LOG_DEBUG, "Decoding SPS\n");
  868. ret = ff_hevc_parse_sps(sps, gb, &sps_id,
  869. apply_defdispwin,
  870. ps->vps_list, avctx);
  871. if (ret < 0) {
  872. av_buffer_unref(&sps_buf);
  873. return ret;
  874. }
  875. if (avctx->debug & FF_DEBUG_BITSTREAM) {
  876. av_log(avctx, AV_LOG_DEBUG,
  877. "Parsed SPS: id %d; coded wxh: %dx%d; "
  878. "cropped wxh: %dx%d; pix_fmt: %s.\n",
  879. sps_id, sps->width, sps->height,
  880. sps->output_width, sps->output_height,
  881. av_get_pix_fmt_name(sps->pix_fmt));
  882. }
  883. /* check if this is a repeat of an already parsed SPS, then keep the
  884. * original one.
  885. * otherwise drop all PPSes that depend on it */
  886. if (ps->sps_list[sps_id] &&
  887. !memcmp(ps->sps_list[sps_id]->data, sps_buf->data, sps_buf->size)) {
  888. av_buffer_unref(&sps_buf);
  889. } else {
  890. remove_sps(ps, sps_id);
  891. ps->sps_list[sps_id] = sps_buf;
  892. }
  893. return 0;
  894. }
  895. static void hevc_pps_free(void *opaque, uint8_t *data)
  896. {
  897. HEVCPPS *pps = (HEVCPPS*)data;
  898. av_freep(&pps->column_width);
  899. av_freep(&pps->row_height);
  900. av_freep(&pps->col_bd);
  901. av_freep(&pps->row_bd);
  902. av_freep(&pps->col_idxX);
  903. av_freep(&pps->ctb_addr_rs_to_ts);
  904. av_freep(&pps->ctb_addr_ts_to_rs);
  905. av_freep(&pps->tile_pos_rs);
  906. av_freep(&pps->tile_id);
  907. av_freep(&pps->min_tb_addr_zs);
  908. av_freep(&pps);
  909. }
  910. static inline int setup_pps(AVCodecContext *avctx, GetBitContext *gb,
  911. HEVCPPS *pps, HEVCSPS *sps)
  912. {
  913. int log2_diff;
  914. int pic_area_in_ctbs, pic_area_in_min_tbs;
  915. int i, j, x, y, ctb_addr_rs, tile_id;
  916. // Inferred parameters
  917. pps->col_bd = av_malloc_array(pps->num_tile_columns + 1, sizeof(*pps->col_bd));
  918. pps->row_bd = av_malloc_array(pps->num_tile_rows + 1, sizeof(*pps->row_bd));
  919. pps->col_idxX = av_malloc_array(sps->ctb_width, sizeof(*pps->col_idxX));
  920. if (!pps->col_bd || !pps->row_bd || !pps->col_idxX)
  921. return AVERROR(ENOMEM);
  922. if (pps->uniform_spacing_flag) {
  923. if (!pps->column_width) {
  924. pps->column_width = av_malloc_array(pps->num_tile_columns, sizeof(*pps->column_width));
  925. pps->row_height = av_malloc_array(pps->num_tile_rows, sizeof(*pps->row_height));
  926. }
  927. if (!pps->column_width || !pps->row_height)
  928. return AVERROR(ENOMEM);
  929. for (i = 0; i < pps->num_tile_columns; i++) {
  930. pps->column_width[i] = ((i + 1) * sps->ctb_width) / pps->num_tile_columns -
  931. (i * sps->ctb_width) / pps->num_tile_columns;
  932. }
  933. for (i = 0; i < pps->num_tile_rows; i++) {
  934. pps->row_height[i] = ((i + 1) * sps->ctb_height) / pps->num_tile_rows -
  935. (i * sps->ctb_height) / pps->num_tile_rows;
  936. }
  937. }
  938. pps->col_bd[0] = 0;
  939. for (i = 0; i < pps->num_tile_columns; i++)
  940. pps->col_bd[i + 1] = pps->col_bd[i] + pps->column_width[i];
  941. pps->row_bd[0] = 0;
  942. for (i = 0; i < pps->num_tile_rows; i++)
  943. pps->row_bd[i + 1] = pps->row_bd[i] + pps->row_height[i];
  944. for (i = 0, j = 0; i < sps->ctb_width; i++) {
  945. if (i > pps->col_bd[j])
  946. j++;
  947. pps->col_idxX[i] = j;
  948. }
  949. /**
  950. * 6.5
  951. */
  952. pic_area_in_ctbs = sps->ctb_width * sps->ctb_height;
  953. pic_area_in_min_tbs = sps->min_tb_width * sps->min_tb_height;
  954. pps->ctb_addr_rs_to_ts = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->ctb_addr_rs_to_ts));
  955. pps->ctb_addr_ts_to_rs = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->ctb_addr_ts_to_rs));
  956. pps->tile_id = av_malloc_array(pic_area_in_ctbs, sizeof(*pps->tile_id));
  957. pps->min_tb_addr_zs = av_malloc_array(pic_area_in_min_tbs, sizeof(*pps->min_tb_addr_zs));
  958. if (!pps->ctb_addr_rs_to_ts || !pps->ctb_addr_ts_to_rs ||
  959. !pps->tile_id || !pps->min_tb_addr_zs) {
  960. return AVERROR(ENOMEM);
  961. }
  962. for (ctb_addr_rs = 0; ctb_addr_rs < pic_area_in_ctbs; ctb_addr_rs++) {
  963. int tb_x = ctb_addr_rs % sps->ctb_width;
  964. int tb_y = ctb_addr_rs / sps->ctb_width;
  965. int tile_x = 0;
  966. int tile_y = 0;
  967. int val = 0;
  968. for (i = 0; i < pps->num_tile_columns; i++) {
  969. if (tb_x < pps->col_bd[i + 1]) {
  970. tile_x = i;
  971. break;
  972. }
  973. }
  974. for (i = 0; i < pps->num_tile_rows; i++) {
  975. if (tb_y < pps->row_bd[i + 1]) {
  976. tile_y = i;
  977. break;
  978. }
  979. }
  980. for (i = 0; i < tile_x; i++)
  981. val += pps->row_height[tile_y] * pps->column_width[i];
  982. for (i = 0; i < tile_y; i++)
  983. val += sps->ctb_width * pps->row_height[i];
  984. val += (tb_y - pps->row_bd[tile_y]) * pps->column_width[tile_x] +
  985. tb_x - pps->col_bd[tile_x];
  986. pps->ctb_addr_rs_to_ts[ctb_addr_rs] = val;
  987. pps->ctb_addr_ts_to_rs[val] = ctb_addr_rs;
  988. }
  989. for (j = 0, tile_id = 0; j < pps->num_tile_rows; j++)
  990. for (i = 0; i < pps->num_tile_columns; i++, tile_id++)
  991. for (y = pps->row_bd[j]; y < pps->row_bd[j + 1]; y++)
  992. for (x = pps->col_bd[i]; x < pps->col_bd[i + 1]; x++)
  993. pps->tile_id[pps->ctb_addr_rs_to_ts[y * sps->ctb_width + x]] = tile_id;
  994. pps->tile_pos_rs = av_malloc_array(tile_id, sizeof(*pps->tile_pos_rs));
  995. if (!pps->tile_pos_rs)
  996. return AVERROR(ENOMEM);
  997. for (j = 0; j < pps->num_tile_rows; j++)
  998. for (i = 0; i < pps->num_tile_columns; i++)
  999. pps->tile_pos_rs[j * pps->num_tile_columns + i] =
  1000. pps->row_bd[j] * sps->ctb_width + pps->col_bd[i];
  1001. log2_diff = sps->log2_ctb_size - sps->log2_min_tb_size;
  1002. for (y = 0; y < sps->min_tb_height; y++) {
  1003. for (x = 0; x < sps->min_tb_width; x++) {
  1004. int tb_x = x >> log2_diff;
  1005. int tb_y = y >> log2_diff;
  1006. int rs = sps->ctb_width * tb_y + tb_x;
  1007. int val = pps->ctb_addr_rs_to_ts[rs] << (log2_diff * 2);
  1008. for (i = 0; i < log2_diff; i++) {
  1009. int m = 1 << i;
  1010. val += (m & x ? m * m : 0) + (m & y ? 2 * m * m : 0);
  1011. }
  1012. pps->min_tb_addr_zs[y * sps->min_tb_width + x] = val;
  1013. }
  1014. }
  1015. return 0;
  1016. }
  1017. int ff_hevc_decode_nal_pps(GetBitContext *gb, AVCodecContext *avctx,
  1018. HEVCParamSets *ps)
  1019. {
  1020. HEVCSPS *sps = NULL;
  1021. int i, ret = 0;
  1022. unsigned int pps_id = 0;
  1023. AVBufferRef *pps_buf;
  1024. HEVCPPS *pps = av_mallocz(sizeof(*pps));
  1025. if (!pps)
  1026. return AVERROR(ENOMEM);
  1027. pps_buf = av_buffer_create((uint8_t *)pps, sizeof(*pps),
  1028. hevc_pps_free, NULL, 0);
  1029. if (!pps_buf) {
  1030. av_freep(&pps);
  1031. return AVERROR(ENOMEM);
  1032. }
  1033. av_log(avctx, AV_LOG_DEBUG, "Decoding PPS\n");
  1034. // Default values
  1035. pps->loop_filter_across_tiles_enabled_flag = 1;
  1036. pps->num_tile_columns = 1;
  1037. pps->num_tile_rows = 1;
  1038. pps->uniform_spacing_flag = 1;
  1039. pps->disable_dbf = 0;
  1040. pps->beta_offset = 0;
  1041. pps->tc_offset = 0;
  1042. // Coded parameters
  1043. pps_id = get_ue_golomb_long(gb);
  1044. if (pps_id >= MAX_PPS_COUNT) {
  1045. av_log(avctx, AV_LOG_ERROR, "PPS id out of range: %d\n", pps_id);
  1046. ret = AVERROR_INVALIDDATA;
  1047. goto err;
  1048. }
  1049. pps->sps_id = get_ue_golomb_long(gb);
  1050. if (pps->sps_id >= MAX_SPS_COUNT) {
  1051. av_log(avctx, AV_LOG_ERROR, "SPS id out of range: %d\n", pps->sps_id);
  1052. ret = AVERROR_INVALIDDATA;
  1053. goto err;
  1054. }
  1055. if (!ps->sps_list[pps->sps_id]) {
  1056. av_log(avctx, AV_LOG_ERROR, "SPS %u does not exist.\n", pps->sps_id);
  1057. ret = AVERROR_INVALIDDATA;
  1058. goto err;
  1059. }
  1060. sps = (HEVCSPS *)ps->sps_list[pps->sps_id]->data;
  1061. pps->dependent_slice_segments_enabled_flag = get_bits1(gb);
  1062. pps->output_flag_present_flag = get_bits1(gb);
  1063. pps->num_extra_slice_header_bits = get_bits(gb, 3);
  1064. pps->sign_data_hiding_flag = get_bits1(gb);
  1065. pps->cabac_init_present_flag = get_bits1(gb);
  1066. pps->num_ref_idx_l0_default_active = get_ue_golomb_long(gb) + 1;
  1067. pps->num_ref_idx_l1_default_active = get_ue_golomb_long(gb) + 1;
  1068. pps->pic_init_qp_minus26 = get_se_golomb(gb);
  1069. pps->constrained_intra_pred_flag = get_bits1(gb);
  1070. pps->transform_skip_enabled_flag = get_bits1(gb);
  1071. pps->cu_qp_delta_enabled_flag = get_bits1(gb);
  1072. pps->diff_cu_qp_delta_depth = 0;
  1073. if (pps->cu_qp_delta_enabled_flag)
  1074. pps->diff_cu_qp_delta_depth = get_ue_golomb_long(gb);
  1075. pps->cb_qp_offset = get_se_golomb(gb);
  1076. if (pps->cb_qp_offset < -12 || pps->cb_qp_offset > 12) {
  1077. av_log(avctx, AV_LOG_ERROR, "pps_cb_qp_offset out of range: %d\n",
  1078. pps->cb_qp_offset);
  1079. ret = AVERROR_INVALIDDATA;
  1080. goto err;
  1081. }
  1082. pps->cr_qp_offset = get_se_golomb(gb);
  1083. if (pps->cr_qp_offset < -12 || pps->cr_qp_offset > 12) {
  1084. av_log(avctx, AV_LOG_ERROR, "pps_cr_qp_offset out of range: %d\n",
  1085. pps->cr_qp_offset);
  1086. ret = AVERROR_INVALIDDATA;
  1087. goto err;
  1088. }
  1089. pps->pic_slice_level_chroma_qp_offsets_present_flag = get_bits1(gb);
  1090. pps->weighted_pred_flag = get_bits1(gb);
  1091. pps->weighted_bipred_flag = get_bits1(gb);
  1092. pps->transquant_bypass_enable_flag = get_bits1(gb);
  1093. pps->tiles_enabled_flag = get_bits1(gb);
  1094. pps->entropy_coding_sync_enabled_flag = get_bits1(gb);
  1095. if (pps->tiles_enabled_flag) {
  1096. pps->num_tile_columns = get_ue_golomb_long(gb) + 1;
  1097. pps->num_tile_rows = get_ue_golomb_long(gb) + 1;
  1098. if (pps->num_tile_columns == 0 ||
  1099. pps->num_tile_columns >= sps->width) {
  1100. av_log(avctx, AV_LOG_ERROR, "num_tile_columns_minus1 out of range: %d\n",
  1101. pps->num_tile_columns - 1);
  1102. ret = AVERROR_INVALIDDATA;
  1103. goto err;
  1104. }
  1105. if (pps->num_tile_rows == 0 ||
  1106. pps->num_tile_rows >= sps->height) {
  1107. av_log(avctx, AV_LOG_ERROR, "num_tile_rows_minus1 out of range: %d\n",
  1108. pps->num_tile_rows - 1);
  1109. ret = AVERROR_INVALIDDATA;
  1110. goto err;
  1111. }
  1112. pps->column_width = av_malloc_array(pps->num_tile_columns, sizeof(*pps->column_width));
  1113. pps->row_height = av_malloc_array(pps->num_tile_rows, sizeof(*pps->row_height));
  1114. if (!pps->column_width || !pps->row_height) {
  1115. ret = AVERROR(ENOMEM);
  1116. goto err;
  1117. }
  1118. pps->uniform_spacing_flag = get_bits1(gb);
  1119. if (!pps->uniform_spacing_flag) {
  1120. uint64_t sum = 0;
  1121. for (i = 0; i < pps->num_tile_columns - 1; i++) {
  1122. pps->column_width[i] = get_ue_golomb_long(gb) + 1;
  1123. sum += pps->column_width[i];
  1124. }
  1125. if (sum >= sps->ctb_width) {
  1126. av_log(avctx, AV_LOG_ERROR, "Invalid tile widths.\n");
  1127. ret = AVERROR_INVALIDDATA;
  1128. goto err;
  1129. }
  1130. pps->column_width[pps->num_tile_columns - 1] = sps->ctb_width - sum;
  1131. sum = 0;
  1132. for (i = 0; i < pps->num_tile_rows - 1; i++) {
  1133. pps->row_height[i] = get_ue_golomb_long(gb) + 1;
  1134. sum += pps->row_height[i];
  1135. }
  1136. if (sum >= sps->ctb_height) {
  1137. av_log(avctx, AV_LOG_ERROR, "Invalid tile heights.\n");
  1138. ret = AVERROR_INVALIDDATA;
  1139. goto err;
  1140. }
  1141. pps->row_height[pps->num_tile_rows - 1] = sps->ctb_height - sum;
  1142. }
  1143. pps->loop_filter_across_tiles_enabled_flag = get_bits1(gb);
  1144. }
  1145. pps->seq_loop_filter_across_slices_enabled_flag = get_bits1(gb);
  1146. pps->deblocking_filter_control_present_flag = get_bits1(gb);
  1147. if (pps->deblocking_filter_control_present_flag) {
  1148. pps->deblocking_filter_override_enabled_flag = get_bits1(gb);
  1149. pps->disable_dbf = get_bits1(gb);
  1150. if (!pps->disable_dbf) {
  1151. pps->beta_offset = get_se_golomb(gb) * 2;
  1152. pps->tc_offset = get_se_golomb(gb) * 2;
  1153. if (pps->beta_offset/2 < -6 || pps->beta_offset/2 > 6) {
  1154. av_log(avctx, AV_LOG_ERROR, "pps_beta_offset_div2 out of range: %d\n",
  1155. pps->beta_offset/2);
  1156. ret = AVERROR_INVALIDDATA;
  1157. goto err;
  1158. }
  1159. if (pps->tc_offset/2 < -6 || pps->tc_offset/2 > 6) {
  1160. av_log(avctx, AV_LOG_ERROR, "pps_tc_offset_div2 out of range: %d\n",
  1161. pps->tc_offset/2);
  1162. ret = AVERROR_INVALIDDATA;
  1163. goto err;
  1164. }
  1165. }
  1166. }
  1167. pps->scaling_list_data_present_flag = get_bits1(gb);
  1168. if (pps->scaling_list_data_present_flag) {
  1169. set_default_scaling_list_data(&pps->scaling_list);
  1170. ret = scaling_list_data(gb, avctx, &pps->scaling_list);
  1171. if (ret < 0)
  1172. goto err;
  1173. }
  1174. pps->lists_modification_present_flag = get_bits1(gb);
  1175. pps->log2_parallel_merge_level = get_ue_golomb_long(gb) + 2;
  1176. if (pps->log2_parallel_merge_level > sps->log2_ctb_size) {
  1177. av_log(avctx, AV_LOG_ERROR, "log2_parallel_merge_level_minus2 out of range: %d\n",
  1178. pps->log2_parallel_merge_level - 2);
  1179. ret = AVERROR_INVALIDDATA;
  1180. goto err;
  1181. }
  1182. pps->slice_header_extension_present_flag = get_bits1(gb);
  1183. skip_bits1(gb); // pps_extension_flag
  1184. ret = setup_pps(avctx, gb, pps, sps);
  1185. if (ret < 0)
  1186. goto err;
  1187. remove_pps(ps, pps_id);
  1188. ps->pps_list[pps_id] = pps_buf;
  1189. return 0;
  1190. err:
  1191. av_buffer_unref(&pps_buf);
  1192. return ret;
  1193. }