You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

529 lines
19KB

  1. /*
  2. * H.26L/H.264/AVC/JVT/14496-10/... sei decoding
  3. * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. /**
  22. * @file
  23. * H.264 / AVC / MPEG4 part10 sei decoding.
  24. * @author Michael Niedermayer <michaelni@gmx.at>
  25. */
  26. #include "avcodec.h"
  27. #include "golomb.h"
  28. #include "h264.h"
  29. #include "internal.h"
  /*
   * Number of clock timestamp entries carried by a picture timing SEI,
   * indexed by the 4-bit pic_struct value (0..8). Entry labels follow the
   * pic_struct semantics of H.264 Table D-1.
   */
  static const uint8_t sei_num_clock_ts_table[9] = {
      1, /* 0: frame */
      1, /* 1: top field */
      1, /* 2: bottom field */
      2, /* 3: top field, bottom field */
      2, /* 4: bottom field, top field */
      3, /* 5: top, bottom, top repeated */
      3, /* 6: bottom, top, bottom repeated */
      2, /* 7: frame doubling */
      3, /* 8: frame tripling */
  };
  33. void ff_h264_reset_sei(H264Context *h)
  34. {
  35. h->sei_recovery_frame_cnt = -1;
  36. h->sei_dpb_output_delay = 0;
  37. h->sei_cpb_removal_delay = -1;
  38. h->sei_buffering_period_present = 0;
  39. h->sei_frame_packing_present = 0;
  40. h->sei_display_orientation_present = 0;
  41. h->sei_reguserdata_afd_present = 0;
  42. h->a53_caption_size = 0;
  43. av_freep(&h->a53_caption);
  44. }
  45. static int decode_picture_timing(H264Context *h)
  46. {
  47. SPS *sps = &h->sps;
  48. int i;
  49. for (i = 0; i<MAX_SPS_COUNT; i++)
  50. if (!sps->log2_max_frame_num && h->sps_buffers[i])
  51. sps = h->sps_buffers[i];
  52. if (sps->nal_hrd_parameters_present_flag || sps->vcl_hrd_parameters_present_flag) {
  53. h->sei_cpb_removal_delay = get_bits_long(&h->gb,
  54. sps->cpb_removal_delay_length);
  55. h->sei_dpb_output_delay = get_bits_long(&h->gb,
  56. sps->dpb_output_delay_length);
  57. }
  58. if (sps->pic_struct_present_flag) {
  59. unsigned int i, num_clock_ts;
  60. h->sei_pic_struct = get_bits(&h->gb, 4);
  61. h->sei_ct_type = 0;
  62. if (h->sei_pic_struct > SEI_PIC_STRUCT_FRAME_TRIPLING)
  63. return AVERROR_INVALIDDATA;
  64. num_clock_ts = sei_num_clock_ts_table[h->sei_pic_struct];
  65. for (i = 0; i < num_clock_ts; i++) {
  66. if (get_bits(&h->gb, 1)) { /* clock_timestamp_flag */
  67. unsigned int full_timestamp_flag;
  68. h->sei_ct_type |= 1 << get_bits(&h->gb, 2);
  69. skip_bits(&h->gb, 1); /* nuit_field_based_flag */
  70. skip_bits(&h->gb, 5); /* counting_type */
  71. full_timestamp_flag = get_bits(&h->gb, 1);
  72. skip_bits(&h->gb, 1); /* discontinuity_flag */
  73. skip_bits(&h->gb, 1); /* cnt_dropped_flag */
  74. skip_bits(&h->gb, 8); /* n_frames */
  75. if (full_timestamp_flag) {
  76. skip_bits(&h->gb, 6); /* seconds_value 0..59 */
  77. skip_bits(&h->gb, 6); /* minutes_value 0..59 */
  78. skip_bits(&h->gb, 5); /* hours_value 0..23 */
  79. } else {
  80. if (get_bits(&h->gb, 1)) { /* seconds_flag */
  81. skip_bits(&h->gb, 6); /* seconds_value range 0..59 */
  82. if (get_bits(&h->gb, 1)) { /* minutes_flag */
  83. skip_bits(&h->gb, 6); /* minutes_value 0..59 */
  84. if (get_bits(&h->gb, 1)) /* hours_flag */
  85. skip_bits(&h->gb, 5); /* hours_value 0..23 */
  86. }
  87. }
  88. }
  89. if (sps->time_offset_length > 0)
  90. skip_bits(&h->gb,
  91. sps->time_offset_length); /* time_offset */
  92. }
  93. }
  94. if (h->avctx->debug & FF_DEBUG_PICT_INFO)
  95. av_log(h->avctx, AV_LOG_DEBUG, "ct_type:%X pic_struct:%d\n",
  96. h->sei_ct_type, h->sei_pic_struct);
  97. }
  98. return 0;
  99. }
  100. static int decode_registered_user_data_afd(H264Context *h, int size)
  101. {
  102. int flag;
  103. if (size-- < 1)
  104. return AVERROR_INVALIDDATA;
  105. skip_bits(&h->gb, 1); // 0
  106. flag = get_bits(&h->gb, 1); // active_format_flag
  107. skip_bits(&h->gb, 6); // reserved
  108. if (flag) {
  109. if (size-- < 1)
  110. return AVERROR_INVALIDDATA;
  111. skip_bits(&h->gb, 4); // reserved
  112. h->active_format_description = get_bits(&h->gb, 4);
  113. h->sei_reguserdata_afd_present = 1;
  114. #if FF_API_AFD
  115. FF_DISABLE_DEPRECATION_WARNINGS
  116. h->avctx->dtg_active_format = h->active_format_description;
  117. FF_ENABLE_DEPRECATION_WARNINGS
  118. #endif /* FF_API_AFD */
  119. }
  120. return 0;
  121. }
  122. static int decode_registered_user_data_closed_caption(H264Context *h, int size)
  123. {
  124. int flag;
  125. int user_data_type_code;
  126. int cc_count;
  127. if (size < 3)
  128. return AVERROR(EINVAL);
  129. user_data_type_code = get_bits(&h->gb, 8);
  130. if (user_data_type_code == 0x3) {
  131. skip_bits(&h->gb, 1); // reserved
  132. flag = get_bits(&h->gb, 1); // process_cc_data_flag
  133. if (flag) {
  134. skip_bits(&h->gb, 1); // zero bit
  135. cc_count = get_bits(&h->gb, 5);
  136. skip_bits(&h->gb, 8); // reserved
  137. size -= 2;
  138. if (cc_count && size >= cc_count * 3) {
  139. const uint64_t new_size = (h->a53_caption_size + cc_count
  140. * UINT64_C(3));
  141. int i, ret;
  142. if (new_size > INT_MAX)
  143. return AVERROR(EINVAL);
  144. /* Allow merging of the cc data from two fields. */
  145. ret = av_reallocp(&h->a53_caption, new_size);
  146. if (ret < 0)
  147. return ret;
  148. for (i = 0; i < cc_count; i++) {
  149. h->a53_caption[h->a53_caption_size++] = get_bits(&h->gb, 8);
  150. h->a53_caption[h->a53_caption_size++] = get_bits(&h->gb, 8);
  151. h->a53_caption[h->a53_caption_size++] = get_bits(&h->gb, 8);
  152. }
  153. skip_bits(&h->gb, 8); // marker_bits
  154. }
  155. }
  156. }
  157. return 0;
  158. }
  159. static int decode_registered_user_data(H264Context *h, int size)
  160. {
  161. uint32_t country_code;
  162. uint32_t user_identifier;
  163. if (size < 7)
  164. return AVERROR_INVALIDDATA;
  165. size -= 7;
  166. country_code = get_bits(&h->gb, 8); // itu_t_t35_country_code
  167. if (country_code == 0xFF) {
  168. skip_bits(&h->gb, 8); // itu_t_t35_country_code_extension_byte
  169. size--;
  170. }
  171. /* itu_t_t35_payload_byte follows */
  172. skip_bits(&h->gb, 8); // terminal provider code
  173. skip_bits(&h->gb, 8); // terminal provider oriented code
  174. user_identifier = get_bits_long(&h->gb, 32);
  175. switch (user_identifier) {
  176. case MKBETAG('D', 'T', 'G', '1'): // afd_data
  177. return decode_registered_user_data_afd(h, size);
  178. case MKBETAG('G', 'A', '9', '4'): // closed captions
  179. return decode_registered_user_data_closed_caption(h, size);
  180. default:
  181. skip_bits(&h->gb, size * 8);
  182. break;
  183. }
  184. return 0;
  185. }
  186. static int decode_unregistered_user_data(H264Context *h, int size)
  187. {
  188. uint8_t user_data[16 + 256];
  189. int e, build, i;
  190. if (size < 16)
  191. return AVERROR_INVALIDDATA;
  192. for (i = 0; i < sizeof(user_data) - 1 && i < size; i++)
  193. user_data[i] = get_bits(&h->gb, 8);
  194. user_data[i] = 0;
  195. e = sscanf(user_data + 16, "x264 - core %d", &build);
  196. if (e == 1 && build > 0)
  197. h->x264_build = build;
  198. if (e == 1 && build == 1 && !strncmp(user_data+16, "x264 - core 0000", 16))
  199. h->x264_build = 67;
  200. if (h->avctx->debug & FF_DEBUG_BUGS)
  201. av_log(h->avctx, AV_LOG_DEBUG, "user data:\"%s\"\n", user_data + 16);
  202. for (; i < size; i++)
  203. skip_bits(&h->gb, 8);
  204. return 0;
  205. }
  206. static int decode_recovery_point(H264Context *h)
  207. {
  208. h->sei_recovery_frame_cnt = get_ue_golomb(&h->gb);
  209. /* 1b exact_match_flag,
  210. * 1b broken_link_flag,
  211. * 2b changing_slice_group_idc */
  212. skip_bits(&h->gb, 4);
  213. if (h->avctx->debug & FF_DEBUG_PICT_INFO)
  214. av_log(h->avctx, AV_LOG_DEBUG, "sei_recovery_frame_cnt: %d\n", h->sei_recovery_frame_cnt);
  215. h->has_recovery_point = 1;
  216. return 0;
  217. }
  218. static int decode_buffering_period(H264Context *h)
  219. {
  220. unsigned int sps_id;
  221. int sched_sel_idx;
  222. SPS *sps;
  223. sps_id = get_ue_golomb_31(&h->gb);
  224. if (sps_id > 31 || !h->sps_buffers[sps_id]) {
  225. av_log(h->avctx, AV_LOG_ERROR,
  226. "non-existing SPS %d referenced in buffering period\n", sps_id);
  227. return AVERROR_INVALIDDATA;
  228. }
  229. sps = h->sps_buffers[sps_id];
  230. // NOTE: This is really so duplicated in the standard... See H.264, D.1.1
  231. if (sps->nal_hrd_parameters_present_flag) {
  232. for (sched_sel_idx = 0; sched_sel_idx < sps->cpb_cnt; sched_sel_idx++) {
  233. h->initial_cpb_removal_delay[sched_sel_idx] =
  234. get_bits_long(&h->gb, sps->initial_cpb_removal_delay_length);
  235. // initial_cpb_removal_delay_offset
  236. skip_bits(&h->gb, sps->initial_cpb_removal_delay_length);
  237. }
  238. }
  239. if (sps->vcl_hrd_parameters_present_flag) {
  240. for (sched_sel_idx = 0; sched_sel_idx < sps->cpb_cnt; sched_sel_idx++) {
  241. h->initial_cpb_removal_delay[sched_sel_idx] =
  242. get_bits_long(&h->gb, sps->initial_cpb_removal_delay_length);
  243. // initial_cpb_removal_delay_offset
  244. skip_bits(&h->gb, sps->initial_cpb_removal_delay_length);
  245. }
  246. }
  247. h->sei_buffering_period_present = 1;
  248. return 0;
  249. }
  250. static int decode_frame_packing_arrangement(H264Context *h)
  251. {
  252. h->sei_fpa.frame_packing_arrangement_id = get_ue_golomb(&h->gb);
  253. h->sei_fpa.frame_packing_arrangement_cancel_flag = get_bits1(&h->gb);
  254. h->sei_frame_packing_present = !h->sei_fpa.frame_packing_arrangement_cancel_flag;
  255. if (h->sei_frame_packing_present) {
  256. h->sei_fpa.frame_packing_arrangement_type =
  257. h->frame_packing_arrangement_type = get_bits(&h->gb, 7);
  258. h->sei_fpa.quincunx_sampling_flag =
  259. h->quincunx_subsampling = get_bits1(&h->gb);
  260. h->sei_fpa.content_interpretation_type =
  261. h->content_interpretation_type = get_bits(&h->gb, 6);
  262. // the following skips: spatial_flipping_flag, frame0_flipped_flag,
  263. // field_views_flag, current_frame_is_frame0_flag,
  264. // frame0_self_contained_flag, frame1_self_contained_flag
  265. skip_bits(&h->gb, 6);
  266. if (!h->quincunx_subsampling && h->frame_packing_arrangement_type != 5)
  267. skip_bits(&h->gb, 16); // frame[01]_grid_position_[xy]
  268. skip_bits(&h->gb, 8); // frame_packing_arrangement_reserved_byte
  269. h->sei_fpa.frame_packing_arrangement_repetition_period = get_ue_golomb(&h->gb) /* frame_packing_arrangement_repetition_period */;
  270. }
  271. skip_bits1(&h->gb); // frame_packing_arrangement_extension_flag
  272. if (h->avctx->debug & FF_DEBUG_PICT_INFO)
  273. av_log(h->avctx, AV_LOG_DEBUG, "SEI FPA %d %d %d %d %d %d\n",
  274. h->sei_fpa.frame_packing_arrangement_id,
  275. h->sei_fpa.frame_packing_arrangement_cancel_flag,
  276. h->sei_fpa.frame_packing_arrangement_type,
  277. h->sei_fpa.quincunx_sampling_flag,
  278. h->sei_fpa.content_interpretation_type,
  279. h->sei_fpa.frame_packing_arrangement_repetition_period);
  280. return 0;
  281. }
  282. static int decode_display_orientation(H264Context *h)
  283. {
  284. h->sei_display_orientation_present = !get_bits1(&h->gb);
  285. if (h->sei_display_orientation_present) {
  286. h->sei_hflip = get_bits1(&h->gb); // hor_flip
  287. h->sei_vflip = get_bits1(&h->gb); // ver_flip
  288. h->sei_anticlockwise_rotation = get_bits(&h->gb, 16);
  289. get_ue_golomb(&h->gb); // display_orientation_repetition_period
  290. skip_bits1(&h->gb); // display_orientation_extension_flag
  291. }
  292. return 0;
  293. }
  294. static int decode_GreenMetadata(H264Context *h)
  295. {
  296. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  297. av_log(h->avctx, AV_LOG_DEBUG, "Green Metadata Info SEI message\n");
  298. h->sei_green_metadata.green_metadata_type=get_bits(&h->gb, 8);
  299. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  300. av_log(h->avctx, AV_LOG_DEBUG, "green_metadata_type = %d\n",
  301. h->sei_green_metadata.green_metadata_type);
  302. if (h->sei_green_metadata.green_metadata_type==0){
  303. h->sei_green_metadata.period_type=get_bits(&h->gb, 8);
  304. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  305. av_log(h->avctx, AV_LOG_DEBUG, "green_metadata_period_type = %d\n",
  306. h->sei_green_metadata.period_type);
  307. if (h->sei_green_metadata.green_metadata_type==2){
  308. h->sei_green_metadata.num_seconds = get_bits(&h->gb, 16);
  309. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  310. av_log(h->avctx, AV_LOG_DEBUG, "green_metadata_num_seconds = %d\n",
  311. h->sei_green_metadata.num_seconds);
  312. }
  313. else if (h->sei_green_metadata.period_type==3){
  314. h->sei_green_metadata.num_pictures = get_bits(&h->gb, 16);
  315. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  316. av_log(h->avctx, AV_LOG_DEBUG, "green_metadata_num_pictures = %d\n",
  317. h->sei_green_metadata.num_pictures);
  318. }
  319. h->sei_green_metadata.percent_non_zero_macroblocks=get_bits(&h->gb, 8);
  320. h->sei_green_metadata.percent_intra_coded_macroblocks=get_bits(&h->gb, 8);
  321. h->sei_green_metadata.percent_six_tap_filtering=get_bits(&h->gb, 8);
  322. h->sei_green_metadata.percent_alpha_point_deblocking_instance=get_bits(&h->gb, 8);
  323. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  324. av_log(h->avctx, AV_LOG_DEBUG, "SEI GREEN Complexity Metrics = %f %f %f %f\n",
  325. (float)h->sei_green_metadata.percent_non_zero_macroblocks/255,
  326. (float)h->sei_green_metadata.percent_intra_coded_macroblocks/255,
  327. (float)h->sei_green_metadata.percent_six_tap_filtering/255,
  328. (float)h->sei_green_metadata.percent_alpha_point_deblocking_instance/255);
  329. }else if( h->sei_green_metadata.green_metadata_type==1){
  330. h->sei_green_metadata.xsd_metric_type=get_bits(&h->gb, 8);
  331. h->sei_green_metadata.xsd_metric_value=get_bits(&h->gb, 16);
  332. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  333. av_log(h->avctx, AV_LOG_DEBUG, "xsd_metric_type = %d\n",
  334. h->sei_green_metadata.xsd_metric_type);
  335. if ( h->sei_green_metadata.xsd_metric_type==0){
  336. if (h->avctx->debug & FF_DEBUG_GREEN_MD)
  337. av_log(h->avctx, AV_LOG_DEBUG, "xsd_metric_value = %f\n",
  338. (float)h->sei_green_metadata.xsd_metric_value/100);
  339. }
  340. }
  341. return 0;
  342. }
  343. int ff_h264_decode_sei(H264Context *h)
  344. {
  345. while (get_bits_left(&h->gb) > 16 && show_bits(&h->gb, 16)) {
  346. int type = 0;
  347. unsigned size = 0;
  348. unsigned next;
  349. int ret = 0;
  350. do {
  351. if (get_bits_left(&h->gb) < 8)
  352. return AVERROR_INVALIDDATA;
  353. type += show_bits(&h->gb, 8);
  354. } while (get_bits(&h->gb, 8) == 255);
  355. do {
  356. if (get_bits_left(&h->gb) < 8)
  357. return AVERROR_INVALIDDATA;
  358. size += show_bits(&h->gb, 8);
  359. } while (get_bits(&h->gb, 8) == 255);
  360. if (h->avctx->debug&FF_DEBUG_STARTCODE)
  361. av_log(h->avctx, AV_LOG_DEBUG, "SEI %d len:%d\n", type, size);
  362. if (size > get_bits_left(&h->gb) / 8) {
  363. av_log(h->avctx, AV_LOG_ERROR, "SEI type %d size %d truncated at %d\n",
  364. type, 8*size, get_bits_left(&h->gb));
  365. return AVERROR_INVALIDDATA;
  366. }
  367. next = get_bits_count(&h->gb) + 8 * size;
  368. switch (type) {
  369. case SEI_TYPE_PIC_TIMING: // Picture timing SEI
  370. ret = decode_picture_timing(h);
  371. break;
  372. case SEI_TYPE_USER_DATA_REGISTERED:
  373. ret = decode_registered_user_data(h, size);
  374. break;
  375. case SEI_TYPE_USER_DATA_UNREGISTERED:
  376. ret = decode_unregistered_user_data(h, size);
  377. break;
  378. case SEI_TYPE_RECOVERY_POINT:
  379. ret = decode_recovery_point(h);
  380. break;
  381. case SEI_TYPE_BUFFERING_PERIOD:
  382. ret = decode_buffering_period(h);
  383. break;
  384. case SEI_TYPE_FRAME_PACKING:
  385. ret = decode_frame_packing_arrangement(h);
  386. break;
  387. case SEI_TYPE_DISPLAY_ORIENTATION:
  388. ret = decode_display_orientation(h);
  389. break;
  390. case SEI_TYPE_GREEN_METADATA:
  391. ret = decode_GreenMetadata(h);
  392. break;
  393. default:
  394. av_log(h->avctx, AV_LOG_DEBUG, "unknown SEI type %d\n", type);
  395. }
  396. if (ret < 0)
  397. return ret;
  398. skip_bits_long(&h->gb, next - get_bits_count(&h->gb));
  399. // FIXME check bits here
  400. align_get_bits(&h->gb);
  401. }
  402. return 0;
  403. }
  404. const char* ff_h264_sei_stereo_mode(H264Context *h)
  405. {
  406. if (h->sei_fpa.frame_packing_arrangement_cancel_flag == 0) {
  407. switch (h->sei_fpa.frame_packing_arrangement_type) {
  408. case SEI_FPA_TYPE_CHECKERBOARD:
  409. if (h->sei_fpa.content_interpretation_type == 2)
  410. return "checkerboard_rl";
  411. else
  412. return "checkerboard_lr";
  413. case SEI_FPA_TYPE_INTERLEAVE_COLUMN:
  414. if (h->sei_fpa.content_interpretation_type == 2)
  415. return "col_interleaved_rl";
  416. else
  417. return "col_interleaved_lr";
  418. case SEI_FPA_TYPE_INTERLEAVE_ROW:
  419. if (h->sei_fpa.content_interpretation_type == 2)
  420. return "row_interleaved_rl";
  421. else
  422. return "row_interleaved_lr";
  423. case SEI_FPA_TYPE_SIDE_BY_SIDE:
  424. if (h->sei_fpa.content_interpretation_type == 2)
  425. return "right_left";
  426. else
  427. return "left_right";
  428. case SEI_FPA_TYPE_TOP_BOTTOM:
  429. if (h->sei_fpa.content_interpretation_type == 2)
  430. return "bottom_top";
  431. else
  432. return "top_bottom";
  433. case SEI_FPA_TYPE_INTERLEAVE_TEMPORAL:
  434. if (h->sei_fpa.content_interpretation_type == 2)
  435. return "block_rl";
  436. else
  437. return "block_lr";
  438. case SEI_FPA_TYPE_2D:
  439. default:
  440. return "mono";
  441. }
  442. } else if (h->sei_fpa.frame_packing_arrangement_cancel_flag == 1) {
  443. return "mono";
  444. } else {
  445. return NULL;
  446. }
  447. }