You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

488 lines
17KB

  1. /*
  2. * This file is part of Libav.
  3. *
  4. * Libav is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU Lesser General Public
  6. * License as published by the Free Software Foundation; either
  7. * version 2.1 of the License, or (at your option) any later version.
  8. *
  9. * Libav is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * Lesser General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU Lesser General Public
  15. * License along with Libav; if not, write to the Free Software
  16. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  17. */
  18. #include "bytestream.h"
  19. #include "get_bits.h"
  20. #include "golomb.h"
  21. #include "h264.h"
  22. #include "h264dec.h"
  23. #include "h264_parse.h"
  24. int ff_h264_pred_weight_table(GetBitContext *gb, const SPS *sps,
  25. const int *ref_count, int slice_type_nos,
  26. H264PredWeightTable *pwt)
  27. {
  28. int list, i, j;
  29. int luma_def, chroma_def;
  30. pwt->use_weight = 0;
  31. pwt->use_weight_chroma = 0;
  32. pwt->luma_log2_weight_denom = get_ue_golomb(gb);
  33. if (sps->chroma_format_idc)
  34. pwt->chroma_log2_weight_denom = get_ue_golomb(gb);
  35. luma_def = 1 << pwt->luma_log2_weight_denom;
  36. chroma_def = 1 << pwt->chroma_log2_weight_denom;
  37. for (list = 0; list < 2; list++) {
  38. pwt->luma_weight_flag[list] = 0;
  39. pwt->chroma_weight_flag[list] = 0;
  40. for (i = 0; i < ref_count[list]; i++) {
  41. int luma_weight_flag, chroma_weight_flag;
  42. luma_weight_flag = get_bits1(gb);
  43. if (luma_weight_flag) {
  44. pwt->luma_weight[i][list][0] = get_se_golomb(gb);
  45. pwt->luma_weight[i][list][1] = get_se_golomb(gb);
  46. if (pwt->luma_weight[i][list][0] != luma_def ||
  47. pwt->luma_weight[i][list][1] != 0) {
  48. pwt->use_weight = 1;
  49. pwt->luma_weight_flag[list] = 1;
  50. }
  51. } else {
  52. pwt->luma_weight[i][list][0] = luma_def;
  53. pwt->luma_weight[i][list][1] = 0;
  54. }
  55. if (sps->chroma_format_idc) {
  56. chroma_weight_flag = get_bits1(gb);
  57. if (chroma_weight_flag) {
  58. int j;
  59. for (j = 0; j < 2; j++) {
  60. pwt->chroma_weight[i][list][j][0] = get_se_golomb(gb);
  61. pwt->chroma_weight[i][list][j][1] = get_se_golomb(gb);
  62. if (pwt->chroma_weight[i][list][j][0] != chroma_def ||
  63. pwt->chroma_weight[i][list][j][1] != 0) {
  64. pwt->use_weight_chroma = 1;
  65. pwt->chroma_weight_flag[list] = 1;
  66. }
  67. }
  68. } else {
  69. int j;
  70. for (j = 0; j < 2; j++) {
  71. pwt->chroma_weight[i][list][j][0] = chroma_def;
  72. pwt->chroma_weight[i][list][j][1] = 0;
  73. }
  74. }
  75. }
  76. // for MBAFF
  77. pwt->luma_weight[16 + 2 * i][list][0] = pwt->luma_weight[16 + 2 * i + 1][list][0] = pwt->luma_weight[i][list][0];
  78. pwt->luma_weight[16 + 2 * i][list][1] = pwt->luma_weight[16 + 2 * i + 1][list][1] = pwt->luma_weight[i][list][1];
  79. for (j = 0; j < 2; j++) {
  80. pwt->chroma_weight[16 + 2 * i][list][j][0] = pwt->chroma_weight[16 + 2 * i + 1][list][j][0] = pwt->chroma_weight[i][list][j][0];
  81. pwt->chroma_weight[16 + 2 * i][list][j][1] = pwt->chroma_weight[16 + 2 * i + 1][list][j][1] = pwt->chroma_weight[i][list][j][1];
  82. }
  83. }
  84. if (slice_type_nos != AV_PICTURE_TYPE_B)
  85. break;
  86. }
  87. pwt->use_weight = pwt->use_weight || pwt->use_weight_chroma;
  88. return 0;
  89. }
  90. /**
  91. * Check if the top & left blocks are available if needed and
  92. * change the dc mode so it only uses the available blocks.
  93. */
  94. int ff_h264_check_intra4x4_pred_mode(int8_t *pred_mode_cache, void *logctx,
  95. int top_samples_available, int left_samples_available)
  96. {
  97. static const int8_t top[12] = {
  98. -1, 0, LEFT_DC_PRED, -1, -1, -1, -1, -1, 0
  99. };
  100. static const int8_t left[12] = {
  101. 0, -1, TOP_DC_PRED, 0, -1, -1, -1, 0, -1, DC_128_PRED
  102. };
  103. int i;
  104. if (!(top_samples_available & 0x8000)) {
  105. for (i = 0; i < 4; i++) {
  106. int status = top[pred_mode_cache[scan8[0] + i]];
  107. if (status < 0) {
  108. av_log(logctx, AV_LOG_ERROR,
  109. "top block unavailable for requested intra4x4 mode %d\n",
  110. status);
  111. return AVERROR_INVALIDDATA;
  112. } else if (status) {
  113. pred_mode_cache[scan8[0] + i] = status;
  114. }
  115. }
  116. }
  117. if ((left_samples_available & 0x8888) != 0x8888) {
  118. static const int mask[4] = { 0x8000, 0x2000, 0x80, 0x20 };
  119. for (i = 0; i < 4; i++)
  120. if (!(left_samples_available & mask[i])) {
  121. int status = left[pred_mode_cache[scan8[0] + 8 * i]];
  122. if (status < 0) {
  123. av_log(logctx, AV_LOG_ERROR,
  124. "left block unavailable for requested intra4x4 mode %d\n",
  125. status);
  126. return AVERROR_INVALIDDATA;
  127. } else if (status) {
  128. pred_mode_cache[scan8[0] + 8 * i] = status;
  129. }
  130. }
  131. }
  132. return 0;
  133. }
  134. /**
  135. * Check if the top & left blocks are available if needed and
  136. * change the dc mode so it only uses the available blocks.
  137. */
  138. int ff_h264_check_intra_pred_mode(void *logctx, int top_samples_available,
  139. int left_samples_available,
  140. int mode, int is_chroma)
  141. {
  142. static const int8_t top[4] = { LEFT_DC_PRED8x8, 1, -1, -1 };
  143. static const int8_t left[5] = { TOP_DC_PRED8x8, -1, 2, -1, DC_128_PRED8x8 };
  144. if (mode > 3U) {
  145. av_log(logctx, AV_LOG_ERROR,
  146. "out of range intra chroma pred mode\n");
  147. return AVERROR_INVALIDDATA;
  148. }
  149. if (!(top_samples_available & 0x8000)) {
  150. mode = top[mode];
  151. if (mode < 0) {
  152. av_log(logctx, AV_LOG_ERROR,
  153. "top block unavailable for requested intra mode\n");
  154. return AVERROR_INVALIDDATA;
  155. }
  156. }
  157. if ((left_samples_available & 0x8080) != 0x8080) {
  158. mode = left[mode];
  159. if (is_chroma && (left_samples_available & 0x8080)) {
  160. // mad cow disease mode, aka MBAFF + constrained_intra_pred
  161. mode = ALZHEIMER_DC_L0T_PRED8x8 +
  162. (!(left_samples_available & 0x8000)) +
  163. 2 * (mode == DC_128_PRED8x8);
  164. }
  165. if (mode < 0) {
  166. av_log(logctx, AV_LOG_ERROR,
  167. "left block unavailable for requested intra mode\n");
  168. return AVERROR_INVALIDDATA;
  169. }
  170. }
  171. return mode;
  172. }
  173. int ff_h264_parse_ref_count(int *plist_count, int ref_count[2],
  174. GetBitContext *gb, const PPS *pps,
  175. int slice_type_nos, int picture_structure)
  176. {
  177. int list_count;
  178. int num_ref_idx_active_override_flag, max_refs;
  179. // set defaults, might be overridden a few lines later
  180. ref_count[0] = pps->ref_count[0];
  181. ref_count[1] = pps->ref_count[1];
  182. if (slice_type_nos != AV_PICTURE_TYPE_I) {
  183. num_ref_idx_active_override_flag = get_bits1(gb);
  184. if (num_ref_idx_active_override_flag) {
  185. ref_count[0] = get_ue_golomb(gb) + 1;
  186. if (ref_count[0] < 1)
  187. goto fail;
  188. if (slice_type_nos == AV_PICTURE_TYPE_B) {
  189. ref_count[1] = get_ue_golomb(gb) + 1;
  190. if (ref_count[1] < 1)
  191. goto fail;
  192. }
  193. }
  194. if (slice_type_nos == AV_PICTURE_TYPE_B)
  195. list_count = 2;
  196. else
  197. list_count = 1;
  198. } else {
  199. list_count = 0;
  200. ref_count[0] = ref_count[1] = 0;
  201. }
  202. max_refs = picture_structure == PICT_FRAME ? 16 : 32;
  203. if (ref_count[0] > max_refs || ref_count[1] > max_refs)
  204. goto fail;
  205. *plist_count = list_count;
  206. return 0;
  207. fail:
  208. *plist_count = 0;
  209. ref_count[0] = 0;
  210. ref_count[1] = 0;
  211. return AVERROR_INVALIDDATA;
  212. }
  213. int ff_h264_init_poc(int pic_field_poc[2], int *pic_poc,
  214. const SPS *sps, H264POCContext *pc,
  215. int picture_structure, int nal_ref_idc)
  216. {
  217. const int max_frame_num = 1 << sps->log2_max_frame_num;
  218. int field_poc[2];
  219. pc->frame_num_offset = pc->prev_frame_num_offset;
  220. if (pc->frame_num < pc->prev_frame_num)
  221. pc->frame_num_offset += max_frame_num;
  222. if (sps->poc_type == 0) {
  223. const int max_poc_lsb = 1 << sps->log2_max_poc_lsb;
  224. if (pc->poc_lsb < pc->prev_poc_lsb &&
  225. pc->prev_poc_lsb - pc->poc_lsb >= max_poc_lsb / 2)
  226. pc->poc_msb = pc->prev_poc_msb + max_poc_lsb;
  227. else if (pc->poc_lsb > pc->prev_poc_lsb &&
  228. pc->prev_poc_lsb - pc->poc_lsb < -max_poc_lsb / 2)
  229. pc->poc_msb = pc->prev_poc_msb - max_poc_lsb;
  230. else
  231. pc->poc_msb = pc->prev_poc_msb;
  232. field_poc[0] =
  233. field_poc[1] = pc->poc_msb + pc->poc_lsb;
  234. if (picture_structure == PICT_FRAME)
  235. field_poc[1] += pc->delta_poc_bottom;
  236. } else if (sps->poc_type == 1) {
  237. int abs_frame_num, expected_delta_per_poc_cycle, expectedpoc;
  238. int i;
  239. if (sps->poc_cycle_length != 0)
  240. abs_frame_num = pc->frame_num_offset + pc->frame_num;
  241. else
  242. abs_frame_num = 0;
  243. if (nal_ref_idc == 0 && abs_frame_num > 0)
  244. abs_frame_num--;
  245. expected_delta_per_poc_cycle = 0;
  246. for (i = 0; i < sps->poc_cycle_length; i++)
  247. // FIXME integrate during sps parse
  248. expected_delta_per_poc_cycle += sps->offset_for_ref_frame[i];
  249. if (abs_frame_num > 0) {
  250. int poc_cycle_cnt = (abs_frame_num - 1) / sps->poc_cycle_length;
  251. int frame_num_in_poc_cycle = (abs_frame_num - 1) % sps->poc_cycle_length;
  252. expectedpoc = poc_cycle_cnt * expected_delta_per_poc_cycle;
  253. for (i = 0; i <= frame_num_in_poc_cycle; i++)
  254. expectedpoc = expectedpoc + sps->offset_for_ref_frame[i];
  255. } else
  256. expectedpoc = 0;
  257. if (nal_ref_idc == 0)
  258. expectedpoc = expectedpoc + sps->offset_for_non_ref_pic;
  259. field_poc[0] = expectedpoc + pc->delta_poc[0];
  260. field_poc[1] = field_poc[0] + sps->offset_for_top_to_bottom_field;
  261. if (picture_structure == PICT_FRAME)
  262. field_poc[1] += pc->delta_poc[1];
  263. } else {
  264. int poc = 2 * (pc->frame_num_offset + pc->frame_num);
  265. if (!nal_ref_idc)
  266. poc--;
  267. field_poc[0] = poc;
  268. field_poc[1] = poc;
  269. }
  270. if (picture_structure != PICT_BOTTOM_FIELD)
  271. pic_field_poc[0] = field_poc[0];
  272. if (picture_structure != PICT_TOP_FIELD)
  273. pic_field_poc[1] = field_poc[1];
  274. *pic_poc = FFMIN(pic_field_poc[0], pic_field_poc[1]);
  275. return 0;
  276. }
  277. static int decode_extradata_ps(const uint8_t *data, int size, H264ParamSets *ps,
  278. int is_avc, void *logctx)
  279. {
  280. H2645Packet pkt = { 0 };
  281. int i, ret = 0;
  282. ret = ff_h2645_packet_split(&pkt, data, size, logctx, is_avc, 2, AV_CODEC_ID_H264);
  283. if (ret < 0)
  284. goto fail;
  285. for (i = 0; i < pkt.nb_nals; i++) {
  286. H2645NAL *nal = &pkt.nals[i];
  287. switch (nal->type) {
  288. case NAL_SPS:
  289. ret = ff_h264_decode_seq_parameter_set(&nal->gb, logctx, ps);
  290. if (ret < 0)
  291. goto fail;
  292. break;
  293. case NAL_PPS:
  294. ret = ff_h264_decode_picture_parameter_set(&nal->gb, logctx, ps,
  295. nal->size_bits);
  296. if (ret < 0)
  297. goto fail;
  298. break;
  299. default:
  300. av_log(logctx, AV_LOG_VERBOSE, "Ignoring NAL type %d in extradata\n",
  301. nal->type);
  302. break;
  303. }
  304. }
  305. fail:
  306. ff_h2645_packet_uninit(&pkt);
  307. return ret;
  308. }
  309. /* There are (invalid) samples in the wild with mp4-style extradata, where the
  310. * parameter sets are stored unescaped (i.e. as RBSP).
  311. * This function catches the parameter set decoding failure and tries again
  312. * after escaping it */
  313. static int decode_extradata_ps_mp4(const uint8_t *buf, int buf_size, H264ParamSets *ps,
  314. int err_recognition, void *logctx)
  315. {
  316. int ret;
  317. ret = decode_extradata_ps(buf, buf_size, ps, 1, logctx);
  318. if (ret < 0 && !(err_recognition & AV_EF_EXPLODE)) {
  319. GetByteContext gbc;
  320. PutByteContext pbc;
  321. uint8_t *escaped_buf;
  322. int escaped_buf_size;
  323. av_log(logctx, AV_LOG_WARNING,
  324. "SPS decoding failure, trying again after escaping the NAL\n");
  325. if (buf_size / 2 >= (INT16_MAX - AV_INPUT_BUFFER_PADDING_SIZE) / 3)
  326. return AVERROR(ERANGE);
  327. escaped_buf_size = buf_size * 3 / 2 + AV_INPUT_BUFFER_PADDING_SIZE;
  328. escaped_buf = av_mallocz(escaped_buf_size);
  329. if (!escaped_buf)
  330. return AVERROR(ENOMEM);
  331. bytestream2_init(&gbc, buf, buf_size);
  332. bytestream2_init_writer(&pbc, escaped_buf, escaped_buf_size);
  333. while (bytestream2_get_bytes_left(&gbc)) {
  334. if (bytestream2_get_bytes_left(&gbc) >= 3 &&
  335. bytestream2_peek_be24(&gbc) <= 3) {
  336. bytestream2_put_be24(&pbc, 3);
  337. bytestream2_skip(&gbc, 2);
  338. } else
  339. bytestream2_put_byte(&pbc, bytestream2_get_byte(&gbc));
  340. }
  341. escaped_buf_size = bytestream2_tell_p(&pbc);
  342. AV_WB16(escaped_buf, escaped_buf_size - 2);
  343. ret = decode_extradata_ps(escaped_buf, escaped_buf_size, ps, 1, logctx);
  344. av_freep(&escaped_buf);
  345. if (ret < 0)
  346. return ret;
  347. }
  348. return 0;
  349. }
  350. int ff_h264_decode_extradata(const uint8_t *data, int size, H264ParamSets *ps,
  351. int *is_avc, int *nal_length_size,
  352. int err_recognition, void *logctx)
  353. {
  354. int ret;
  355. if (data[0] == 1) {
  356. int i, cnt, nalsize;
  357. const uint8_t *p = data;
  358. *is_avc = 1;
  359. if (size < 7) {
  360. av_log(logctx, AV_LOG_ERROR, "avcC %d too short\n", size);
  361. return AVERROR_INVALIDDATA;
  362. }
  363. // Decode sps from avcC
  364. cnt = *(p + 5) & 0x1f; // Number of sps
  365. p += 6;
  366. for (i = 0; i < cnt; i++) {
  367. nalsize = AV_RB16(p) + 2;
  368. if (p - data + nalsize > size)
  369. return AVERROR_INVALIDDATA;
  370. ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
  371. if (ret < 0) {
  372. av_log(logctx, AV_LOG_ERROR,
  373. "Decoding sps %d from avcC failed\n", i);
  374. return ret;
  375. }
  376. p += nalsize;
  377. }
  378. // Decode pps from avcC
  379. cnt = *(p++); // Number of pps
  380. for (i = 0; i < cnt; i++) {
  381. nalsize = AV_RB16(p) + 2;
  382. if (p - data + nalsize > size)
  383. return AVERROR_INVALIDDATA;
  384. ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
  385. if (ret < 0) {
  386. av_log(logctx, AV_LOG_ERROR,
  387. "Decoding pps %d from avcC failed\n", i);
  388. return ret;
  389. }
  390. p += nalsize;
  391. }
  392. // Store right nal length size that will be used to parse all other nals
  393. *nal_length_size = (data[4] & 0x03) + 1;
  394. } else {
  395. *is_avc = 0;
  396. ret = decode_extradata_ps(data, size, ps, 0, logctx);
  397. if (ret < 0)
  398. return ret;
  399. }
  400. return 0;
  401. }
  402. /**
  403. * Compute profile from profile_idc and constraint_set?_flags.
  404. *
  405. * @param sps SPS
  406. *
  407. * @return profile as defined by FF_PROFILE_H264_*
  408. */
  409. int ff_h264_get_profile(const SPS *sps)
  410. {
  411. int profile = sps->profile_idc;
  412. switch (sps->profile_idc) {
  413. case FF_PROFILE_H264_BASELINE:
  414. // constraint_set1_flag set to 1
  415. profile |= (sps->constraint_set_flags & 1 << 1) ? FF_PROFILE_H264_CONSTRAINED : 0;
  416. break;
  417. case FF_PROFILE_H264_HIGH_10:
  418. case FF_PROFILE_H264_HIGH_422:
  419. case FF_PROFILE_H264_HIGH_444_PREDICTIVE:
  420. // constraint_set3_flag set to 1
  421. profile |= (sps->constraint_set_flags & 1 << 3) ? FF_PROFILE_H264_INTRA : 0;
  422. break;
  423. }
  424. return profile;
  425. }