You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

483 lines
14KB

  1. /*
  2. * HEVC video Decoder
  3. *
  4. * Copyright (C) 2012 - 2013 Guillaume Martres
  5. * Copyright (C) 2012 - 2013 Gildas Cocherel
  6. *
  7. * This file is part of FFmpeg.
  8. *
  9. * FFmpeg is free software; you can redistribute it and/or
  10. * modify it under the terms of the GNU Lesser General Public
  11. * License as published by the Free Software Foundation; either
  12. * version 2.1 of the License, or (at your option) any later version.
  13. *
  14. * FFmpeg is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  17. * Lesser General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU Lesser General Public
  20. * License along with FFmpeg; if not, write to the Free Software
  21. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  22. */
  23. #include "libavutil/pixdesc.h"
  24. #include "hevc.h"
  25. #include "internal.h"
  26. #include "thread.h"
  27. void ff_hevc_unref_frame(HEVCContext *s, HEVCFrame *frame, int flags)
  28. {
  29. /* frame->frame can be NULL if context init failed */
  30. if (!frame->frame || !frame->frame->buf[0])
  31. return;
  32. frame->flags &= ~flags;
  33. if (!frame->flags) {
  34. ff_thread_release_buffer(s->avctx, &frame->tf);
  35. av_buffer_unref(&frame->tab_mvf_buf);
  36. frame->tab_mvf = NULL;
  37. av_buffer_unref(&frame->rpl_buf);
  38. av_buffer_unref(&frame->rpl_tab_buf);
  39. frame->rpl_tab = NULL;
  40. frame->refPicList = NULL;
  41. frame->collocated_ref = NULL;
  42. }
  43. }
  44. RefPicList* ff_hevc_get_ref_list(HEVCContext *s, HEVCFrame *ref, int x0, int y0)
  45. {
  46. if (x0 < 0 || y0 < 0) {
  47. return s->ref->refPicList;
  48. } else {
  49. int x_cb = x0 >> s->sps->log2_ctb_size;
  50. int y_cb = y0 >> s->sps->log2_ctb_size;
  51. int pic_width_cb = (s->sps->width + (1<<s->sps->log2_ctb_size)-1 ) >> s->sps->log2_ctb_size;
  52. int ctb_addr_ts = s->pps->ctb_addr_rs_to_ts[y_cb * pic_width_cb + x_cb];
  53. return (RefPicList*) ref->rpl_tab[ctb_addr_ts];
  54. }
  55. }
  56. void ff_hevc_clear_refs(HEVCContext *s)
  57. {
  58. int i;
  59. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++)
  60. ff_hevc_unref_frame(s, &s->DPB[i],
  61. HEVC_FRAME_FLAG_SHORT_REF | HEVC_FRAME_FLAG_LONG_REF);
  62. }
  63. void ff_hevc_flush_dpb(HEVCContext *s)
  64. {
  65. int i;
  66. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++)
  67. ff_hevc_unref_frame(s, &s->DPB[i], ~0);
  68. }
  69. static HEVCFrame *alloc_frame(HEVCContext *s)
  70. {
  71. int i, j, ret;
  72. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
  73. HEVCFrame *frame = &s->DPB[i];
  74. if (frame->frame->buf[0])
  75. continue;
  76. ret = ff_thread_get_buffer(s->avctx, &frame->tf, AV_GET_BUFFER_FLAG_REF);
  77. if (ret < 0)
  78. return NULL;
  79. frame->rpl_buf = av_buffer_allocz(s->nb_nals * sizeof(RefPicListTab));
  80. if (!frame->rpl_buf)
  81. goto fail;
  82. frame->tab_mvf_buf = av_buffer_pool_get(s->tab_mvf_pool);
  83. if (!frame->tab_mvf_buf)
  84. goto fail;
  85. frame->tab_mvf = (MvField*)frame->tab_mvf_buf->data;
  86. frame->rpl_tab_buf = av_buffer_pool_get(s->rpl_tab_pool);
  87. if (!frame->rpl_tab_buf)
  88. goto fail;
  89. frame->rpl_tab = (RefPicListTab**)frame->rpl_tab_buf->data;
  90. frame->ctb_count = s->sps->ctb_width * s->sps->ctb_height;
  91. for (j = 0; j < frame->ctb_count; j++)
  92. frame->rpl_tab[j] = (RefPicListTab*)frame->rpl_buf->data;
  93. return frame;
  94. fail:
  95. ff_hevc_unref_frame(s, frame, ~0);
  96. return NULL;
  97. }
  98. av_log(s->avctx, AV_LOG_ERROR, "Error allocating frame, DPB full.\n");
  99. return NULL;
  100. }
  101. int ff_hevc_set_new_ref(HEVCContext *s, AVFrame **frame, int poc)
  102. {
  103. HEVCFrame *ref;
  104. int i;
  105. /* check that this POC doesn't already exist */
  106. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
  107. HEVCFrame *frame = &s->DPB[i];
  108. if (frame->frame->buf[0] && frame->sequence == s->seq_decode &&
  109. frame->poc == poc) {
  110. av_log(s->avctx, AV_LOG_ERROR, "Duplicate POC in a sequence: %d.\n",
  111. poc);
  112. return AVERROR_INVALIDDATA;
  113. }
  114. }
  115. ref = alloc_frame(s);
  116. if (!ref)
  117. return AVERROR(ENOMEM);
  118. *frame = ref->frame;
  119. s->ref = ref;
  120. ref->poc = poc;
  121. ref->flags = HEVC_FRAME_FLAG_OUTPUT | HEVC_FRAME_FLAG_SHORT_REF;
  122. ref->sequence = s->seq_decode;
  123. ref->window = s->sps->output_window;
  124. return 0;
  125. }
  126. int ff_hevc_output_frame(HEVCContext *s, AVFrame *out, int flush)
  127. {
  128. int nb_output = 0;
  129. int min_poc = 0xFFFF;
  130. int i, j, min_idx, ret;
  131. do {
  132. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
  133. HEVCFrame *frame = &s->DPB[i];
  134. if ((frame->flags & HEVC_FRAME_FLAG_OUTPUT) &&
  135. frame->sequence == s->seq_output) {
  136. nb_output++;
  137. if (frame->poc < min_poc) {
  138. min_poc = frame->poc;
  139. min_idx = i;
  140. }
  141. }
  142. }
  143. /* wait for more frames before output */
  144. if (!flush && s->seq_output == s->seq_decode && s->sps &&
  145. nb_output <= s->sps->temporal_layer[s->sps->max_sub_layers - 1].num_reorder_pics)
  146. return 0;
  147. if (nb_output) {
  148. HEVCFrame *frame = &s->DPB[min_idx];
  149. AVFrame *dst = out;
  150. AVFrame *src = frame->frame;
  151. const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(src->format);
  152. int pixel_shift = !!(desc->comp[0].depth_minus1 > 7);
  153. ret = av_frame_ref(out, src);
  154. ff_hevc_unref_frame(s, frame, HEVC_FRAME_FLAG_OUTPUT);
  155. if (ret < 0)
  156. return ret;
  157. for (j = 0; j < 3; j++) {
  158. int hshift = (j > 0) ? desc->log2_chroma_w : 0;
  159. int vshift = (j > 0) ? desc->log2_chroma_h : 0;
  160. int off = ((frame->window.left_offset >> hshift) << pixel_shift) +
  161. (frame->window.top_offset >> vshift) * dst->linesize[j];
  162. dst->data[j] += off;
  163. }
  164. av_log(s->avctx, AV_LOG_DEBUG, "Output frame with POC %d.\n", frame->poc);
  165. return 1;
  166. }
  167. if (s->seq_output != s->seq_decode)
  168. s->seq_output = (s->seq_output + 1) & 0xff;
  169. else
  170. break;
  171. } while (1);
  172. return 0;
  173. }
  174. static int init_slice_rpl(HEVCContext *s)
  175. {
  176. HEVCFrame *frame = s->ref;
  177. int ctb_count = frame->ctb_count;
  178. int ctb_addr_ts = s->pps->ctb_addr_rs_to_ts[s->sh.slice_segment_addr];
  179. int i;
  180. if (s->slice_idx >= frame->rpl_buf->size / sizeof(RefPicListTab))
  181. return AVERROR_INVALIDDATA;
  182. for (i = ctb_addr_ts; i < ctb_count; i++)
  183. frame->rpl_tab[i] = (RefPicListTab*)frame->rpl_buf->data + s->slice_idx;
  184. frame->refPicList = (RefPicList*)frame->rpl_tab[ctb_addr_ts];
  185. return 0;
  186. }
  187. int ff_hevc_slice_rpl(HEVCContext *s)
  188. {
  189. SliceHeader *sh = &s->sh;
  190. uint8_t nb_list = sh->slice_type == B_SLICE ? 2 : 1;
  191. uint8_t list_idx;
  192. int i, j, ret;
  193. ret = init_slice_rpl(s);
  194. if (ret < 0)
  195. return ret;
  196. if (!(s->rps[ST_CURR_BEF].nb_refs + s->rps[ST_CURR_AFT].nb_refs +
  197. s->rps[LT_CURR].nb_refs)) {
  198. av_log(s->avctx, AV_LOG_ERROR, "Zero refs in the frame RPS.\n");
  199. return AVERROR_INVALIDDATA;
  200. }
  201. for (list_idx = 0; list_idx < nb_list; list_idx++) {
  202. RefPicList rpl_tmp = { { 0 } };
  203. RefPicList *rpl = &s->ref->refPicList[list_idx];
  204. /* The order of the elements is
  205. * ST_CURR_BEF - ST_CURR_AFT - LT_CURR for the L0 and
  206. * ST_CURR_AFT - ST_CURR_BEF - LT_CURR for the L1
  207. */
  208. int cand_lists[3] = { list_idx ? ST_CURR_AFT : ST_CURR_BEF,
  209. list_idx ? ST_CURR_BEF : ST_CURR_AFT,
  210. LT_CURR };
  211. /* concatenate the candidate lists for the current frame */
  212. while (rpl_tmp.nb_refs < sh->nb_refs[list_idx]) {
  213. for (i = 0; i < FF_ARRAY_ELEMS(cand_lists); i++) {
  214. RefPicList *rps = &s->rps[cand_lists[i]];
  215. for (j = 0; j < rps->nb_refs; j++) {
  216. rpl_tmp.list[rpl_tmp.nb_refs] = rps->list[j];
  217. rpl_tmp.ref[rpl_tmp.nb_refs] = rps->ref[j];
  218. rpl_tmp.isLongTerm[rpl_tmp.nb_refs] = (i == 2);
  219. rpl_tmp.nb_refs++;
  220. }
  221. }
  222. }
  223. /* reorder the references if necessary */
  224. if (sh->rpl_modification_flag[list_idx]) {
  225. for (i = 0; i < sh->nb_refs[list_idx]; i++) {
  226. int idx = sh->list_entry_lx[list_idx][i];
  227. if (idx >= rpl_tmp.nb_refs) {
  228. av_log(s->avctx, AV_LOG_ERROR, "Invalid reference index.\n");
  229. return AVERROR_INVALIDDATA;
  230. }
  231. rpl->list[i] = rpl_tmp.list[idx];
  232. rpl->ref[i] = rpl_tmp.ref[idx];
  233. rpl->isLongTerm[i] = rpl_tmp.isLongTerm[idx];
  234. rpl->nb_refs++;
  235. }
  236. } else {
  237. memcpy(rpl, &rpl_tmp, sizeof(*rpl));
  238. rpl->nb_refs = FFMIN(rpl->nb_refs, sh->nb_refs[list_idx]);
  239. }
  240. if (sh->collocated_list == list_idx &&
  241. sh->collocated_ref_idx < rpl->nb_refs)
  242. s->ref->collocated_ref = rpl->ref[sh->collocated_ref_idx];
  243. }
  244. return 0;
  245. }
  246. static HEVCFrame *find_ref_idx(HEVCContext *s, int poc)
  247. {
  248. int i;
  249. int LtMask = (1 << s->sps->log2_max_poc_lsb) - 1;
  250. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
  251. HEVCFrame *ref = &s->DPB[i];
  252. if (ref->frame->buf[0] && (ref->sequence == s->seq_decode)) {
  253. if ((ref->poc & LtMask) == poc)
  254. return ref;
  255. }
  256. }
  257. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
  258. HEVCFrame *ref = &s->DPB[i];
  259. if (ref->frame->buf[0] && (ref->sequence == s->seq_decode)) {
  260. if (ref->poc == poc || (ref->poc & LtMask) == poc)
  261. return ref;
  262. }
  263. }
  264. av_log(s->avctx, AV_LOG_ERROR,
  265. "Could not find ref with POC %d\n", poc);
  266. return NULL;
  267. }
  268. static void mark_ref(HEVCFrame *frame, int flag)
  269. {
  270. frame->flags &= ~(HEVC_FRAME_FLAG_LONG_REF | HEVC_FRAME_FLAG_SHORT_REF);
  271. frame->flags |= flag;
  272. }
  273. static HEVCFrame *generate_missing_ref(HEVCContext *s, int poc)
  274. {
  275. HEVCFrame *frame;
  276. int i, x, y;
  277. frame = alloc_frame(s);
  278. if (!frame)
  279. return NULL;
  280. if (!s->sps->pixel_shift) {
  281. for (i = 0; frame->frame->buf[i]; i++)
  282. memset(frame->frame->buf[i]->data, 1 << (s->sps->bit_depth - 1),
  283. frame->frame->buf[i]->size);
  284. } else {
  285. for (i = 0; frame->frame->data[i]; i++)
  286. for (y = 0; y < (s->height >> s->sps->vshift[i]); y++)
  287. for (x = 0; x < (s->width >> s->sps->hshift[i]); x++) {
  288. AV_WN16(frame->frame->data[i] + y * frame->frame->linesize[i] + 2 * x,
  289. 1 << (s->sps->bit_depth - 1));
  290. }
  291. }
  292. frame->poc = poc;
  293. frame->sequence = s->seq_decode;
  294. frame->flags = 0;
  295. if (s->threads_type == FF_THREAD_FRAME)
  296. ff_thread_report_progress(&frame->tf, INT_MAX, 0);
  297. return frame;
  298. }
  299. /* add a reference with the given poc to the list and mark it as used in DPB */
  300. static int add_candidate_ref(HEVCContext *s, RefPicList *list,
  301. int poc, int ref_flag)
  302. {
  303. HEVCFrame *ref = find_ref_idx(s, poc);
  304. if (ref == s->ref)
  305. return AVERROR_INVALIDDATA;
  306. if (!ref) {
  307. ref = generate_missing_ref(s, poc);
  308. if (!ref)
  309. return AVERROR(ENOMEM);
  310. }
  311. list->list[list->nb_refs] = ref->poc;
  312. list->ref[list->nb_refs] = ref;
  313. list->nb_refs++;
  314. mark_ref(ref, ref_flag);
  315. return 0;
  316. }
  317. int ff_hevc_frame_rps(HEVCContext *s)
  318. {
  319. const ShortTermRPS *short_rps = s->sh.short_term_rps;
  320. const LongTermRPS *long_rps = &s->sh.long_term_rps;
  321. RefPicList *rps = s->rps;
  322. int i, ret;
  323. if (!short_rps)
  324. return 0;
  325. /* clear the reference flags on all frames except the current one */
  326. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++) {
  327. HEVCFrame *frame = &s->DPB[i];
  328. if (frame == s->ref)
  329. continue;
  330. mark_ref(frame, 0);
  331. }
  332. for (i = 0; i < NB_RPS_TYPE; i++)
  333. rps[i].nb_refs = 0;
  334. /* add the short refs */
  335. for (i = 0; i < short_rps->num_delta_pocs; i++) {
  336. int poc = s->poc + short_rps->delta_poc[i];
  337. int list;
  338. if (!short_rps->used[i])
  339. list = ST_FOLL;
  340. else if (i < short_rps->num_negative_pics)
  341. list = ST_CURR_BEF;
  342. else
  343. list = ST_CURR_AFT;
  344. ret = add_candidate_ref(s, &rps[list], poc, HEVC_FRAME_FLAG_SHORT_REF);
  345. if (ret < 0)
  346. return ret;
  347. }
  348. /* add the long refs */
  349. for (i = 0; i < long_rps->nb_refs; i++) {
  350. int poc = long_rps->poc[i];
  351. int list = long_rps->used[i] ? LT_CURR : LT_FOLL;
  352. ret = add_candidate_ref(s, &rps[list], poc, HEVC_FRAME_FLAG_LONG_REF);
  353. if (ret < 0)
  354. return ret;
  355. }
  356. /* release any frames that are now unused */
  357. for (i = 0; i < FF_ARRAY_ELEMS(s->DPB); i++)
  358. ff_hevc_unref_frame(s, &s->DPB[i], 0);
  359. return 0;
  360. }
  361. int ff_hevc_compute_poc(HEVCContext *s, int poc_lsb)
  362. {
  363. int max_poc_lsb = 1 << s->sps->log2_max_poc_lsb;
  364. int prev_poc_lsb = s->pocTid0 % max_poc_lsb;
  365. int prev_poc_msb = s->pocTid0 - prev_poc_lsb;
  366. int poc_msb;
  367. if ((poc_lsb < prev_poc_lsb) && ((prev_poc_lsb - poc_lsb) >= max_poc_lsb / 2))
  368. poc_msb = prev_poc_msb + max_poc_lsb;
  369. else if ((poc_lsb > prev_poc_lsb) && ((poc_lsb - prev_poc_lsb) > (max_poc_lsb / 2)))
  370. poc_msb = prev_poc_msb - max_poc_lsb;
  371. else
  372. poc_msb = prev_poc_msb;
  373. // For BLA picture types, POCmsb is set to 0.
  374. if (s->nal_unit_type == NAL_BLA_W_LP ||
  375. s->nal_unit_type == NAL_BLA_W_RADL ||
  376. s->nal_unit_type == NAL_BLA_N_LP)
  377. poc_msb = 0;
  378. return poc_msb + poc_lsb;
  379. }
  380. int ff_hevc_frame_nb_refs(HEVCContext *s)
  381. {
  382. int ret = 0;
  383. int i;
  384. const ShortTermRPS *rps = s->sh.short_term_rps;
  385. LongTermRPS *long_rps = &s->sh.long_term_rps;
  386. if (rps) {
  387. for (i = 0; i < rps->num_negative_pics; i++)
  388. ret += !!rps->used[i];
  389. for (; i < rps->num_delta_pocs; i++)
  390. ret += !!rps->used[i];
  391. }
  392. if (long_rps) {
  393. for (i = 0; i < long_rps->nb_refs; i++)
  394. ret += !!long_rps->used[i];
  395. }
  396. return ret;
  397. }