You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1122 lines
40KB

  1. /*
  2. * FFV1 decoder
  3. *
  4. * Copyright (c) 2003-2013 Michael Niedermayer <michaelni@gmx.at>
  5. *
  6. * This file is part of FFmpeg.
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with FFmpeg; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. /**
  23. * @file
  24. * FF Video Codec 1 (a lossless codec) decoder
  25. */
  26. #include "libavutil/avassert.h"
  27. #include "libavutil/crc.h"
  28. #include "libavutil/opt.h"
  29. #include "libavutil/imgutils.h"
  30. #include "libavutil/pixdesc.h"
  31. #include "libavutil/timer.h"
  32. #include "avcodec.h"
  33. #include "internal.h"
  34. #include "get_bits.h"
  35. #include "rangecoder.h"
  36. #include "golomb.h"
  37. #include "mathops.h"
  38. #include "ffv1.h"
  39. static inline av_flatten int get_symbol_inline(RangeCoder *c, uint8_t *state,
  40. int is_signed)
  41. {
  42. if (get_rac(c, state + 0))
  43. return 0;
  44. else {
  45. int i, e, a;
  46. e = 0;
  47. while (get_rac(c, state + 1 + FFMIN(e, 9))) { // 1..10
  48. e++;
  49. if (e > 31)
  50. return AVERROR_INVALIDDATA;
  51. }
  52. a = 1;
  53. for (i = e - 1; i >= 0; i--)
  54. a += a + get_rac(c, state + 22 + FFMIN(i, 9)); // 22..31
  55. e = -(is_signed && get_rac(c, state + 11 + FFMIN(e, 10))); // 11..21
  56. return (a ^ e) - e;
  57. }
  58. }
  59. static av_noinline int get_symbol(RangeCoder *c, uint8_t *state, int is_signed)
  60. {
  61. return get_symbol_inline(c, state, is_signed);
  62. }
  63. static inline int get_vlc_symbol(GetBitContext *gb, VlcState *const state,
  64. int bits)
  65. {
  66. int k, i, v, ret;
  67. i = state->count;
  68. k = 0;
  69. while (i < state->error_sum) { // FIXME: optimize
  70. k++;
  71. i += i;
  72. }
  73. v = get_sr_golomb(gb, k, 12, bits);
  74. av_dlog(NULL, "v:%d bias:%d error:%d drift:%d count:%d k:%d",
  75. v, state->bias, state->error_sum, state->drift, state->count, k);
  76. #if 0 // JPEG LS
  77. if (k == 0 && 2 * state->drift <= -state->count)
  78. v ^= (-1);
  79. #else
  80. v ^= ((2 * state->drift + state->count) >> 31);
  81. #endif
  82. ret = fold(v + state->bias, bits);
  83. update_vlc_state(state, v);
  84. return ret;
  85. }
  86. static av_always_inline void decode_line(FFV1Context *s, int w,
  87. int16_t *sample[2],
  88. int plane_index, int bits)
  89. {
  90. PlaneContext *const p = &s->plane[plane_index];
  91. RangeCoder *const c = &s->c;
  92. int x;
  93. int run_count = 0;
  94. int run_mode = 0;
  95. int run_index = s->run_index;
  96. if (s->slice_coding_mode == 1) {
  97. int i;
  98. for (x = 0; x < w; x++) {
  99. int v = 0;
  100. for (i=0; i<bits; i++) {
  101. uint8_t state = 128;
  102. v += v + get_rac(c, &state);
  103. }
  104. sample[1][x] = v;
  105. }
  106. return;
  107. }
  108. for (x = 0; x < w; x++) {
  109. int diff, context, sign;
  110. context = get_context(p, sample[1] + x, sample[0] + x, sample[1] + x);
  111. if (context < 0) {
  112. context = -context;
  113. sign = 1;
  114. } else
  115. sign = 0;
  116. av_assert2(context < p->context_count);
  117. if (s->ac) {
  118. diff = get_symbol_inline(c, p->state[context], 1);
  119. } else {
  120. if (context == 0 && run_mode == 0)
  121. run_mode = 1;
  122. if (run_mode) {
  123. if (run_count == 0 && run_mode == 1) {
  124. if (get_bits1(&s->gb)) {
  125. run_count = 1 << ff_log2_run[run_index];
  126. if (x + run_count <= w)
  127. run_index++;
  128. } else {
  129. if (ff_log2_run[run_index])
  130. run_count = get_bits(&s->gb, ff_log2_run[run_index]);
  131. else
  132. run_count = 0;
  133. if (run_index)
  134. run_index--;
  135. run_mode = 2;
  136. }
  137. }
  138. run_count--;
  139. if (run_count < 0) {
  140. run_mode = 0;
  141. run_count = 0;
  142. diff = get_vlc_symbol(&s->gb, &p->vlc_state[context],
  143. bits);
  144. if (diff >= 0)
  145. diff++;
  146. } else
  147. diff = 0;
  148. } else
  149. diff = get_vlc_symbol(&s->gb, &p->vlc_state[context], bits);
  150. av_dlog(s->avctx, "count:%d index:%d, mode:%d, x:%d pos:%d\n",
  151. run_count, run_index, run_mode, x, get_bits_count(&s->gb));
  152. }
  153. if (sign)
  154. diff = -diff;
  155. sample[1][x] = (predict(sample[1] + x, sample[0] + x) + diff) &
  156. ((1 << bits) - 1);
  157. }
  158. s->run_index = run_index;
  159. }
  160. static void decode_plane(FFV1Context *s, uint8_t *src,
  161. int w, int h, int stride, int plane_index)
  162. {
  163. int x, y;
  164. int16_t *sample[2];
  165. sample[0] = s->sample_buffer + 3;
  166. sample[1] = s->sample_buffer + w + 6 + 3;
  167. s->run_index = 0;
  168. memset(s->sample_buffer, 0, 2 * (w + 6) * sizeof(*s->sample_buffer));
  169. for (y = 0; y < h; y++) {
  170. int16_t *temp = sample[0]; // FIXME: try a normal buffer
  171. sample[0] = sample[1];
  172. sample[1] = temp;
  173. sample[1][-1] = sample[0][0];
  174. sample[0][w] = sample[0][w - 1];
  175. // { START_TIMER
  176. if (s->avctx->bits_per_raw_sample <= 8) {
  177. decode_line(s, w, sample, plane_index, 8);
  178. for (x = 0; x < w; x++)
  179. src[x + stride * y] = sample[1][x];
  180. } else {
  181. decode_line(s, w, sample, plane_index, s->avctx->bits_per_raw_sample);
  182. if (s->packed_at_lsb) {
  183. for (x = 0; x < w; x++) {
  184. ((uint16_t*)(src + stride*y))[x] = sample[1][x];
  185. }
  186. } else {
  187. for (x = 0; x < w; x++) {
  188. ((uint16_t*)(src + stride*y))[x] = sample[1][x] << (16 - s->avctx->bits_per_raw_sample);
  189. }
  190. }
  191. }
  192. // STOP_TIMER("decode-line") }
  193. }
  194. }
  195. static void decode_rgb_frame(FFV1Context *s, uint8_t *src[3], int w, int h, int stride[3])
  196. {
  197. int x, y, p;
  198. int16_t *sample[4][2];
  199. int lbd = s->avctx->bits_per_raw_sample <= 8;
  200. int bits = s->avctx->bits_per_raw_sample > 0 ? s->avctx->bits_per_raw_sample : 8;
  201. int offset = 1 << bits;
  202. for (x = 0; x < 4; x++) {
  203. sample[x][0] = s->sample_buffer + x * 2 * (w + 6) + 3;
  204. sample[x][1] = s->sample_buffer + (x * 2 + 1) * (w + 6) + 3;
  205. }
  206. s->run_index = 0;
  207. memset(s->sample_buffer, 0, 8 * (w + 6) * sizeof(*s->sample_buffer));
  208. for (y = 0; y < h; y++) {
  209. for (p = 0; p < 3 + s->transparency; p++) {
  210. int16_t *temp = sample[p][0]; // FIXME: try a normal buffer
  211. sample[p][0] = sample[p][1];
  212. sample[p][1] = temp;
  213. sample[p][1][-1]= sample[p][0][0 ];
  214. sample[p][0][ w]= sample[p][0][w-1];
  215. if (lbd && s->slice_coding_mode == 0)
  216. decode_line(s, w, sample[p], (p + 1)/2, 9);
  217. else
  218. decode_line(s, w, sample[p], (p + 1)/2, bits + (s->slice_coding_mode != 1));
  219. }
  220. for (x = 0; x < w; x++) {
  221. int g = sample[0][1][x];
  222. int b = sample[1][1][x];
  223. int r = sample[2][1][x];
  224. int a = sample[3][1][x];
  225. if (s->slice_coding_mode != 1) {
  226. b -= offset;
  227. r -= offset;
  228. g -= (b * s->slice_rct_by_coef + r * s->slice_rct_ry_coef) >> 2;
  229. b += g;
  230. r += g;
  231. }
  232. if (lbd)
  233. *((uint32_t*)(src[0] + x*4 + stride[0]*y)) = b + (g<<8) + (r<<16) + (a<<24);
  234. else {
  235. *((uint16_t*)(src[0] + x*2 + stride[0]*y)) = b;
  236. *((uint16_t*)(src[1] + x*2 + stride[1]*y)) = g;
  237. *((uint16_t*)(src[2] + x*2 + stride[2]*y)) = r;
  238. }
  239. }
  240. }
  241. }
  242. static int decode_slice_header(FFV1Context *f, FFV1Context *fs)
  243. {
  244. RangeCoder *c = &fs->c;
  245. uint8_t state[CONTEXT_SIZE];
  246. unsigned ps, i, context_count;
  247. memset(state, 128, sizeof(state));
  248. av_assert0(f->version > 2);
  249. fs->slice_x = get_symbol(c, state, 0) * f->width ;
  250. fs->slice_y = get_symbol(c, state, 0) * f->height;
  251. fs->slice_width = (get_symbol(c, state, 0) + 1) * f->width + fs->slice_x;
  252. fs->slice_height = (get_symbol(c, state, 0) + 1) * f->height + fs->slice_y;
  253. fs->slice_x /= f->num_h_slices;
  254. fs->slice_y /= f->num_v_slices;
  255. fs->slice_width = fs->slice_width /f->num_h_slices - fs->slice_x;
  256. fs->slice_height = fs->slice_height/f->num_v_slices - fs->slice_y;
  257. if ((unsigned)fs->slice_width > f->width || (unsigned)fs->slice_height > f->height)
  258. return -1;
  259. if ( (unsigned)fs->slice_x + (uint64_t)fs->slice_width > f->width
  260. || (unsigned)fs->slice_y + (uint64_t)fs->slice_height > f->height)
  261. return -1;
  262. for (i = 0; i < f->plane_count; i++) {
  263. PlaneContext * const p = &fs->plane[i];
  264. int idx = get_symbol(c, state, 0);
  265. if (idx >= (unsigned)f->quant_table_count) {
  266. av_log(f->avctx, AV_LOG_ERROR, "quant_table_index out of range\n");
  267. return -1;
  268. }
  269. p->quant_table_index = idx;
  270. memcpy(p->quant_table, f->quant_tables[idx], sizeof(p->quant_table));
  271. context_count = f->context_count[idx];
  272. if (p->context_count < context_count) {
  273. av_freep(&p->state);
  274. av_freep(&p->vlc_state);
  275. }
  276. p->context_count = context_count;
  277. }
  278. ps = get_symbol(c, state, 0);
  279. if (ps == 1) {
  280. f->cur->interlaced_frame = 1;
  281. f->cur->top_field_first = 1;
  282. } else if (ps == 2) {
  283. f->cur->interlaced_frame = 1;
  284. f->cur->top_field_first = 0;
  285. } else if (ps == 3) {
  286. f->cur->interlaced_frame = 0;
  287. }
  288. f->cur->sample_aspect_ratio.num = get_symbol(c, state, 0);
  289. f->cur->sample_aspect_ratio.den = get_symbol(c, state, 0);
  290. if (av_image_check_sar(f->width, f->height,
  291. f->cur->sample_aspect_ratio) < 0) {
  292. av_log(f->avctx, AV_LOG_WARNING, "ignoring invalid SAR: %u/%u\n",
  293. f->cur->sample_aspect_ratio.num,
  294. f->cur->sample_aspect_ratio.den);
  295. f->cur->sample_aspect_ratio = (AVRational){ 0, 1 };
  296. }
  297. if (fs->version > 3) {
  298. fs->slice_reset_contexts = get_rac(c, state);
  299. fs->slice_coding_mode = get_symbol(c, state, 0);
  300. if (fs->slice_coding_mode != 1) {
  301. fs->slice_rct_by_coef = get_symbol(c, state, 0);
  302. fs->slice_rct_ry_coef = get_symbol(c, state, 0);
  303. if ((uint64_t)fs->slice_rct_by_coef + (uint64_t)fs->slice_rct_ry_coef > 4) {
  304. av_log(f->avctx, AV_LOG_ERROR, "slice_rct_y_coef out of range\n");
  305. return AVERROR_INVALIDDATA;
  306. }
  307. }
  308. }
  309. return 0;
  310. }
  311. static int decode_slice(AVCodecContext *c, void *arg)
  312. {
  313. FFV1Context *fs = *(void **)arg;
  314. FFV1Context *f = fs->avctx->priv_data;
  315. int width, height, x, y, ret;
  316. const int ps = av_pix_fmt_desc_get(c->pix_fmt)->comp[0].step_minus1 + 1;
  317. AVFrame * const p = f->cur;
  318. int i, si;
  319. for( si=0; fs != f->slice_context[si]; si ++)
  320. ;
  321. if(f->fsrc && !p->key_frame)
  322. ff_thread_await_progress(&f->last_picture, si, 0);
  323. if(f->fsrc && !p->key_frame) {
  324. FFV1Context *fssrc = f->fsrc->slice_context[si];
  325. FFV1Context *fsdst = f->slice_context[si];
  326. av_assert1(fsdst->plane_count == fssrc->plane_count);
  327. av_assert1(fsdst == fs);
  328. if (!p->key_frame)
  329. fsdst->slice_damaged |= fssrc->slice_damaged;
  330. for (i = 0; i < f->plane_count; i++) {
  331. PlaneContext *psrc = &fssrc->plane[i];
  332. PlaneContext *pdst = &fsdst->plane[i];
  333. av_free(pdst->state);
  334. av_free(pdst->vlc_state);
  335. memcpy(pdst, psrc, sizeof(*pdst));
  336. pdst->state = NULL;
  337. pdst->vlc_state = NULL;
  338. if (fssrc->ac) {
  339. pdst->state = av_malloc_array(CONTEXT_SIZE, psrc->context_count);
  340. memcpy(pdst->state, psrc->state, CONTEXT_SIZE * psrc->context_count);
  341. } else {
  342. pdst->vlc_state = av_malloc_array(sizeof(*pdst->vlc_state), psrc->context_count);
  343. memcpy(pdst->vlc_state, psrc->vlc_state, sizeof(*pdst->vlc_state) * psrc->context_count);
  344. }
  345. }
  346. }
  347. fs->slice_rct_by_coef = 1;
  348. fs->slice_rct_ry_coef = 1;
  349. if (f->version > 2) {
  350. if (ffv1_init_slice_state(f, fs) < 0)
  351. return AVERROR(ENOMEM);
  352. if (decode_slice_header(f, fs) < 0) {
  353. fs->slice_x = fs->slice_y = fs->slice_height = fs->slice_width = 0;
  354. fs->slice_damaged = 1;
  355. return AVERROR_INVALIDDATA;
  356. }
  357. }
  358. if ((ret = ffv1_init_slice_state(f, fs)) < 0)
  359. return ret;
  360. if (f->cur->key_frame || fs->slice_reset_contexts)
  361. ffv1_clear_slice_state(f, fs);
  362. width = fs->slice_width;
  363. height = fs->slice_height;
  364. x = fs->slice_x;
  365. y = fs->slice_y;
  366. if (!fs->ac) {
  367. if (f->version == 3 && f->micro_version > 1 || f->version > 3)
  368. get_rac(&fs->c, (uint8_t[]) { 129 });
  369. fs->ac_byte_count = f->version > 2 || (!x && !y) ? fs->c.bytestream - fs->c.bytestream_start - 1 : 0;
  370. init_get_bits(&fs->gb,
  371. fs->c.bytestream_start + fs->ac_byte_count,
  372. (fs->c.bytestream_end - fs->c.bytestream_start - fs->ac_byte_count) * 8);
  373. }
  374. av_assert1(width && height);
  375. if (f->colorspace == 0) {
  376. const int chroma_width = FF_CEIL_RSHIFT(width, f->chroma_h_shift);
  377. const int chroma_height = FF_CEIL_RSHIFT(height, f->chroma_v_shift);
  378. const int cx = x >> f->chroma_h_shift;
  379. const int cy = y >> f->chroma_v_shift;
  380. decode_plane(fs, p->data[0] + ps*x + y*p->linesize[0], width, height, p->linesize[0], 0);
  381. if (f->chroma_planes) {
  382. decode_plane(fs, p->data[1] + ps*cx+cy*p->linesize[1], chroma_width, chroma_height, p->linesize[1], 1);
  383. decode_plane(fs, p->data[2] + ps*cx+cy*p->linesize[2], chroma_width, chroma_height, p->linesize[2], 1);
  384. }
  385. if (fs->transparency)
  386. decode_plane(fs, p->data[3] + ps*x + y*p->linesize[3], width, height, p->linesize[3], 2);
  387. } else {
  388. uint8_t *planes[3] = { p->data[0] + ps * x + y * p->linesize[0],
  389. p->data[1] + ps * x + y * p->linesize[1],
  390. p->data[2] + ps * x + y * p->linesize[2] };
  391. decode_rgb_frame(fs, planes, width, height, p->linesize);
  392. }
  393. if (fs->ac && f->version > 2) {
  394. int v;
  395. get_rac(&fs->c, (uint8_t[]) { 129 });
  396. v = fs->c.bytestream_end - fs->c.bytestream - 2 - 5*f->ec;
  397. if (v) {
  398. av_log(f->avctx, AV_LOG_ERROR, "bytestream end mismatching by %d\n", v);
  399. fs->slice_damaged = 1;
  400. }
  401. }
  402. emms_c();
  403. ff_thread_report_progress(&f->picture, si, 0);
  404. return 0;
  405. }
  406. static int read_quant_table(RangeCoder *c, int16_t *quant_table, int scale)
  407. {
  408. int v;
  409. int i = 0;
  410. uint8_t state[CONTEXT_SIZE];
  411. memset(state, 128, sizeof(state));
  412. for (v = 0; i < 128; v++) {
  413. unsigned len = get_symbol(c, state, 0) + 1;
  414. if (len > 128 - i)
  415. return AVERROR_INVALIDDATA;
  416. while (len--) {
  417. quant_table[i] = scale * v;
  418. i++;
  419. }
  420. }
  421. for (i = 1; i < 128; i++)
  422. quant_table[256 - i] = -quant_table[i];
  423. quant_table[128] = -quant_table[127];
  424. return 2 * v - 1;
  425. }
  426. static int read_quant_tables(RangeCoder *c,
  427. int16_t quant_table[MAX_CONTEXT_INPUTS][256])
  428. {
  429. int i;
  430. int context_count = 1;
  431. for (i = 0; i < 5; i++) {
  432. int ret = read_quant_table(c, quant_table[i], context_count);
  433. if (ret < 0)
  434. return ret;
  435. context_count *= ret;
  436. if (context_count > 32768U) {
  437. return AVERROR_INVALIDDATA;
  438. }
  439. }
  440. return (context_count + 1) / 2;
  441. }
  442. static int read_extra_header(FFV1Context *f)
  443. {
  444. RangeCoder *const c = &f->c;
  445. uint8_t state[CONTEXT_SIZE];
  446. int i, j, k, ret;
  447. uint8_t state2[32][CONTEXT_SIZE];
  448. memset(state2, 128, sizeof(state2));
  449. memset(state, 128, sizeof(state));
  450. ff_init_range_decoder(c, f->avctx->extradata, f->avctx->extradata_size);
  451. ff_build_rac_states(c, 0.05 * (1LL << 32), 256 - 8);
  452. f->version = get_symbol(c, state, 0);
  453. if (f->version < 2) {
  454. av_log(f->avctx, AV_LOG_ERROR, "Invalid version in global header\n");
  455. return AVERROR_INVALIDDATA;
  456. }
  457. if (f->version > 2) {
  458. c->bytestream_end -= 4;
  459. f->micro_version = get_symbol(c, state, 0);
  460. }
  461. f->ac = f->avctx->coder_type = get_symbol(c, state, 0);
  462. if (f->ac > 1) {
  463. for (i = 1; i < 256; i++)
  464. f->state_transition[i] = get_symbol(c, state, 1) + c->one_state[i];
  465. }
  466. f->colorspace = get_symbol(c, state, 0); //YUV cs type
  467. f->avctx->bits_per_raw_sample = get_symbol(c, state, 0);
  468. f->chroma_planes = get_rac(c, state);
  469. f->chroma_h_shift = get_symbol(c, state, 0);
  470. f->chroma_v_shift = get_symbol(c, state, 0);
  471. f->transparency = get_rac(c, state);
  472. f->plane_count = 1 + (f->chroma_planes || f->version<4) + f->transparency;
  473. f->num_h_slices = 1 + get_symbol(c, state, 0);
  474. f->num_v_slices = 1 + get_symbol(c, state, 0);
  475. if (f->chroma_h_shift > 4U || f->chroma_v_shift > 4U) {
  476. av_log(f->avctx, AV_LOG_ERROR, "chroma shift parameters %d %d are invalid\n",
  477. f->chroma_h_shift, f->chroma_v_shift);
  478. return AVERROR_INVALIDDATA;
  479. }
  480. if (f->num_h_slices > (unsigned)f->width || !f->num_h_slices ||
  481. f->num_v_slices > (unsigned)f->height || !f->num_v_slices
  482. ) {
  483. av_log(f->avctx, AV_LOG_ERROR, "slice count invalid\n");
  484. return AVERROR_INVALIDDATA;
  485. }
  486. f->quant_table_count = get_symbol(c, state, 0);
  487. if (f->quant_table_count > (unsigned)MAX_QUANT_TABLES || !f->quant_table_count) {
  488. av_log(f->avctx, AV_LOG_ERROR, "quant table count %d is invalid\n", f->quant_table_count);
  489. f->quant_table_count = 0;
  490. return AVERROR_INVALIDDATA;
  491. }
  492. for (i = 0; i < f->quant_table_count; i++) {
  493. f->context_count[i] = read_quant_tables(c, f->quant_tables[i]);
  494. if (f->context_count[i] < 0) {
  495. av_log(f->avctx, AV_LOG_ERROR, "read_quant_table error\n");
  496. return AVERROR_INVALIDDATA;
  497. }
  498. }
  499. if ((ret = ffv1_allocate_initial_states(f)) < 0)
  500. return ret;
  501. for (i = 0; i < f->quant_table_count; i++)
  502. if (get_rac(c, state)) {
  503. for (j = 0; j < f->context_count[i]; j++)
  504. for (k = 0; k < CONTEXT_SIZE; k++) {
  505. int pred = j ? f->initial_states[i][j - 1][k] : 128;
  506. f->initial_states[i][j][k] =
  507. (pred + get_symbol(c, state2[k], 1)) & 0xFF;
  508. }
  509. }
  510. if (f->version > 2) {
  511. f->ec = get_symbol(c, state, 0);
  512. if (f->micro_version > 2)
  513. f->intra = get_symbol(c, state, 0);
  514. }
  515. if (f->version > 2) {
  516. unsigned v;
  517. v = av_crc(av_crc_get_table(AV_CRC_32_IEEE), 0,
  518. f->avctx->extradata, f->avctx->extradata_size);
  519. if (v) {
  520. av_log(f->avctx, AV_LOG_ERROR, "CRC mismatch %X!\n", v);
  521. return AVERROR_INVALIDDATA;
  522. }
  523. }
  524. if (f->avctx->debug & FF_DEBUG_PICT_INFO)
  525. av_log(f->avctx, AV_LOG_DEBUG,
  526. "global: ver:%d.%d, coder:%d, colorspace: %d bpr:%d chroma:%d(%d:%d), alpha:%d slices:%dx%d qtabs:%d ec:%d intra:%d\n",
  527. f->version, f->micro_version,
  528. f->ac,
  529. f->colorspace,
  530. f->avctx->bits_per_raw_sample,
  531. f->chroma_planes, f->chroma_h_shift, f->chroma_v_shift,
  532. f->transparency,
  533. f->num_h_slices, f->num_v_slices,
  534. f->quant_table_count,
  535. f->ec,
  536. f->intra
  537. );
  538. return 0;
  539. }
  540. static int read_header(FFV1Context *f)
  541. {
  542. uint8_t state[CONTEXT_SIZE];
  543. int i, j, context_count = -1; //-1 to avoid warning
  544. RangeCoder *const c = &f->slice_context[0]->c;
  545. memset(state, 128, sizeof(state));
  546. if (f->version < 2) {
  547. int chroma_planes, chroma_h_shift, chroma_v_shift, transparency, colorspace, bits_per_raw_sample;
  548. unsigned v= get_symbol(c, state, 0);
  549. if (v >= 2) {
  550. av_log(f->avctx, AV_LOG_ERROR, "invalid version %d in ver01 header\n", v);
  551. return AVERROR_INVALIDDATA;
  552. }
  553. f->version = v;
  554. f->ac = f->avctx->coder_type = get_symbol(c, state, 0);
  555. if (f->ac > 1) {
  556. for (i = 1; i < 256; i++)
  557. f->state_transition[i] = get_symbol(c, state, 1) + c->one_state[i];
  558. }
  559. colorspace = get_symbol(c, state, 0); //YUV cs type
  560. bits_per_raw_sample = f->version > 0 ? get_symbol(c, state, 0) : f->avctx->bits_per_raw_sample;
  561. chroma_planes = get_rac(c, state);
  562. chroma_h_shift = get_symbol(c, state, 0);
  563. chroma_v_shift = get_symbol(c, state, 0);
  564. transparency = get_rac(c, state);
  565. if (f->plane_count) {
  566. if (colorspace != f->colorspace ||
  567. bits_per_raw_sample != f->avctx->bits_per_raw_sample ||
  568. chroma_planes != f->chroma_planes ||
  569. chroma_h_shift != f->chroma_h_shift ||
  570. chroma_v_shift != f->chroma_v_shift ||
  571. transparency != f->transparency) {
  572. av_log(f->avctx, AV_LOG_ERROR, "Invalid change of global parameters\n");
  573. return AVERROR_INVALIDDATA;
  574. }
  575. }
  576. if (chroma_h_shift > 4U || chroma_v_shift > 4U) {
  577. av_log(f->avctx, AV_LOG_ERROR, "chroma shift parameters %d %d are invalid\n",
  578. chroma_h_shift, chroma_v_shift);
  579. return AVERROR_INVALIDDATA;
  580. }
  581. f->colorspace = colorspace;
  582. f->avctx->bits_per_raw_sample = bits_per_raw_sample;
  583. f->chroma_planes = chroma_planes;
  584. f->chroma_h_shift = chroma_h_shift;
  585. f->chroma_v_shift = chroma_v_shift;
  586. f->transparency = transparency;
  587. f->plane_count = 2 + f->transparency;
  588. }
  589. if (f->colorspace == 0) {
  590. if (f->avctx->skip_alpha) f->transparency = 0;
  591. if (!f->transparency && !f->chroma_planes) {
  592. if (f->avctx->bits_per_raw_sample <= 8)
  593. f->avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  594. else
  595. f->avctx->pix_fmt = AV_PIX_FMT_GRAY16;
  596. } else if (f->avctx->bits_per_raw_sample<=8 && !f->transparency) {
  597. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  598. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P; break;
  599. case 0x01: f->avctx->pix_fmt = AV_PIX_FMT_YUV440P; break;
  600. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P; break;
  601. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P; break;
  602. case 0x20: f->avctx->pix_fmt = AV_PIX_FMT_YUV411P; break;
  603. case 0x22: f->avctx->pix_fmt = AV_PIX_FMT_YUV410P; break;
  604. }
  605. } else if (f->avctx->bits_per_raw_sample <= 8 && f->transparency) {
  606. switch(16*f->chroma_h_shift + f->chroma_v_shift) {
  607. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P; break;
  608. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P; break;
  609. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P; break;
  610. }
  611. } else if (f->avctx->bits_per_raw_sample == 9 && !f->transparency) {
  612. f->packed_at_lsb = 1;
  613. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  614. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P9; break;
  615. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P9; break;
  616. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P9; break;
  617. }
  618. } else if (f->avctx->bits_per_raw_sample == 9 && f->transparency) {
  619. f->packed_at_lsb = 1;
  620. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  621. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P9; break;
  622. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P9; break;
  623. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P9; break;
  624. }
  625. } else if (f->avctx->bits_per_raw_sample == 10 && !f->transparency) {
  626. f->packed_at_lsb = 1;
  627. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  628. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P10; break;
  629. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P10; break;
  630. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P10; break;
  631. }
  632. } else if (f->avctx->bits_per_raw_sample == 10 && f->transparency) {
  633. f->packed_at_lsb = 1;
  634. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  635. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P10; break;
  636. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P10; break;
  637. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P10; break;
  638. }
  639. } else if (f->avctx->bits_per_raw_sample == 16 && !f->transparency){
  640. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  641. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P16; break;
  642. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P16; break;
  643. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P16; break;
  644. }
  645. } else if (f->avctx->bits_per_raw_sample == 16 && f->transparency){
  646. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  647. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P16; break;
  648. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P16; break;
  649. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P16; break;
  650. }
  651. }
  652. } else if (f->colorspace == 1) {
  653. if (f->chroma_h_shift || f->chroma_v_shift) {
  654. av_log(f->avctx, AV_LOG_ERROR,
  655. "chroma subsampling not supported in this colorspace\n");
  656. return AVERROR(ENOSYS);
  657. }
  658. if ( f->avctx->bits_per_raw_sample == 9)
  659. f->avctx->pix_fmt = AV_PIX_FMT_GBRP9;
  660. else if (f->avctx->bits_per_raw_sample == 10)
  661. f->avctx->pix_fmt = AV_PIX_FMT_GBRP10;
  662. else if (f->avctx->bits_per_raw_sample == 12)
  663. f->avctx->pix_fmt = AV_PIX_FMT_GBRP12;
  664. else if (f->avctx->bits_per_raw_sample == 14)
  665. f->avctx->pix_fmt = AV_PIX_FMT_GBRP14;
  666. else
  667. if (f->transparency) f->avctx->pix_fmt = AV_PIX_FMT_RGB32;
  668. else f->avctx->pix_fmt = AV_PIX_FMT_0RGB32;
  669. } else {
  670. av_log(f->avctx, AV_LOG_ERROR, "colorspace not supported\n");
  671. return AVERROR(ENOSYS);
  672. }
  673. if (f->avctx->pix_fmt == AV_PIX_FMT_NONE) {
  674. av_log(f->avctx, AV_LOG_ERROR, "format not supported\n");
  675. return AVERROR(ENOSYS);
  676. }
  677. av_dlog(f->avctx, "%d %d %d\n",
  678. f->chroma_h_shift, f->chroma_v_shift, f->avctx->pix_fmt);
  679. if (f->version < 2) {
  680. context_count = read_quant_tables(c, f->quant_table);
  681. if (context_count < 0) {
  682. av_log(f->avctx, AV_LOG_ERROR, "read_quant_table error\n");
  683. return AVERROR_INVALIDDATA;
  684. }
  685. f->slice_count = f->max_slice_count;
  686. } else if (f->version < 3) {
  687. f->slice_count = get_symbol(c, state, 0);
  688. } else {
  689. const uint8_t *p = c->bytestream_end;
  690. for (f->slice_count = 0;
  691. f->slice_count < MAX_SLICES && 3 < p - c->bytestream_start;
  692. f->slice_count++) {
  693. int trailer = 3 + 5*!!f->ec;
  694. int size = AV_RB24(p-trailer);
  695. if (size + trailer > p - c->bytestream_start)
  696. break;
  697. p -= size + trailer;
  698. }
  699. }
  700. if (f->slice_count > (unsigned)MAX_SLICES || f->slice_count <= 0 || f->slice_count > f->max_slice_count) {
  701. av_log(f->avctx, AV_LOG_ERROR, "slice count %d is invalid (max=%d)\n", f->slice_count, f->max_slice_count);
  702. return AVERROR_INVALIDDATA;
  703. }
  704. for (j = 0; j < f->slice_count; j++) {
  705. FFV1Context *fs = f->slice_context[j];
  706. fs->ac = f->ac;
  707. fs->packed_at_lsb = f->packed_at_lsb;
  708. fs->slice_damaged = 0;
  709. if (f->version == 2) {
  710. fs->slice_x = get_symbol(c, state, 0) * f->width ;
  711. fs->slice_y = get_symbol(c, state, 0) * f->height;
  712. fs->slice_width = (get_symbol(c, state, 0) + 1) * f->width + fs->slice_x;
  713. fs->slice_height = (get_symbol(c, state, 0) + 1) * f->height + fs->slice_y;
  714. fs->slice_x /= f->num_h_slices;
  715. fs->slice_y /= f->num_v_slices;
  716. fs->slice_width = fs->slice_width / f->num_h_slices - fs->slice_x;
  717. fs->slice_height = fs->slice_height / f->num_v_slices - fs->slice_y;
  718. if ((unsigned)fs->slice_width > f->width ||
  719. (unsigned)fs->slice_height > f->height)
  720. return AVERROR_INVALIDDATA;
  721. if ( (unsigned)fs->slice_x + (uint64_t)fs->slice_width > f->width
  722. || (unsigned)fs->slice_y + (uint64_t)fs->slice_height > f->height)
  723. return AVERROR_INVALIDDATA;
  724. }
  725. for (i = 0; i < f->plane_count; i++) {
  726. PlaneContext *const p = &fs->plane[i];
  727. if (f->version == 2) {
  728. int idx = get_symbol(c, state, 0);
  729. if (idx > (unsigned)f->quant_table_count) {
  730. av_log(f->avctx, AV_LOG_ERROR,
  731. "quant_table_index out of range\n");
  732. return AVERROR_INVALIDDATA;
  733. }
  734. p->quant_table_index = idx;
  735. memcpy(p->quant_table, f->quant_tables[idx],
  736. sizeof(p->quant_table));
  737. context_count = f->context_count[idx];
  738. } else {
  739. memcpy(p->quant_table, f->quant_table, sizeof(p->quant_table));
  740. }
  741. if (f->version <= 2) {
  742. av_assert0(context_count >= 0);
  743. if (p->context_count < context_count) {
  744. av_freep(&p->state);
  745. av_freep(&p->vlc_state);
  746. }
  747. p->context_count = context_count;
  748. }
  749. }
  750. }
  751. return 0;
  752. }
  753. static av_cold int decode_init(AVCodecContext *avctx)
  754. {
  755. FFV1Context *f = avctx->priv_data;
  756. int ret;
  757. if ((ret = ffv1_common_init(avctx)) < 0)
  758. return ret;
  759. if (avctx->extradata && (ret = read_extra_header(f)) < 0)
  760. return ret;
  761. if ((ret = ffv1_init_slice_contexts(f)) < 0)
  762. return ret;
  763. avctx->internal->allocate_progress = 1;
  764. return 0;
  765. }
  766. static int decode_frame(AVCodecContext *avctx, void *data, int *got_frame, AVPacket *avpkt)
  767. {
  768. const uint8_t *buf = avpkt->data;
  769. int buf_size = avpkt->size;
  770. FFV1Context *f = avctx->priv_data;
  771. RangeCoder *const c = &f->slice_context[0]->c;
  772. int i, ret;
  773. uint8_t keystate = 128;
  774. const uint8_t *buf_p;
  775. AVFrame *p;
  776. if (f->last_picture.f)
  777. ff_thread_release_buffer(avctx, &f->last_picture);
  778. FFSWAP(ThreadFrame, f->picture, f->last_picture);
  779. f->cur = p = f->picture.f;
  780. if (f->version < 3 && avctx->field_order > AV_FIELD_PROGRESSIVE) {
  781. /* we have interlaced material flagged in container */
  782. p->interlaced_frame = 1;
  783. if (avctx->field_order == AV_FIELD_TT || avctx->field_order == AV_FIELD_TB)
  784. p->top_field_first = 1;
  785. }
  786. f->avctx = avctx;
  787. ff_init_range_decoder(c, buf, buf_size);
  788. ff_build_rac_states(c, 0.05 * (1LL << 32), 256 - 8);
  789. p->pict_type = AV_PICTURE_TYPE_I; //FIXME I vs. P
  790. if (get_rac(c, &keystate)) {
  791. p->key_frame = 1;
  792. f->key_frame_ok = 0;
  793. if ((ret = read_header(f)) < 0)
  794. return ret;
  795. f->key_frame_ok = 1;
  796. } else {
  797. if (!f->key_frame_ok) {
  798. av_log(avctx, AV_LOG_ERROR,
  799. "Cannot decode non-keyframe without valid keyframe\n");
  800. return AVERROR_INVALIDDATA;
  801. }
  802. p->key_frame = 0;
  803. }
  804. if ((ret = ff_thread_get_buffer(avctx, &f->picture, AV_GET_BUFFER_FLAG_REF)) < 0)
  805. return ret;
  806. if (avctx->debug & FF_DEBUG_PICT_INFO)
  807. av_log(avctx, AV_LOG_DEBUG, "ver:%d keyframe:%d coder:%d ec:%d slices:%d bps:%d\n",
  808. f->version, p->key_frame, f->ac, f->ec, f->slice_count, f->avctx->bits_per_raw_sample);
  809. ff_thread_finish_setup(avctx);
  810. buf_p = buf + buf_size;
  811. for (i = f->slice_count - 1; i >= 0; i--) {
  812. FFV1Context *fs = f->slice_context[i];
  813. int trailer = 3 + 5*!!f->ec;
  814. int v;
  815. if (i || f->version > 2) v = AV_RB24(buf_p-trailer) + trailer;
  816. else v = buf_p - c->bytestream_start;
  817. if (buf_p - c->bytestream_start < v) {
  818. av_log(avctx, AV_LOG_ERROR, "Slice pointer chain broken\n");
  819. ff_thread_report_progress(&f->picture, INT_MAX, 0);
  820. return AVERROR_INVALIDDATA;
  821. }
  822. buf_p -= v;
  823. if (f->ec) {
  824. unsigned crc = av_crc(av_crc_get_table(AV_CRC_32_IEEE), 0, buf_p, v);
  825. if (crc) {
  826. int64_t ts = avpkt->pts != AV_NOPTS_VALUE ? avpkt->pts : avpkt->dts;
  827. av_log(f->avctx, AV_LOG_ERROR, "CRC mismatch %X!", crc);
  828. if (ts != AV_NOPTS_VALUE && avctx->pkt_timebase.num) {
  829. av_log(f->avctx, AV_LOG_ERROR, "at %f seconds\n", ts*av_q2d(avctx->pkt_timebase));
  830. } else if (ts != AV_NOPTS_VALUE) {
  831. av_log(f->avctx, AV_LOG_ERROR, "at %"PRId64"\n", ts);
  832. } else {
  833. av_log(f->avctx, AV_LOG_ERROR, "\n");
  834. }
  835. fs->slice_damaged = 1;
  836. }
  837. }
  838. if (i) {
  839. ff_init_range_decoder(&fs->c, buf_p, v);
  840. } else
  841. fs->c.bytestream_end = (uint8_t *)(buf_p + v);
  842. fs->avctx = avctx;
  843. fs->cur = p;
  844. }
  845. avctx->execute(avctx,
  846. decode_slice,
  847. &f->slice_context[0],
  848. NULL,
  849. f->slice_count,
  850. sizeof(void*));
  851. for (i = f->slice_count - 1; i >= 0; i--) {
  852. FFV1Context *fs = f->slice_context[i];
  853. int j;
  854. if (fs->slice_damaged && f->last_picture.f->data[0]) {
  855. const uint8_t *src[4];
  856. uint8_t *dst[4];
  857. ff_thread_await_progress(&f->last_picture, INT_MAX, 0);
  858. for (j = 0; j < 4; j++) {
  859. int sh = (j == 1 || j == 2) ? f->chroma_h_shift : 0;
  860. int sv = (j == 1 || j == 2) ? f->chroma_v_shift : 0;
  861. dst[j] = p->data[j] + p->linesize[j] *
  862. (fs->slice_y >> sv) + (fs->slice_x >> sh);
  863. src[j] = f->last_picture.f->data[j] + f->last_picture.f->linesize[j] *
  864. (fs->slice_y >> sv) + (fs->slice_x >> sh);
  865. }
  866. av_image_copy(dst, p->linesize, (const uint8_t **)src,
  867. f->last_picture.f->linesize,
  868. avctx->pix_fmt,
  869. fs->slice_width,
  870. fs->slice_height);
  871. }
  872. }
  873. ff_thread_report_progress(&f->picture, INT_MAX, 0);
  874. f->picture_number++;
  875. if (f->last_picture.f)
  876. ff_thread_release_buffer(avctx, &f->last_picture);
  877. f->cur = NULL;
  878. if ((ret = av_frame_ref(data, f->picture.f)) < 0)
  879. return ret;
  880. *got_frame = 1;
  881. return buf_size;
  882. }
  883. static int init_thread_copy(AVCodecContext *avctx)
  884. {
  885. FFV1Context *f = avctx->priv_data;
  886. int i, ret;
  887. f->picture.f = NULL;
  888. f->last_picture.f = NULL;
  889. f->sample_buffer = NULL;
  890. f->max_slice_count = 0;
  891. f->slice_count = 0;
  892. for (i = 0; i < f->quant_table_count; i++) {
  893. av_assert0(f->version > 1);
  894. f->initial_states[i] = av_memdup(f->initial_states[i],
  895. f->context_count[i] * sizeof(*f->initial_states[i]));
  896. }
  897. f->picture.f = av_frame_alloc();
  898. f->last_picture.f = av_frame_alloc();
  899. if ((ret = ffv1_init_slice_contexts(f)) < 0)
  900. return ret;
  901. return 0;
  902. }
  903. static void copy_fields(FFV1Context *fsdst, FFV1Context *fssrc, FFV1Context *fsrc)
  904. {
  905. fsdst->version = fsrc->version;
  906. fsdst->micro_version = fsrc->micro_version;
  907. fsdst->chroma_planes = fsrc->chroma_planes;
  908. fsdst->chroma_h_shift = fsrc->chroma_h_shift;
  909. fsdst->chroma_v_shift = fsrc->chroma_v_shift;
  910. fsdst->transparency = fsrc->transparency;
  911. fsdst->plane_count = fsrc->plane_count;
  912. fsdst->ac = fsrc->ac;
  913. fsdst->colorspace = fsrc->colorspace;
  914. fsdst->ec = fsrc->ec;
  915. fsdst->intra = fsrc->intra;
  916. fsdst->slice_damaged = fssrc->slice_damaged;
  917. fsdst->key_frame_ok = fsrc->key_frame_ok;
  918. fsdst->bits_per_raw_sample = fsrc->bits_per_raw_sample;
  919. fsdst->packed_at_lsb = fsrc->packed_at_lsb;
  920. fsdst->slice_count = fsrc->slice_count;
  921. if (fsrc->version<3){
  922. fsdst->slice_x = fssrc->slice_x;
  923. fsdst->slice_y = fssrc->slice_y;
  924. fsdst->slice_width = fssrc->slice_width;
  925. fsdst->slice_height = fssrc->slice_height;
  926. }
  927. }
  928. static int update_thread_context(AVCodecContext *dst, const AVCodecContext *src)
  929. {
  930. FFV1Context *fsrc = src->priv_data;
  931. FFV1Context *fdst = dst->priv_data;
  932. int i, ret;
  933. if (dst == src)
  934. return 0;
  935. {
  936. FFV1Context bak = *fdst;
  937. memcpy(fdst, fsrc, sizeof(*fdst));
  938. memcpy(fdst->initial_states, bak.initial_states, sizeof(fdst->initial_states));
  939. memcpy(fdst->slice_context, bak.slice_context , sizeof(fdst->slice_context));
  940. fdst->picture = bak.picture;
  941. fdst->last_picture = bak.last_picture;
  942. for (i = 0; i<fdst->num_h_slices * fdst->num_v_slices; i++) {
  943. FFV1Context *fssrc = fsrc->slice_context[i];
  944. FFV1Context *fsdst = fdst->slice_context[i];
  945. copy_fields(fsdst, fssrc, fsrc);
  946. }
  947. av_assert0(!fdst->plane[0].state);
  948. av_assert0(!fdst->sample_buffer);
  949. }
  950. av_assert1(fdst->max_slice_count == fsrc->max_slice_count);
  951. ff_thread_release_buffer(dst, &fdst->picture);
  952. if (fsrc->picture.f->data[0]) {
  953. if ((ret = ff_thread_ref_frame(&fdst->picture, &fsrc->picture)) < 0)
  954. return ret;
  955. }
  956. fdst->fsrc = fsrc;
  957. return 0;
  958. }
  959. AVCodec ff_ffv1_decoder = {
  960. .name = "ffv1",
  961. .long_name = NULL_IF_CONFIG_SMALL("FFmpeg video codec #1"),
  962. .type = AVMEDIA_TYPE_VIDEO,
  963. .id = AV_CODEC_ID_FFV1,
  964. .priv_data_size = sizeof(FFV1Context),
  965. .init = decode_init,
  966. .close = ffv1_close,
  967. .decode = decode_frame,
  968. .init_thread_copy = ONLY_IF_THREADS_ENABLED(init_thread_copy),
  969. .update_thread_context = ONLY_IF_THREADS_ENABLED(update_thread_context),
  970. .capabilities = CODEC_CAP_DR1 /*| CODEC_CAP_DRAW_HORIZ_BAND*/ |
  971. CODEC_CAP_FRAME_THREADS | CODEC_CAP_SLICE_THREADS,
  972. };