You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1117 lines
39KB

  1. /*
  2. * FFV1 decoder
  3. *
  4. * Copyright (c) 2003-2013 Michael Niedermayer <michaelni@gmx.at>
  5. *
  6. * This file is part of FFmpeg.
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with FFmpeg; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. /**
  23. * @file
  24. * FF Video Codec 1 (a lossless codec) decoder
  25. */
  26. #include "libavutil/avassert.h"
  27. #include "libavutil/crc.h"
  28. #include "libavutil/opt.h"
  29. #include "libavutil/imgutils.h"
  30. #include "libavutil/pixdesc.h"
  31. #include "libavutil/timer.h"
  32. #include "avcodec.h"
  33. #include "internal.h"
  34. #include "get_bits.h"
  35. #include "rangecoder.h"
  36. #include "golomb.h"
  37. #include "mathops.h"
  38. #include "ffv1.h"
  39. static inline av_flatten int get_symbol_inline(RangeCoder *c, uint8_t *state,
  40. int is_signed)
  41. {
  42. if (get_rac(c, state + 0))
  43. return 0;
  44. else {
  45. int i, e, a;
  46. e = 0;
  47. while (get_rac(c, state + 1 + FFMIN(e, 9))) { // 1..10
  48. e++;
  49. if (e > 31)
  50. return AVERROR_INVALIDDATA;
  51. }
  52. a = 1;
  53. for (i = e - 1; i >= 0; i--)
  54. a += a + get_rac(c, state + 22 + FFMIN(i, 9)); // 22..31
  55. e = -(is_signed && get_rac(c, state + 11 + FFMIN(e, 10))); // 11..21
  56. return (a ^ e) - e;
  57. }
  58. }
  59. static av_noinline int get_symbol(RangeCoder *c, uint8_t *state, int is_signed)
  60. {
  61. return get_symbol_inline(c, state, is_signed);
  62. }
  63. static inline int get_vlc_symbol(GetBitContext *gb, VlcState *const state,
  64. int bits)
  65. {
  66. int k, i, v, ret;
  67. i = state->count;
  68. k = 0;
  69. while (i < state->error_sum) { // FIXME: optimize
  70. k++;
  71. i += i;
  72. }
  73. v = get_sr_golomb(gb, k, 12, bits);
  74. av_dlog(NULL, "v:%d bias:%d error:%d drift:%d count:%d k:%d",
  75. v, state->bias, state->error_sum, state->drift, state->count, k);
  76. #if 0 // JPEG LS
  77. if (k == 0 && 2 * state->drift <= -state->count)
  78. v ^= (-1);
  79. #else
  80. v ^= ((2 * state->drift + state->count) >> 31);
  81. #endif
  82. ret = fold(v + state->bias, bits);
  83. update_vlc_state(state, v);
  84. return ret;
  85. }
  86. static av_always_inline void decode_line(FFV1Context *s, int w,
  87. int16_t *sample[2],
  88. int plane_index, int bits)
  89. {
  90. PlaneContext *const p = &s->plane[plane_index];
  91. RangeCoder *const c = &s->c;
  92. int x;
  93. int run_count = 0;
  94. int run_mode = 0;
  95. int run_index = s->run_index;
  96. if (s->slice_coding_mode == 1) {
  97. int i;
  98. for (x = 0; x < w; x++) {
  99. int v = 0;
  100. for (i=0; i<bits; i++) {
  101. uint8_t state = 128;
  102. v += v + get_rac(c, &state);
  103. }
  104. sample[1][x] = v;
  105. }
  106. return;
  107. }
  108. for (x = 0; x < w; x++) {
  109. int diff, context, sign;
  110. context = get_context(p, sample[1] + x, sample[0] + x, sample[1] + x);
  111. if (context < 0) {
  112. context = -context;
  113. sign = 1;
  114. } else
  115. sign = 0;
  116. av_assert2(context < p->context_count);
  117. if (s->ac) {
  118. diff = get_symbol_inline(c, p->state[context], 1);
  119. } else {
  120. if (context == 0 && run_mode == 0)
  121. run_mode = 1;
  122. if (run_mode) {
  123. if (run_count == 0 && run_mode == 1) {
  124. if (get_bits1(&s->gb)) {
  125. run_count = 1 << ff_log2_run[run_index];
  126. if (x + run_count <= w)
  127. run_index++;
  128. } else {
  129. if (ff_log2_run[run_index])
  130. run_count = get_bits(&s->gb, ff_log2_run[run_index]);
  131. else
  132. run_count = 0;
  133. if (run_index)
  134. run_index--;
  135. run_mode = 2;
  136. }
  137. }
  138. run_count--;
  139. if (run_count < 0) {
  140. run_mode = 0;
  141. run_count = 0;
  142. diff = get_vlc_symbol(&s->gb, &p->vlc_state[context],
  143. bits);
  144. if (diff >= 0)
  145. diff++;
  146. } else
  147. diff = 0;
  148. } else
  149. diff = get_vlc_symbol(&s->gb, &p->vlc_state[context], bits);
  150. av_dlog(s->avctx, "count:%d index:%d, mode:%d, x:%d pos:%d\n",
  151. run_count, run_index, run_mode, x, get_bits_count(&s->gb));
  152. }
  153. if (sign)
  154. diff = -diff;
  155. sample[1][x] = (predict(sample[1] + x, sample[0] + x) + diff) &
  156. ((1 << bits) - 1);
  157. }
  158. s->run_index = run_index;
  159. }
  160. static void decode_plane(FFV1Context *s, uint8_t *src,
  161. int w, int h, int stride, int plane_index)
  162. {
  163. int x, y;
  164. int16_t *sample[2];
  165. sample[0] = s->sample_buffer + 3;
  166. sample[1] = s->sample_buffer + w + 6 + 3;
  167. s->run_index = 0;
  168. memset(s->sample_buffer, 0, 2 * (w + 6) * sizeof(*s->sample_buffer));
  169. for (y = 0; y < h; y++) {
  170. int16_t *temp = sample[0]; // FIXME: try a normal buffer
  171. sample[0] = sample[1];
  172. sample[1] = temp;
  173. sample[1][-1] = sample[0][0];
  174. sample[0][w] = sample[0][w - 1];
  175. // { START_TIMER
  176. if (s->avctx->bits_per_raw_sample <= 8) {
  177. decode_line(s, w, sample, plane_index, 8);
  178. for (x = 0; x < w; x++)
  179. src[x + stride * y] = sample[1][x];
  180. } else {
  181. decode_line(s, w, sample, plane_index, s->avctx->bits_per_raw_sample);
  182. if (s->packed_at_lsb) {
  183. for (x = 0; x < w; x++) {
  184. ((uint16_t*)(src + stride*y))[x] = sample[1][x];
  185. }
  186. } else {
  187. for (x = 0; x < w; x++) {
  188. ((uint16_t*)(src + stride*y))[x] = sample[1][x] << (16 - s->avctx->bits_per_raw_sample);
  189. }
  190. }
  191. }
  192. // STOP_TIMER("decode-line") }
  193. }
  194. }
  195. static void decode_rgb_frame(FFV1Context *s, uint8_t *src[3], int w, int h, int stride[3])
  196. {
  197. int x, y, p;
  198. int16_t *sample[4][2];
  199. int lbd = s->avctx->bits_per_raw_sample <= 8;
  200. int bits = s->avctx->bits_per_raw_sample > 0 ? s->avctx->bits_per_raw_sample : 8;
  201. int offset = 1 << bits;
  202. for (x = 0; x < 4; x++) {
  203. sample[x][0] = s->sample_buffer + x * 2 * (w + 6) + 3;
  204. sample[x][1] = s->sample_buffer + (x * 2 + 1) * (w + 6) + 3;
  205. }
  206. s->run_index = 0;
  207. memset(s->sample_buffer, 0, 8 * (w + 6) * sizeof(*s->sample_buffer));
  208. for (y = 0; y < h; y++) {
  209. for (p = 0; p < 3 + s->transparency; p++) {
  210. int16_t *temp = sample[p][0]; // FIXME: try a normal buffer
  211. sample[p][0] = sample[p][1];
  212. sample[p][1] = temp;
  213. sample[p][1][-1]= sample[p][0][0 ];
  214. sample[p][0][ w]= sample[p][0][w-1];
  215. if (lbd && s->slice_coding_mode == 0)
  216. decode_line(s, w, sample[p], (p + 1)/2, 9);
  217. else
  218. decode_line(s, w, sample[p], (p + 1)/2, bits + (s->slice_coding_mode != 1));
  219. }
  220. for (x = 0; x < w; x++) {
  221. int g = sample[0][1][x];
  222. int b = sample[1][1][x];
  223. int r = sample[2][1][x];
  224. int a = sample[3][1][x];
  225. if (s->slice_coding_mode != 1) {
  226. b -= offset;
  227. r -= offset;
  228. g -= (b * s->slice_rct_by_coef + r * s->slice_rct_ry_coef) >> 2;
  229. b += g;
  230. r += g;
  231. }
  232. if (lbd)
  233. *((uint32_t*)(src[0] + x*4 + stride[0]*y)) = b + (g<<8) + (r<<16) + (a<<24);
  234. else {
  235. *((uint16_t*)(src[0] + x*2 + stride[0]*y)) = b;
  236. *((uint16_t*)(src[1] + x*2 + stride[1]*y)) = g;
  237. *((uint16_t*)(src[2] + x*2 + stride[2]*y)) = r;
  238. }
  239. }
  240. }
  241. }
  242. static int decode_slice_header(FFV1Context *f, FFV1Context *fs)
  243. {
  244. RangeCoder *c = &fs->c;
  245. uint8_t state[CONTEXT_SIZE];
  246. unsigned ps, i, context_count;
  247. memset(state, 128, sizeof(state));
  248. av_assert0(f->version > 2);
  249. fs->slice_x = get_symbol(c, state, 0) * f->width ;
  250. fs->slice_y = get_symbol(c, state, 0) * f->height;
  251. fs->slice_width = (get_symbol(c, state, 0) + 1) * f->width + fs->slice_x;
  252. fs->slice_height = (get_symbol(c, state, 0) + 1) * f->height + fs->slice_y;
  253. fs->slice_x /= f->num_h_slices;
  254. fs->slice_y /= f->num_v_slices;
  255. fs->slice_width = fs->slice_width /f->num_h_slices - fs->slice_x;
  256. fs->slice_height = fs->slice_height/f->num_v_slices - fs->slice_y;
  257. if ((unsigned)fs->slice_width > f->width || (unsigned)fs->slice_height > f->height)
  258. return -1;
  259. if ( (unsigned)fs->slice_x + (uint64_t)fs->slice_width > f->width
  260. || (unsigned)fs->slice_y + (uint64_t)fs->slice_height > f->height)
  261. return -1;
  262. for (i = 0; i < f->plane_count; i++) {
  263. PlaneContext * const p = &fs->plane[i];
  264. int idx = get_symbol(c, state, 0);
  265. if (idx > (unsigned)f->quant_table_count) {
  266. av_log(f->avctx, AV_LOG_ERROR, "quant_table_index out of range\n");
  267. return -1;
  268. }
  269. p->quant_table_index = idx;
  270. memcpy(p->quant_table, f->quant_tables[idx], sizeof(p->quant_table));
  271. context_count = f->context_count[idx];
  272. if (p->context_count < context_count) {
  273. av_freep(&p->state);
  274. av_freep(&p->vlc_state);
  275. }
  276. p->context_count = context_count;
  277. }
  278. ps = get_symbol(c, state, 0);
  279. if (ps == 1) {
  280. f->cur->interlaced_frame = 1;
  281. f->cur->top_field_first = 1;
  282. } else if (ps == 2) {
  283. f->cur->interlaced_frame = 1;
  284. f->cur->top_field_first = 0;
  285. } else if (ps == 3) {
  286. f->cur->interlaced_frame = 0;
  287. }
  288. f->cur->sample_aspect_ratio.num = get_symbol(c, state, 0);
  289. f->cur->sample_aspect_ratio.den = get_symbol(c, state, 0);
  290. if (av_image_check_sar(f->width, f->height,
  291. f->cur->sample_aspect_ratio) < 0) {
  292. av_log(f->avctx, AV_LOG_WARNING, "ignoring invalid SAR: %u/%u\n",
  293. f->cur->sample_aspect_ratio.num,
  294. f->cur->sample_aspect_ratio.den);
  295. f->cur->sample_aspect_ratio = (AVRational){ 0, 1 };
  296. }
  297. if (fs->version > 3) {
  298. fs->slice_reset_contexts = get_rac(c, state);
  299. fs->slice_coding_mode = get_symbol(c, state, 0);
  300. if (fs->slice_coding_mode != 1) {
  301. fs->slice_rct_by_coef = get_symbol(c, state, 0);
  302. fs->slice_rct_ry_coef = get_symbol(c, state, 0);
  303. if ((uint64_t)fs->slice_rct_by_coef + (uint64_t)fs->slice_rct_ry_coef > 4) {
  304. av_log(f->avctx, AV_LOG_ERROR, "slice_rct_y_coef out of range\n");
  305. return AVERROR_INVALIDDATA;
  306. }
  307. }
  308. }
  309. return 0;
  310. }
  311. static int decode_slice(AVCodecContext *c, void *arg)
  312. {
  313. FFV1Context *fs = *(void **)arg;
  314. FFV1Context *f = fs->avctx->priv_data;
  315. int width, height, x, y, ret;
  316. const int ps = av_pix_fmt_desc_get(c->pix_fmt)->comp[0].step_minus1 + 1;
  317. AVFrame * const p = f->cur;
  318. int i, si;
  319. for( si=0; fs != f->slice_context[si]; si ++)
  320. ;
  321. if(f->fsrc && !p->key_frame)
  322. ff_thread_await_progress(&f->last_picture, si, 0);
  323. if(f->fsrc && !p->key_frame) {
  324. FFV1Context *fssrc = f->fsrc->slice_context[si];
  325. FFV1Context *fsdst = f->slice_context[si];
  326. av_assert1(fsdst->plane_count == fssrc->plane_count);
  327. av_assert1(fsdst == fs);
  328. if (!p->key_frame)
  329. fsdst->slice_damaged |= fssrc->slice_damaged;
  330. for (i = 0; i < f->plane_count; i++) {
  331. PlaneContext *psrc = &fssrc->plane[i];
  332. PlaneContext *pdst = &fsdst->plane[i];
  333. av_free(pdst->state);
  334. av_free(pdst->vlc_state);
  335. memcpy(pdst, psrc, sizeof(*pdst));
  336. pdst->state = NULL;
  337. pdst->vlc_state = NULL;
  338. if (fssrc->ac) {
  339. pdst->state = av_malloc_array(CONTEXT_SIZE, psrc->context_count);
  340. memcpy(pdst->state, psrc->state, CONTEXT_SIZE * psrc->context_count);
  341. } else {
  342. pdst->vlc_state = av_malloc_array(sizeof(*pdst->vlc_state), psrc->context_count);
  343. memcpy(pdst->vlc_state, psrc->vlc_state, sizeof(*pdst->vlc_state) * psrc->context_count);
  344. }
  345. }
  346. }
  347. fs->slice_rct_by_coef = 1;
  348. fs->slice_rct_ry_coef = 1;
  349. if (f->version > 2) {
  350. if (ffv1_init_slice_state(f, fs) < 0)
  351. return AVERROR(ENOMEM);
  352. if (decode_slice_header(f, fs) < 0) {
  353. fs->slice_damaged = 1;
  354. return AVERROR_INVALIDDATA;
  355. }
  356. }
  357. if ((ret = ffv1_init_slice_state(f, fs)) < 0)
  358. return ret;
  359. if (f->cur->key_frame || fs->slice_reset_contexts)
  360. ffv1_clear_slice_state(f, fs);
  361. width = fs->slice_width;
  362. height = fs->slice_height;
  363. x = fs->slice_x;
  364. y = fs->slice_y;
  365. if (!fs->ac) {
  366. if (f->version == 3 && f->micro_version > 1 || f->version > 3)
  367. get_rac(&fs->c, (uint8_t[]) { 129 });
  368. fs->ac_byte_count = f->version > 2 || (!x && !y) ? fs->c.bytestream - fs->c.bytestream_start - 1 : 0;
  369. init_get_bits(&fs->gb,
  370. fs->c.bytestream_start + fs->ac_byte_count,
  371. (fs->c.bytestream_end - fs->c.bytestream_start - fs->ac_byte_count) * 8);
  372. }
  373. av_assert1(width && height);
  374. if (f->colorspace == 0) {
  375. const int chroma_width = FF_CEIL_RSHIFT(width, f->chroma_h_shift);
  376. const int chroma_height = FF_CEIL_RSHIFT(height, f->chroma_v_shift);
  377. const int cx = x >> f->chroma_h_shift;
  378. const int cy = y >> f->chroma_v_shift;
  379. decode_plane(fs, p->data[0] + ps*x + y*p->linesize[0], width, height, p->linesize[0], 0);
  380. if (f->chroma_planes) {
  381. decode_plane(fs, p->data[1] + ps*cx+cy*p->linesize[1], chroma_width, chroma_height, p->linesize[1], 1);
  382. decode_plane(fs, p->data[2] + ps*cx+cy*p->linesize[2], chroma_width, chroma_height, p->linesize[2], 1);
  383. }
  384. if (fs->transparency)
  385. decode_plane(fs, p->data[3] + ps*x + y*p->linesize[3], width, height, p->linesize[3], 2);
  386. } else {
  387. uint8_t *planes[3] = { p->data[0] + ps * x + y * p->linesize[0],
  388. p->data[1] + ps * x + y * p->linesize[1],
  389. p->data[2] + ps * x + y * p->linesize[2] };
  390. decode_rgb_frame(fs, planes, width, height, p->linesize);
  391. }
  392. if (fs->ac && f->version > 2) {
  393. int v;
  394. get_rac(&fs->c, (uint8_t[]) { 129 });
  395. v = fs->c.bytestream_end - fs->c.bytestream - 2 - 5*f->ec;
  396. if (v) {
  397. av_log(f->avctx, AV_LOG_ERROR, "bytestream end mismatching by %d\n", v);
  398. fs->slice_damaged = 1;
  399. }
  400. }
  401. emms_c();
  402. ff_thread_report_progress(&f->picture, si, 0);
  403. return 0;
  404. }
  405. static int read_quant_table(RangeCoder *c, int16_t *quant_table, int scale)
  406. {
  407. int v;
  408. int i = 0;
  409. uint8_t state[CONTEXT_SIZE];
  410. memset(state, 128, sizeof(state));
  411. for (v = 0; i < 128; v++) {
  412. unsigned len = get_symbol(c, state, 0) + 1;
  413. if (len > 128 - i)
  414. return AVERROR_INVALIDDATA;
  415. while (len--) {
  416. quant_table[i] = scale * v;
  417. i++;
  418. }
  419. }
  420. for (i = 1; i < 128; i++)
  421. quant_table[256 - i] = -quant_table[i];
  422. quant_table[128] = -quant_table[127];
  423. return 2 * v - 1;
  424. }
  425. static int read_quant_tables(RangeCoder *c,
  426. int16_t quant_table[MAX_CONTEXT_INPUTS][256])
  427. {
  428. int i;
  429. int context_count = 1;
  430. for (i = 0; i < 5; i++) {
  431. int ret = read_quant_table(c, quant_table[i], context_count);
  432. if (ret < 0)
  433. return ret;
  434. context_count *= ret;
  435. if (context_count > 32768U) {
  436. return AVERROR_INVALIDDATA;
  437. }
  438. }
  439. return (context_count + 1) / 2;
  440. }
  441. static int read_extra_header(FFV1Context *f)
  442. {
  443. RangeCoder *const c = &f->c;
  444. uint8_t state[CONTEXT_SIZE];
  445. int i, j, k, ret;
  446. uint8_t state2[32][CONTEXT_SIZE];
  447. memset(state2, 128, sizeof(state2));
  448. memset(state, 128, sizeof(state));
  449. ff_init_range_decoder(c, f->avctx->extradata, f->avctx->extradata_size);
  450. ff_build_rac_states(c, 0.05 * (1LL << 32), 256 - 8);
  451. f->version = get_symbol(c, state, 0);
  452. if (f->version < 2) {
  453. av_log(f->avctx, AV_LOG_ERROR, "Invalid version in global header\n");
  454. return AVERROR_INVALIDDATA;
  455. }
  456. if (f->version > 2) {
  457. c->bytestream_end -= 4;
  458. f->micro_version = get_symbol(c, state, 0);
  459. }
  460. f->ac = f->avctx->coder_type = get_symbol(c, state, 0);
  461. if (f->ac > 1) {
  462. for (i = 1; i < 256; i++)
  463. f->state_transition[i] = get_symbol(c, state, 1) + c->one_state[i];
  464. }
  465. f->colorspace = get_symbol(c, state, 0); //YUV cs type
  466. f->avctx->bits_per_raw_sample = get_symbol(c, state, 0);
  467. f->chroma_planes = get_rac(c, state);
  468. f->chroma_h_shift = get_symbol(c, state, 0);
  469. f->chroma_v_shift = get_symbol(c, state, 0);
  470. f->transparency = get_rac(c, state);
  471. f->plane_count = 1 + (f->chroma_planes || f->version<4) + f->transparency;
  472. f->num_h_slices = 1 + get_symbol(c, state, 0);
  473. f->num_v_slices = 1 + get_symbol(c, state, 0);
  474. if (f->chroma_h_shift > 4U || f->chroma_v_shift > 4U) {
  475. av_log(f->avctx, AV_LOG_ERROR, "chroma shift parameters %d %d are invalid\n",
  476. f->chroma_h_shift, f->chroma_v_shift);
  477. return AVERROR_INVALIDDATA;
  478. }
  479. if (f->num_h_slices > (unsigned)f->width || !f->num_h_slices ||
  480. f->num_v_slices > (unsigned)f->height || !f->num_v_slices
  481. ) {
  482. av_log(f->avctx, AV_LOG_ERROR, "slice count invalid\n");
  483. return AVERROR_INVALIDDATA;
  484. }
  485. f->quant_table_count = get_symbol(c, state, 0);
  486. if (f->quant_table_count > (unsigned)MAX_QUANT_TABLES)
  487. return AVERROR_INVALIDDATA;
  488. for (i = 0; i < f->quant_table_count; i++) {
  489. f->context_count[i] = read_quant_tables(c, f->quant_tables[i]);
  490. if (f->context_count[i] < 0) {
  491. av_log(f->avctx, AV_LOG_ERROR, "read_quant_table error\n");
  492. return AVERROR_INVALIDDATA;
  493. }
  494. }
  495. if ((ret = ffv1_allocate_initial_states(f)) < 0)
  496. return ret;
  497. for (i = 0; i < f->quant_table_count; i++)
  498. if (get_rac(c, state)) {
  499. for (j = 0; j < f->context_count[i]; j++)
  500. for (k = 0; k < CONTEXT_SIZE; k++) {
  501. int pred = j ? f->initial_states[i][j - 1][k] : 128;
  502. f->initial_states[i][j][k] =
  503. (pred + get_symbol(c, state2[k], 1)) & 0xFF;
  504. }
  505. }
  506. if (f->version > 2) {
  507. f->ec = get_symbol(c, state, 0);
  508. if (f->micro_version > 2)
  509. f->intra = get_symbol(c, state, 0);
  510. }
  511. if (f->version > 2) {
  512. unsigned v;
  513. v = av_crc(av_crc_get_table(AV_CRC_32_IEEE), 0,
  514. f->avctx->extradata, f->avctx->extradata_size);
  515. if (v) {
  516. av_log(f->avctx, AV_LOG_ERROR, "CRC mismatch %X!\n", v);
  517. return AVERROR_INVALIDDATA;
  518. }
  519. }
  520. if (f->avctx->debug & FF_DEBUG_PICT_INFO)
  521. av_log(f->avctx, AV_LOG_DEBUG,
  522. "global: ver:%d.%d, coder:%d, colorspace: %d bpr:%d chroma:%d(%d:%d), alpha:%d slices:%dx%d qtabs:%d ec:%d intra:%d\n",
  523. f->version, f->micro_version,
  524. f->ac,
  525. f->colorspace,
  526. f->avctx->bits_per_raw_sample,
  527. f->chroma_planes, f->chroma_h_shift, f->chroma_v_shift,
  528. f->transparency,
  529. f->num_h_slices, f->num_v_slices,
  530. f->quant_table_count,
  531. f->ec,
  532. f->intra
  533. );
  534. return 0;
  535. }
  536. static int read_header(FFV1Context *f)
  537. {
  538. uint8_t state[CONTEXT_SIZE];
  539. int i, j, context_count = -1; //-1 to avoid warning
  540. RangeCoder *const c = &f->slice_context[0]->c;
  541. memset(state, 128, sizeof(state));
  542. if (f->version < 2) {
  543. int chroma_planes, chroma_h_shift, chroma_v_shift, transparency, colorspace, bits_per_raw_sample;
  544. unsigned v= get_symbol(c, state, 0);
  545. if (v >= 2) {
  546. av_log(f->avctx, AV_LOG_ERROR, "invalid version %d in ver01 header\n", v);
  547. return AVERROR_INVALIDDATA;
  548. }
  549. f->version = v;
  550. f->ac = f->avctx->coder_type = get_symbol(c, state, 0);
  551. if (f->ac > 1) {
  552. for (i = 1; i < 256; i++)
  553. f->state_transition[i] = get_symbol(c, state, 1) + c->one_state[i];
  554. }
  555. colorspace = get_symbol(c, state, 0); //YUV cs type
  556. bits_per_raw_sample = f->version > 0 ? get_symbol(c, state, 0) : f->avctx->bits_per_raw_sample;
  557. chroma_planes = get_rac(c, state);
  558. chroma_h_shift = get_symbol(c, state, 0);
  559. chroma_v_shift = get_symbol(c, state, 0);
  560. transparency = get_rac(c, state);
  561. if (f->plane_count) {
  562. if (colorspace != f->colorspace ||
  563. bits_per_raw_sample != f->avctx->bits_per_raw_sample ||
  564. chroma_planes != f->chroma_planes ||
  565. chroma_h_shift != f->chroma_h_shift ||
  566. chroma_v_shift != f->chroma_v_shift ||
  567. transparency != f->transparency) {
  568. av_log(f->avctx, AV_LOG_ERROR, "Invalid change of global parameters\n");
  569. return AVERROR_INVALIDDATA;
  570. }
  571. }
  572. if (chroma_h_shift > 4U || chroma_v_shift > 4U) {
  573. av_log(f->avctx, AV_LOG_ERROR, "chroma shift parameters %d %d are invalid\n",
  574. chroma_h_shift, chroma_v_shift);
  575. return AVERROR_INVALIDDATA;
  576. }
  577. f->colorspace = colorspace;
  578. f->avctx->bits_per_raw_sample = bits_per_raw_sample;
  579. f->chroma_planes = chroma_planes;
  580. f->chroma_h_shift = chroma_h_shift;
  581. f->chroma_v_shift = chroma_v_shift;
  582. f->transparency = transparency;
  583. f->plane_count = 2 + f->transparency;
  584. }
  585. if (f->colorspace == 0) {
  586. if (f->avctx->skip_alpha) f->transparency = 0;
  587. if (!f->transparency && !f->chroma_planes) {
  588. if (f->avctx->bits_per_raw_sample <= 8)
  589. f->avctx->pix_fmt = AV_PIX_FMT_GRAY8;
  590. else
  591. f->avctx->pix_fmt = AV_PIX_FMT_GRAY16;
  592. } else if (f->avctx->bits_per_raw_sample<=8 && !f->transparency) {
  593. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  594. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P; break;
  595. case 0x01: f->avctx->pix_fmt = AV_PIX_FMT_YUV440P; break;
  596. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P; break;
  597. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P; break;
  598. case 0x20: f->avctx->pix_fmt = AV_PIX_FMT_YUV411P; break;
  599. case 0x22: f->avctx->pix_fmt = AV_PIX_FMT_YUV410P; break;
  600. }
  601. } else if (f->avctx->bits_per_raw_sample <= 8 && f->transparency) {
  602. switch(16*f->chroma_h_shift + f->chroma_v_shift) {
  603. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P; break;
  604. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P; break;
  605. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P; break;
  606. }
  607. } else if (f->avctx->bits_per_raw_sample == 9 && !f->transparency) {
  608. f->packed_at_lsb = 1;
  609. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  610. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P9; break;
  611. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P9; break;
  612. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P9; break;
  613. }
  614. } else if (f->avctx->bits_per_raw_sample == 9 && f->transparency) {
  615. f->packed_at_lsb = 1;
  616. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  617. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P9; break;
  618. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P9; break;
  619. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P9; break;
  620. }
  621. } else if (f->avctx->bits_per_raw_sample == 10 && !f->transparency) {
  622. f->packed_at_lsb = 1;
  623. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  624. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P10; break;
  625. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P10; break;
  626. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P10; break;
  627. }
  628. } else if (f->avctx->bits_per_raw_sample == 10 && f->transparency) {
  629. f->packed_at_lsb = 1;
  630. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  631. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P10; break;
  632. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P10; break;
  633. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P10; break;
  634. }
  635. } else if (f->avctx->bits_per_raw_sample == 16 && !f->transparency){
  636. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  637. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUV444P16; break;
  638. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUV422P16; break;
  639. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUV420P16; break;
  640. }
  641. } else if (f->avctx->bits_per_raw_sample == 16 && f->transparency){
  642. switch(16 * f->chroma_h_shift + f->chroma_v_shift) {
  643. case 0x00: f->avctx->pix_fmt = AV_PIX_FMT_YUVA444P16; break;
  644. case 0x10: f->avctx->pix_fmt = AV_PIX_FMT_YUVA422P16; break;
  645. case 0x11: f->avctx->pix_fmt = AV_PIX_FMT_YUVA420P16; break;
  646. }
  647. }
  648. } else if (f->colorspace == 1) {
  649. if (f->chroma_h_shift || f->chroma_v_shift) {
  650. av_log(f->avctx, AV_LOG_ERROR,
  651. "chroma subsampling not supported in this colorspace\n");
  652. return AVERROR(ENOSYS);
  653. }
  654. if ( f->avctx->bits_per_raw_sample == 9)
  655. f->avctx->pix_fmt = AV_PIX_FMT_GBRP9;
  656. else if (f->avctx->bits_per_raw_sample == 10)
  657. f->avctx->pix_fmt = AV_PIX_FMT_GBRP10;
  658. else if (f->avctx->bits_per_raw_sample == 12)
  659. f->avctx->pix_fmt = AV_PIX_FMT_GBRP12;
  660. else if (f->avctx->bits_per_raw_sample == 14)
  661. f->avctx->pix_fmt = AV_PIX_FMT_GBRP14;
  662. else
  663. if (f->transparency) f->avctx->pix_fmt = AV_PIX_FMT_RGB32;
  664. else f->avctx->pix_fmt = AV_PIX_FMT_0RGB32;
  665. } else {
  666. av_log(f->avctx, AV_LOG_ERROR, "colorspace not supported\n");
  667. return AVERROR(ENOSYS);
  668. }
  669. if (f->avctx->pix_fmt == AV_PIX_FMT_NONE) {
  670. av_log(f->avctx, AV_LOG_ERROR, "format not supported\n");
  671. return AVERROR(ENOSYS);
  672. }
  673. av_dlog(f->avctx, "%d %d %d\n",
  674. f->chroma_h_shift, f->chroma_v_shift, f->avctx->pix_fmt);
  675. if (f->version < 2) {
  676. context_count = read_quant_tables(c, f->quant_table);
  677. if (context_count < 0) {
  678. av_log(f->avctx, AV_LOG_ERROR, "read_quant_table error\n");
  679. return AVERROR_INVALIDDATA;
  680. }
  681. f->slice_count = f->max_slice_count;
  682. } else if (f->version < 3) {
  683. f->slice_count = get_symbol(c, state, 0);
  684. } else {
  685. const uint8_t *p = c->bytestream_end;
  686. for (f->slice_count = 0;
  687. f->slice_count < MAX_SLICES && 3 < p - c->bytestream_start;
  688. f->slice_count++) {
  689. int trailer = 3 + 5*!!f->ec;
  690. int size = AV_RB24(p-trailer);
  691. if (size + trailer > p - c->bytestream_start)
  692. break;
  693. p -= size + trailer;
  694. }
  695. }
  696. if (f->slice_count > (unsigned)MAX_SLICES || f->slice_count <= 0 || f->slice_count > f->max_slice_count) {
  697. av_log(f->avctx, AV_LOG_ERROR, "slice count %d is invalid (max=%d)\n", f->slice_count, f->max_slice_count);
  698. return AVERROR_INVALIDDATA;
  699. }
  700. for (j = 0; j < f->slice_count; j++) {
  701. FFV1Context *fs = f->slice_context[j];
  702. fs->ac = f->ac;
  703. fs->packed_at_lsb = f->packed_at_lsb;
  704. fs->slice_damaged = 0;
  705. if (f->version == 2) {
  706. fs->slice_x = get_symbol(c, state, 0) * f->width ;
  707. fs->slice_y = get_symbol(c, state, 0) * f->height;
  708. fs->slice_width = (get_symbol(c, state, 0) + 1) * f->width + fs->slice_x;
  709. fs->slice_height = (get_symbol(c, state, 0) + 1) * f->height + fs->slice_y;
  710. fs->slice_x /= f->num_h_slices;
  711. fs->slice_y /= f->num_v_slices;
  712. fs->slice_width = fs->slice_width / f->num_h_slices - fs->slice_x;
  713. fs->slice_height = fs->slice_height / f->num_v_slices - fs->slice_y;
  714. if ((unsigned)fs->slice_width > f->width ||
  715. (unsigned)fs->slice_height > f->height)
  716. return AVERROR_INVALIDDATA;
  717. if ( (unsigned)fs->slice_x + (uint64_t)fs->slice_width > f->width
  718. || (unsigned)fs->slice_y + (uint64_t)fs->slice_height > f->height)
  719. return AVERROR_INVALIDDATA;
  720. }
  721. for (i = 0; i < f->plane_count; i++) {
  722. PlaneContext *const p = &fs->plane[i];
  723. if (f->version == 2) {
  724. int idx = get_symbol(c, state, 0);
  725. if (idx > (unsigned)f->quant_table_count) {
  726. av_log(f->avctx, AV_LOG_ERROR,
  727. "quant_table_index out of range\n");
  728. return AVERROR_INVALIDDATA;
  729. }
  730. p->quant_table_index = idx;
  731. memcpy(p->quant_table, f->quant_tables[idx],
  732. sizeof(p->quant_table));
  733. context_count = f->context_count[idx];
  734. } else {
  735. memcpy(p->quant_table, f->quant_table, sizeof(p->quant_table));
  736. }
  737. if (f->version <= 2) {
  738. av_assert0(context_count >= 0);
  739. if (p->context_count < context_count) {
  740. av_freep(&p->state);
  741. av_freep(&p->vlc_state);
  742. }
  743. p->context_count = context_count;
  744. }
  745. }
  746. }
  747. return 0;
  748. }
  749. static av_cold int decode_init(AVCodecContext *avctx)
  750. {
  751. FFV1Context *f = avctx->priv_data;
  752. int ret;
  753. if ((ret = ffv1_common_init(avctx)) < 0)
  754. return ret;
  755. if (avctx->extradata && (ret = read_extra_header(f)) < 0)
  756. return ret;
  757. if ((ret = ffv1_init_slice_contexts(f)) < 0)
  758. return ret;
  759. avctx->internal->allocate_progress = 1;
  760. return 0;
  761. }
  762. static int decode_frame(AVCodecContext *avctx, void *data, int *got_frame, AVPacket *avpkt)
  763. {
  764. const uint8_t *buf = avpkt->data;
  765. int buf_size = avpkt->size;
  766. FFV1Context *f = avctx->priv_data;
  767. RangeCoder *const c = &f->slice_context[0]->c;
  768. int i, ret;
  769. uint8_t keystate = 128;
  770. const uint8_t *buf_p;
  771. AVFrame *p;
  772. if (f->last_picture.f)
  773. ff_thread_release_buffer(avctx, &f->last_picture);
  774. FFSWAP(ThreadFrame, f->picture, f->last_picture);
  775. f->cur = p = f->picture.f;
  776. if (f->version < 3 && avctx->field_order > AV_FIELD_PROGRESSIVE) {
  777. /* we have interlaced material flagged in container */
  778. p->interlaced_frame = 1;
  779. if (avctx->field_order == AV_FIELD_TT || avctx->field_order == AV_FIELD_TB)
  780. p->top_field_first = 1;
  781. }
  782. f->avctx = avctx;
  783. ff_init_range_decoder(c, buf, buf_size);
  784. ff_build_rac_states(c, 0.05 * (1LL << 32), 256 - 8);
  785. p->pict_type = AV_PICTURE_TYPE_I; //FIXME I vs. P
  786. if (get_rac(c, &keystate)) {
  787. p->key_frame = 1;
  788. f->key_frame_ok = 0;
  789. if ((ret = read_header(f)) < 0)
  790. return ret;
  791. f->key_frame_ok = 1;
  792. } else {
  793. if (!f->key_frame_ok) {
  794. av_log(avctx, AV_LOG_ERROR,
  795. "Cannot decode non-keyframe without valid keyframe\n");
  796. return AVERROR_INVALIDDATA;
  797. }
  798. p->key_frame = 0;
  799. }
  800. if ((ret = ff_thread_get_buffer(avctx, &f->picture, AV_GET_BUFFER_FLAG_REF)) < 0)
  801. return ret;
  802. if (avctx->debug & FF_DEBUG_PICT_INFO)
  803. av_log(avctx, AV_LOG_DEBUG, "ver:%d keyframe:%d coder:%d ec:%d slices:%d bps:%d\n",
  804. f->version, p->key_frame, f->ac, f->ec, f->slice_count, f->avctx->bits_per_raw_sample);
  805. ff_thread_finish_setup(avctx);
  806. buf_p = buf + buf_size;
  807. for (i = f->slice_count - 1; i >= 0; i--) {
  808. FFV1Context *fs = f->slice_context[i];
  809. int trailer = 3 + 5*!!f->ec;
  810. int v;
  811. if (i || f->version > 2) v = AV_RB24(buf_p-trailer) + trailer;
  812. else v = buf_p - c->bytestream_start;
  813. if (buf_p - c->bytestream_start < v) {
  814. av_log(avctx, AV_LOG_ERROR, "Slice pointer chain broken\n");
  815. return AVERROR_INVALIDDATA;
  816. }
  817. buf_p -= v;
  818. if (f->ec) {
  819. unsigned crc = av_crc(av_crc_get_table(AV_CRC_32_IEEE), 0, buf_p, v);
  820. if (crc) {
  821. int64_t ts = avpkt->pts != AV_NOPTS_VALUE ? avpkt->pts : avpkt->dts;
  822. av_log(f->avctx, AV_LOG_ERROR, "CRC mismatch %X!", crc);
  823. if (ts != AV_NOPTS_VALUE && avctx->pkt_timebase.num) {
  824. av_log(f->avctx, AV_LOG_ERROR, "at %f seconds\n", ts*av_q2d(avctx->pkt_timebase));
  825. } else if (ts != AV_NOPTS_VALUE) {
  826. av_log(f->avctx, AV_LOG_ERROR, "at %"PRId64"\n", ts);
  827. } else {
  828. av_log(f->avctx, AV_LOG_ERROR, "\n");
  829. }
  830. fs->slice_damaged = 1;
  831. }
  832. }
  833. if (i) {
  834. ff_init_range_decoder(&fs->c, buf_p, v);
  835. } else
  836. fs->c.bytestream_end = (uint8_t *)(buf_p + v);
  837. fs->avctx = avctx;
  838. fs->cur = p;
  839. }
  840. avctx->execute(avctx,
  841. decode_slice,
  842. &f->slice_context[0],
  843. NULL,
  844. f->slice_count,
  845. sizeof(void*));
  846. for (i = f->slice_count - 1; i >= 0; i--) {
  847. FFV1Context *fs = f->slice_context[i];
  848. int j;
  849. if (fs->slice_damaged && f->last_picture.f->data[0]) {
  850. const uint8_t *src[4];
  851. uint8_t *dst[4];
  852. ff_thread_await_progress(&f->last_picture, INT_MAX, 0);
  853. for (j = 0; j < 4; j++) {
  854. int sh = (j == 1 || j == 2) ? f->chroma_h_shift : 0;
  855. int sv = (j == 1 || j == 2) ? f->chroma_v_shift : 0;
  856. dst[j] = p->data[j] + p->linesize[j] *
  857. (fs->slice_y >> sv) + (fs->slice_x >> sh);
  858. src[j] = f->last_picture.f->data[j] + f->last_picture.f->linesize[j] *
  859. (fs->slice_y >> sv) + (fs->slice_x >> sh);
  860. }
  861. av_image_copy(dst, p->linesize, (const uint8_t **)src,
  862. f->last_picture.f->linesize,
  863. avctx->pix_fmt,
  864. fs->slice_width,
  865. fs->slice_height);
  866. }
  867. }
  868. ff_thread_report_progress(&f->picture, INT_MAX, 0);
  869. f->picture_number++;
  870. if (f->last_picture.f)
  871. ff_thread_release_buffer(avctx, &f->last_picture);
  872. f->cur = NULL;
  873. if ((ret = av_frame_ref(data, f->picture.f)) < 0)
  874. return ret;
  875. *got_frame = 1;
  876. return buf_size;
  877. }
  878. static int init_thread_copy(AVCodecContext *avctx)
  879. {
  880. FFV1Context *f = avctx->priv_data;
  881. int i, ret;
  882. f->picture.f = NULL;
  883. f->last_picture.f = NULL;
  884. f->sample_buffer = NULL;
  885. f->max_slice_count = 0;
  886. f->slice_count = 0;
  887. for (i = 0; i < f->quant_table_count; i++) {
  888. av_assert0(f->version > 1);
  889. f->initial_states[i] = av_memdup(f->initial_states[i],
  890. f->context_count[i] * sizeof(*f->initial_states[i]));
  891. }
  892. f->picture.f = av_frame_alloc();
  893. f->last_picture.f = av_frame_alloc();
  894. if ((ret = ffv1_init_slice_contexts(f)) < 0)
  895. return ret;
  896. return 0;
  897. }
  898. static void copy_fields(FFV1Context *fsdst, FFV1Context *fssrc, FFV1Context *fsrc)
  899. {
  900. fsdst->version = fsrc->version;
  901. fsdst->micro_version = fsrc->micro_version;
  902. fsdst->chroma_planes = fsrc->chroma_planes;
  903. fsdst->chroma_h_shift = fsrc->chroma_h_shift;
  904. fsdst->chroma_v_shift = fsrc->chroma_v_shift;
  905. fsdst->transparency = fsrc->transparency;
  906. fsdst->plane_count = fsrc->plane_count;
  907. fsdst->ac = fsrc->ac;
  908. fsdst->colorspace = fsrc->colorspace;
  909. fsdst->ec = fsrc->ec;
  910. fsdst->intra = fsrc->intra;
  911. fsdst->slice_damaged = fssrc->slice_damaged;
  912. fsdst->key_frame_ok = fsrc->key_frame_ok;
  913. fsdst->bits_per_raw_sample = fsrc->bits_per_raw_sample;
  914. fsdst->packed_at_lsb = fsrc->packed_at_lsb;
  915. fsdst->slice_count = fsrc->slice_count;
  916. if (fsrc->version<3){
  917. fsdst->slice_x = fssrc->slice_x;
  918. fsdst->slice_y = fssrc->slice_y;
  919. fsdst->slice_width = fssrc->slice_width;
  920. fsdst->slice_height = fssrc->slice_height;
  921. }
  922. }
  923. static int update_thread_context(AVCodecContext *dst, const AVCodecContext *src)
  924. {
  925. FFV1Context *fsrc = src->priv_data;
  926. FFV1Context *fdst = dst->priv_data;
  927. int i, ret;
  928. if (dst == src)
  929. return 0;
  930. {
  931. FFV1Context bak = *fdst;
  932. memcpy(fdst, fsrc, sizeof(*fdst));
  933. memcpy(fdst->initial_states, bak.initial_states, sizeof(fdst->initial_states));
  934. memcpy(fdst->slice_context, bak.slice_context , sizeof(fdst->slice_context));
  935. fdst->picture = bak.picture;
  936. fdst->last_picture = bak.last_picture;
  937. for (i = 0; i<fdst->num_h_slices * fdst->num_v_slices; i++) {
  938. FFV1Context *fssrc = fsrc->slice_context[i];
  939. FFV1Context *fsdst = fdst->slice_context[i];
  940. copy_fields(fsdst, fssrc, fsrc);
  941. }
  942. av_assert0(!fdst->plane[0].state);
  943. av_assert0(!fdst->sample_buffer);
  944. }
  945. av_assert1(fdst->max_slice_count == fsrc->max_slice_count);
  946. ff_thread_release_buffer(dst, &fdst->picture);
  947. if (fsrc->picture.f->data[0]) {
  948. if ((ret = ff_thread_ref_frame(&fdst->picture, &fsrc->picture)) < 0)
  949. return ret;
  950. }
  951. fdst->fsrc = fsrc;
  952. return 0;
  953. }
  954. AVCodec ff_ffv1_decoder = {
  955. .name = "ffv1",
  956. .long_name = NULL_IF_CONFIG_SMALL("FFmpeg video codec #1"),
  957. .type = AVMEDIA_TYPE_VIDEO,
  958. .id = AV_CODEC_ID_FFV1,
  959. .priv_data_size = sizeof(FFV1Context),
  960. .init = decode_init,
  961. .close = ffv1_close,
  962. .decode = decode_frame,
  963. .init_thread_copy = ONLY_IF_THREADS_ENABLED(init_thread_copy),
  964. .update_thread_context = ONLY_IF_THREADS_ENABLED(update_thread_context),
  965. .capabilities = CODEC_CAP_DR1 /*| CODEC_CAP_DRAW_HORIZ_BAND*/ |
  966. CODEC_CAP_FRAME_THREADS | CODEC_CAP_SLICE_THREADS,
  967. };