You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

510 lines
16KB

  1. /*
  2. * Apple Intermediate Codec decoder
  3. *
  4. * Copyright (c) 2013 Konstantin Shishkov
  5. *
  6. * This file is part of FFmpeg.
  7. *
  8. * FFmpeg is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * FFmpeg is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with FFmpeg; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. #include <inttypes.h>
  23. #include "avcodec.h"
  24. #include "bytestream.h"
  25. #include "internal.h"
  26. #include "get_bits.h"
  27. #include "golomb.h"
  28. #include "idctdsp.h"
  29. #include "thread.h"
  30. #include "unary.h"
  31. #define AIC_HDR_SIZE 24
  32. #define AIC_BAND_COEFFS (64 + 32 + 192 + 96)
  33. enum AICBands {
  34. COEFF_LUMA = 0,
  35. COEFF_CHROMA,
  36. COEFF_LUMA_EXT,
  37. COEFF_CHROMA_EXT,
  38. NUM_BANDS
  39. };
  40. static const uint8_t aic_num_band_coeffs[NUM_BANDS] = { 64, 32, 192, 96 };
  41. static const uint16_t aic_band_off[NUM_BANDS] = { 0, 64, 96, 288 };
  42. static const uint8_t aic_quant_matrix[64] = {
  43. 8, 16, 19, 22, 22, 26, 26, 27,
  44. 16, 16, 22, 22, 26, 27, 27, 29,
  45. 19, 22, 26, 26, 27, 29, 29, 35,
  46. 22, 24, 27, 27, 29, 32, 34, 38,
  47. 26, 27, 29, 29, 32, 35, 38, 46,
  48. 27, 29, 34, 34, 35, 40, 46, 56,
  49. 29, 34, 34, 37, 40, 48, 56, 69,
  50. 34, 37, 38, 40, 48, 58, 69, 83,
  51. };
  52. static const uint8_t aic_y_scan[64] = {
  53. 0, 4, 1, 2, 5, 8, 12, 9,
  54. 6, 3, 7, 10, 13, 14, 11, 15,
  55. 47, 43, 46, 45, 42, 39, 35, 38,
  56. 41, 44, 40, 37, 34, 33, 36, 32,
  57. 16, 20, 17, 18, 21, 24, 28, 25,
  58. 22, 19, 23, 26, 29, 30, 27, 31,
  59. 63, 59, 62, 61, 58, 55, 51, 54,
  60. 57, 60, 56, 53, 50, 49, 52, 48,
  61. };
  62. static const uint8_t aic_y_ext_scan[192] = {
  63. 64, 72, 65, 66, 73, 80, 88, 81,
  64. 74, 67, 75, 82, 89, 90, 83, 91,
  65. 0, 4, 1, 2, 5, 8, 12, 9,
  66. 6, 3, 7, 10, 13, 14, 11, 15,
  67. 16, 20, 17, 18, 21, 24, 28, 25,
  68. 22, 19, 23, 26, 29, 30, 27, 31,
  69. 155, 147, 154, 153, 146, 139, 131, 138,
  70. 145, 152, 144, 137, 130, 129, 136, 128,
  71. 47, 43, 46, 45, 42, 39, 35, 38,
  72. 41, 44, 40, 37, 34, 33, 36, 32,
  73. 63, 59, 62, 61, 58, 55, 51, 54,
  74. 57, 60, 56, 53, 50, 49, 52, 48,
  75. 96, 104, 97, 98, 105, 112, 120, 113,
  76. 106, 99, 107, 114, 121, 122, 115, 123,
  77. 68, 76, 69, 70, 77, 84, 92, 85,
  78. 78, 71, 79, 86, 93, 94, 87, 95,
  79. 100, 108, 101, 102, 109, 116, 124, 117,
  80. 110, 103, 111, 118, 125, 126, 119, 127,
  81. 187, 179, 186, 185, 178, 171, 163, 170,
  82. 177, 184, 176, 169, 162, 161, 168, 160,
  83. 159, 151, 158, 157, 150, 143, 135, 142,
  84. 149, 156, 148, 141, 134, 133, 140, 132,
  85. 191, 183, 190, 189, 182, 175, 167, 174,
  86. 181, 188, 180, 173, 166, 165, 172, 164,
  87. };
  88. static const uint8_t aic_c_scan[64] = {
  89. 0, 4, 1, 2, 5, 8, 12, 9,
  90. 6, 3, 7, 10, 13, 14, 11, 15,
  91. 31, 27, 30, 29, 26, 23, 19, 22,
  92. 25, 28, 24, 21, 18, 17, 20, 16,
  93. 32, 36, 33, 34, 37, 40, 44, 41,
  94. 38, 35, 39, 42, 45, 46, 43, 47,
  95. 63, 59, 62, 61, 58, 55, 51, 54,
  96. 57, 60, 56, 53, 50, 49, 52, 48,
  97. };
  98. static const uint8_t aic_c_ext_scan[192] = {
  99. 16, 24, 17, 18, 25, 32, 40, 33,
  100. 26, 19, 27, 34, 41, 42, 35, 43,
  101. 0, 4, 1, 2, 5, 8, 12, 9,
  102. 6, 3, 7, 10, 13, 14, 11, 15,
  103. 20, 28, 21, 22, 29, 36, 44, 37,
  104. 30, 23, 31, 38, 45, 46, 39, 47,
  105. 95, 87, 94, 93, 86, 79, 71, 78,
  106. 85, 92, 84, 77, 70, 69, 76, 68,
  107. 63, 59, 62, 61, 58, 55, 51, 54,
  108. 57, 60, 56, 53, 50, 49, 52, 48,
  109. 91, 83, 90, 89, 82, 75, 67, 74,
  110. 81, 88, 80, 73, 66, 65, 72, 64,
  111. 112, 120, 113, 114, 121, 128, 136, 129,
  112. 122, 115, 123, 130, 137, 138, 131, 139,
  113. 96, 100, 97, 98, 101, 104, 108, 105,
  114. 102, 99, 103, 106, 109, 110, 107, 111,
  115. 116, 124, 117, 118, 125, 132, 140, 133,
  116. 126, 119, 127, 134, 141, 142, 135, 143,
  117. 191, 183, 190, 189, 182, 175, 167, 174,
  118. 181, 188, 180, 173, 166, 165, 172, 164,
  119. 159, 155, 158, 157, 154, 151, 147, 150,
  120. 153, 156, 152, 149, 146, 145, 148, 144,
  121. 187, 179, 186, 185, 178, 171, 163, 170,
  122. 177, 184, 176, 169, 162, 161, 168, 160,
  123. };
  124. static const uint8_t * const aic_scan[NUM_BANDS] = {
  125. aic_y_scan, aic_c_scan, aic_y_ext_scan, aic_c_ext_scan
  126. };
  127. typedef struct AICContext {
  128. AVCodecContext *avctx;
  129. AVFrame *frame;
  130. IDCTDSPContext idsp;
  131. ScanTable scantable;
  132. int num_x_slices;
  133. int slice_width;
  134. int mb_width, mb_height;
  135. int quant;
  136. int interlaced;
  137. int16_t *slice_data;
  138. int16_t *data_ptr[NUM_BANDS];
  139. DECLARE_ALIGNED(16, int16_t, block)[64];
  140. DECLARE_ALIGNED(16, uint8_t, quant_matrix)[64];
  141. } AICContext;
  142. static int aic_decode_header(AICContext *ctx, const uint8_t *src, int size)
  143. {
  144. uint32_t frame_size;
  145. int width, height;
  146. if (src[0] != 1) {
  147. av_log(ctx->avctx, AV_LOG_ERROR, "Invalid version %d\n", src[0]);
  148. return AVERROR_INVALIDDATA;
  149. }
  150. if (src[1] != AIC_HDR_SIZE - 2) {
  151. av_log(ctx->avctx, AV_LOG_ERROR, "Invalid header size %d\n", src[1]);
  152. return AVERROR_INVALIDDATA;
  153. }
  154. frame_size = AV_RB32(src + 2);
  155. width = AV_RB16(src + 6);
  156. height = AV_RB16(src + 8);
  157. if (frame_size > size) {
  158. av_log(ctx->avctx, AV_LOG_ERROR, "Frame size should be %"PRIu32" got %d\n",
  159. frame_size, size);
  160. return AVERROR_INVALIDDATA;
  161. }
  162. if (width != ctx->avctx->width || height != ctx->avctx->height) {
  163. av_log(ctx->avctx, AV_LOG_ERROR,
  164. "Picture dimension changed: old: %d x %d, new: %d x %d\n",
  165. ctx->avctx->width, ctx->avctx->height, width, height);
  166. return AVERROR_INVALIDDATA;
  167. }
  168. ctx->quant = src[15];
  169. ctx->interlaced = ((src[16] >> 4) == 3);
  170. return 0;
  171. }
  172. #define GET_CODE(val, type, add_bits) \
  173. do { \
  174. if (type) \
  175. val = get_ue_golomb(gb); \
  176. else \
  177. val = get_unary(gb, 1, 31); \
  178. if (add_bits) \
  179. val = (val << add_bits) + get_bits(gb, add_bits); \
  180. } while (0)
  181. static int aic_decode_coeffs(GetBitContext *gb, int16_t *dst,
  182. int band, int slice_width, int force_chroma)
  183. {
  184. int has_skips, coeff_type, coeff_bits, skip_type, skip_bits;
  185. const int num_coeffs = aic_num_band_coeffs[band];
  186. const uint8_t *scan = aic_scan[band | force_chroma];
  187. int mb, idx;
  188. unsigned val;
  189. if (get_bits_left(gb) < 5)
  190. return AVERROR_INVALIDDATA;
  191. has_skips = get_bits1(gb);
  192. coeff_type = get_bits1(gb);
  193. coeff_bits = get_bits(gb, 3);
  194. if (has_skips) {
  195. skip_type = get_bits1(gb);
  196. skip_bits = get_bits(gb, 3);
  197. for (mb = 0; mb < slice_width; mb++) {
  198. idx = -1;
  199. do {
  200. GET_CODE(val, skip_type, skip_bits);
  201. if (val >= 0x10000)
  202. return AVERROR_INVALIDDATA;
  203. idx += val + 1;
  204. if (idx >= num_coeffs)
  205. break;
  206. GET_CODE(val, coeff_type, coeff_bits);
  207. val++;
  208. if (val >= 0x10000)
  209. return AVERROR_INVALIDDATA;
  210. dst[scan[idx]] = val;
  211. } while (idx < num_coeffs - 1);
  212. dst += num_coeffs;
  213. }
  214. } else {
  215. for (mb = 0; mb < slice_width; mb++) {
  216. for (idx = 0; idx < num_coeffs; idx++) {
  217. GET_CODE(val, coeff_type, coeff_bits);
  218. if (val >= 0x10000)
  219. return AVERROR_INVALIDDATA;
  220. dst[scan[idx]] = val;
  221. }
  222. dst += num_coeffs;
  223. }
  224. }
  225. return 0;
  226. }
  227. static void recombine_block(int16_t *dst, const uint8_t *scan,
  228. int16_t **base, int16_t **ext)
  229. {
  230. int i, j;
  231. for (i = 0; i < 4; i++) {
  232. for (j = 0; j < 4; j++)
  233. dst[scan[i * 8 + j]] = (*base)[j];
  234. for (j = 0; j < 4; j++)
  235. dst[scan[i * 8 + j + 4]] = (*ext)[j];
  236. *base += 4;
  237. *ext += 4;
  238. }
  239. for (; i < 8; i++) {
  240. for (j = 0; j < 8; j++)
  241. dst[scan[i * 8 + j]] = (*ext)[j];
  242. *ext += 8;
  243. }
  244. }
  245. static void recombine_block_il(int16_t *dst, const uint8_t *scan,
  246. int16_t **base, int16_t **ext,
  247. int block_no)
  248. {
  249. int i, j;
  250. if (block_no < 2) {
  251. for (i = 0; i < 8; i++) {
  252. for (j = 0; j < 4; j++)
  253. dst[scan[i * 8 + j]] = (*base)[j];
  254. for (j = 0; j < 4; j++)
  255. dst[scan[i * 8 + j + 4]] = (*ext)[j];
  256. *base += 4;
  257. *ext += 4;
  258. }
  259. } else {
  260. for (i = 0; i < 64; i++)
  261. dst[scan[i]] = (*ext)[i];
  262. *ext += 64;
  263. }
  264. }
  265. static void unquant_block(int16_t *block, int q, uint8_t *quant_matrix)
  266. {
  267. int i;
  268. for (i = 0; i < 64; i++) {
  269. int val = (uint16_t)block[i];
  270. int sign = val & 1;
  271. block[i] = (((val >> 1) ^ -sign) * q * quant_matrix[i] >> 4)
  272. + sign;
  273. }
  274. }
  275. static int aic_decode_slice(AICContext *ctx, int mb_x, int mb_y,
  276. const uint8_t *src, int src_size)
  277. {
  278. GetBitContext gb;
  279. int ret, i, mb, blk;
  280. int slice_width = FFMIN(ctx->slice_width, ctx->mb_width - mb_x);
  281. int last_row = mb_y && mb_y == ctx->mb_height - 1;
  282. int y_pos, c_pos;
  283. uint8_t *Y, *C[2];
  284. uint8_t *dst;
  285. int16_t *base_y = ctx->data_ptr[COEFF_LUMA];
  286. int16_t *base_c = ctx->data_ptr[COEFF_CHROMA];
  287. int16_t *ext_y = ctx->data_ptr[COEFF_LUMA_EXT];
  288. int16_t *ext_c = ctx->data_ptr[COEFF_CHROMA_EXT];
  289. const int ystride = ctx->frame->linesize[0];
  290. if (last_row) {
  291. y_pos = (ctx->avctx->height - 16);
  292. c_pos = ((ctx->avctx->height+1)/2 - 8);
  293. } else {
  294. y_pos = mb_y * 16;
  295. c_pos = mb_y * 8;
  296. }
  297. Y = ctx->frame->data[0] + mb_x * 16 + y_pos * ystride;
  298. for (i = 0; i < 2; i++)
  299. C[i] = ctx->frame->data[i + 1] + mb_x * 8
  300. + c_pos * ctx->frame->linesize[i + 1];
  301. init_get_bits(&gb, src, src_size * 8);
  302. memset(ctx->slice_data, 0,
  303. sizeof(*ctx->slice_data) * slice_width * AIC_BAND_COEFFS);
  304. for (i = 0; i < NUM_BANDS; i++)
  305. if ((ret = aic_decode_coeffs(&gb, ctx->data_ptr[i],
  306. i, slice_width,
  307. !ctx->interlaced)) < 0)
  308. return ret;
  309. for (mb = 0; mb < slice_width; mb++) {
  310. for (blk = 0; blk < 4; blk++) {
  311. if (!ctx->interlaced)
  312. recombine_block(ctx->block, ctx->scantable.permutated,
  313. &base_y, &ext_y);
  314. else
  315. recombine_block_il(ctx->block, ctx->scantable.permutated,
  316. &base_y, &ext_y, blk);
  317. unquant_block(ctx->block, ctx->quant, ctx->quant_matrix);
  318. ctx->idsp.idct(ctx->block);
  319. if (!ctx->interlaced) {
  320. dst = Y + (blk >> 1) * 8 * ystride + (blk & 1) * 8;
  321. ctx->idsp.put_signed_pixels_clamped(ctx->block, dst, ystride);
  322. } else {
  323. dst = Y + (blk & 1) * 8 + (blk >> 1) * ystride;
  324. ctx->idsp.put_signed_pixels_clamped(ctx->block, dst,
  325. ystride * 2);
  326. }
  327. }
  328. Y += 16;
  329. for (blk = 0; blk < 2; blk++) {
  330. recombine_block(ctx->block, ctx->scantable.permutated,
  331. &base_c, &ext_c);
  332. unquant_block(ctx->block, ctx->quant, ctx->quant_matrix);
  333. ctx->idsp.idct(ctx->block);
  334. ctx->idsp.put_signed_pixels_clamped(ctx->block, C[blk],
  335. ctx->frame->linesize[blk + 1]);
  336. C[blk] += 8;
  337. }
  338. }
  339. return 0;
  340. }
  341. static int aic_decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
  342. AVPacket *avpkt)
  343. {
  344. AICContext *ctx = avctx->priv_data;
  345. const uint8_t *buf = avpkt->data;
  346. int buf_size = avpkt->size;
  347. GetByteContext gb;
  348. uint32_t off;
  349. int x, y, ret;
  350. int slice_size;
  351. ThreadFrame frame = { .f = data };
  352. ctx->frame = data;
  353. ctx->frame->pict_type = AV_PICTURE_TYPE_I;
  354. ctx->frame->key_frame = 1;
  355. off = FFALIGN(AIC_HDR_SIZE + ctx->num_x_slices * ctx->mb_height * 2, 4);
  356. if (buf_size < off) {
  357. av_log(avctx, AV_LOG_ERROR, "Too small frame\n");
  358. return AVERROR_INVALIDDATA;
  359. }
  360. ret = aic_decode_header(ctx, buf, buf_size);
  361. if (ret < 0) {
  362. av_log(avctx, AV_LOG_ERROR, "Invalid header\n");
  363. return ret;
  364. }
  365. if ((ret = ff_thread_get_buffer(avctx, &frame, 0)) < 0)
  366. return ret;
  367. bytestream2_init(&gb, buf + AIC_HDR_SIZE,
  368. ctx->num_x_slices * ctx->mb_height * 2);
  369. for (y = 0; y < ctx->mb_height; y++) {
  370. for (x = 0; x < ctx->mb_width; x += ctx->slice_width) {
  371. slice_size = bytestream2_get_le16(&gb) * 4;
  372. if (slice_size + off > buf_size || !slice_size) {
  373. av_log(avctx, AV_LOG_ERROR,
  374. "Incorrect slice size %d at %d.%d\n", slice_size, x, y);
  375. return AVERROR_INVALIDDATA;
  376. }
  377. ret = aic_decode_slice(ctx, x, y, buf + off, slice_size);
  378. if (ret < 0) {
  379. av_log(avctx, AV_LOG_ERROR,
  380. "Error decoding slice at %d.%d\n", x, y);
  381. return ret;
  382. }
  383. off += slice_size;
  384. }
  385. }
  386. *got_frame = 1;
  387. return avpkt->size;
  388. }
  389. static av_cold int aic_decode_init(AVCodecContext *avctx)
  390. {
  391. AICContext *ctx = avctx->priv_data;
  392. int i;
  393. uint8_t scan[64];
  394. ctx->avctx = avctx;
  395. avctx->pix_fmt = AV_PIX_FMT_YUV420P;
  396. ff_idctdsp_init(&ctx->idsp, avctx);
  397. for (i = 0; i < 64; i++)
  398. scan[i] = i;
  399. ff_init_scantable(ctx->idsp.idct_permutation, &ctx->scantable, scan);
  400. for (i = 0; i < 64; i++)
  401. ctx->quant_matrix[ctx->idsp.idct_permutation[i]] = aic_quant_matrix[i];
  402. ctx->mb_width = FFALIGN(avctx->width, 16) >> 4;
  403. ctx->mb_height = FFALIGN(avctx->height, 16) >> 4;
  404. ctx->num_x_slices = (ctx->mb_width + 15) >> 4;
  405. ctx->slice_width = 16;
  406. for (i = 1; i < ctx->mb_width; i++) {
  407. if (!(ctx->mb_width % i) && (ctx->mb_width / i <= 32)) {
  408. ctx->slice_width = ctx->mb_width / i;
  409. ctx->num_x_slices = i;
  410. break;
  411. }
  412. }
  413. ctx->slice_data = av_malloc_array(ctx->slice_width, AIC_BAND_COEFFS
  414. * sizeof(*ctx->slice_data));
  415. if (!ctx->slice_data) {
  416. av_log(avctx, AV_LOG_ERROR, "Error allocating slice buffer\n");
  417. return AVERROR(ENOMEM);
  418. }
  419. for (i = 0; i < NUM_BANDS; i++)
  420. ctx->data_ptr[i] = ctx->slice_data + ctx->slice_width
  421. * aic_band_off[i];
  422. return 0;
  423. }
  424. static av_cold int aic_decode_close(AVCodecContext *avctx)
  425. {
  426. AICContext *ctx = avctx->priv_data;
  427. av_freep(&ctx->slice_data);
  428. return 0;
  429. }
  430. AVCodec ff_aic_decoder = {
  431. .name = "aic",
  432. .long_name = NULL_IF_CONFIG_SMALL("Apple Intermediate Codec"),
  433. .type = AVMEDIA_TYPE_VIDEO,
  434. .id = AV_CODEC_ID_AIC,
  435. .priv_data_size = sizeof(AICContext),
  436. .init = aic_decode_init,
  437. .close = aic_decode_close,
  438. .decode = aic_decode_frame,
  439. .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
  440. .init_thread_copy = ONLY_IF_THREADS_ENABLED(aic_decode_init),
  441. .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE,
  442. };