You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

493 lines
16KB

  1. /*
  2. * Apple Intermediate Codec decoder
  3. *
  4. * Copyright (c) 2013 Konstantin Shishkov
  5. *
  6. * This file is part of Libav.
  7. *
  8. * Libav is free software; you can redistribute it and/or
  9. * modify it under the terms of the GNU Lesser General Public
  10. * License as published by the Free Software Foundation; either
  11. * version 2.1 of the License, or (at your option) any later version.
  12. *
  13. * Libav is distributed in the hope that it will be useful,
  14. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  16. * Lesser General Public License for more details.
  17. *
  18. * You should have received a copy of the GNU Lesser General Public
  19. * License along with Libav; if not, write to the Free Software
  20. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  21. */
  22. #include <inttypes.h>
  23. #include "avcodec.h"
  24. #include "bitstream.h"
  25. #include "bytestream.h"
  26. #include "golomb.h"
  27. #include "internal.h"
  28. #include "idctdsp.h"
  29. #include "thread.h"
  30. #include "unary.h"
  31. #define AIC_HDR_SIZE 24
  32. #define AIC_BAND_COEFFS (64 + 32 + 192 + 96)
  33. enum AICBands {
  34. COEFF_LUMA = 0,
  35. COEFF_CHROMA,
  36. COEFF_LUMA_EXT,
  37. COEFF_CHROMA_EXT,
  38. NUM_BANDS
  39. };
  40. static const int aic_num_band_coeffs[NUM_BANDS] = { 64, 32, 192, 96 };
  41. static const int aic_band_off[NUM_BANDS] = { 0, 64, 96, 288 };
  42. static const uint8_t aic_quant_matrix[64] = {
  43. 8, 16, 19, 22, 22, 26, 26, 27,
  44. 16, 16, 22, 22, 26, 27, 27, 29,
  45. 19, 22, 26, 26, 27, 29, 29, 35,
  46. 22, 24, 27, 27, 29, 32, 34, 38,
  47. 26, 27, 29, 29, 32, 35, 38, 46,
  48. 27, 29, 34, 34, 35, 40, 46, 56,
  49. 29, 34, 34, 37, 40, 48, 56, 69,
  50. 34, 37, 38, 40, 48, 58, 69, 83,
  51. };
  52. static const uint8_t aic_y_scan[64] = {
  53. 0, 4, 1, 2, 5, 8, 12, 9,
  54. 6, 3, 7, 10, 13, 14, 11, 15,
  55. 47, 43, 46, 45, 42, 39, 35, 38,
  56. 41, 44, 40, 37, 34, 33, 36, 32,
  57. 16, 20, 17, 18, 21, 24, 28, 25,
  58. 22, 19, 23, 26, 29, 30, 27, 31,
  59. 63, 59, 62, 61, 58, 55, 51, 54,
  60. 57, 60, 56, 53, 50, 49, 52, 48,
  61. };
  62. static const uint8_t aic_y_ext_scan[192] = {
  63. 64, 72, 65, 66, 73, 80, 88, 81,
  64. 74, 67, 75, 82, 89, 90, 83, 91,
  65. 0, 4, 1, 2, 5, 8, 12, 9,
  66. 6, 3, 7, 10, 13, 14, 11, 15,
  67. 16, 20, 17, 18, 21, 24, 28, 25,
  68. 22, 19, 23, 26, 29, 30, 27, 31,
  69. 155, 147, 154, 153, 146, 139, 131, 138,
  70. 145, 152, 144, 137, 130, 129, 136, 128,
  71. 47, 43, 46, 45, 42, 39, 35, 38,
  72. 41, 44, 40, 37, 34, 33, 36, 32,
  73. 63, 59, 62, 61, 58, 55, 51, 54,
  74. 57, 60, 56, 53, 50, 49, 52, 48,
  75. 96, 104, 97, 98, 105, 112, 120, 113,
  76. 106, 99, 107, 114, 121, 122, 115, 123,
  77. 68, 76, 69, 70, 77, 84, 92, 85,
  78. 78, 71, 79, 86, 93, 94, 87, 95,
  79. 100, 108, 101, 102, 109, 116, 124, 117,
  80. 110, 103, 111, 118, 125, 126, 119, 127,
  81. 187, 179, 186, 185, 178, 171, 163, 170,
  82. 177, 184, 176, 169, 162, 161, 168, 160,
  83. 159, 151, 158, 157, 150, 143, 135, 142,
  84. 149, 156, 148, 141, 134, 133, 140, 132,
  85. 191, 183, 190, 189, 182, 175, 167, 174,
  86. 181, 188, 180, 173, 166, 165, 172, 164,
  87. };
  88. static const uint8_t aic_c_scan[64] = {
  89. 0, 4, 1, 2, 5, 8, 12, 9,
  90. 6, 3, 7, 10, 13, 14, 11, 15,
  91. 31, 27, 30, 29, 26, 23, 19, 22,
  92. 25, 28, 24, 21, 18, 17, 20, 16,
  93. 32, 36, 33, 34, 37, 40, 44, 41,
  94. 38, 35, 39, 42, 45, 46, 43, 47,
  95. 63, 59, 62, 61, 58, 55, 51, 54,
  96. 57, 60, 56, 53, 50, 49, 52, 48,
  97. };
  98. static const uint8_t aic_c_ext_scan[192] = {
  99. 16, 24, 17, 18, 25, 32, 40, 33,
  100. 26, 19, 27, 34, 41, 42, 35, 43,
  101. 0, 4, 1, 2, 5, 8, 12, 9,
  102. 6, 3, 7, 10, 13, 14, 11, 15,
  103. 20, 28, 21, 22, 29, 36, 44, 37,
  104. 30, 23, 31, 38, 45, 46, 39, 47,
  105. 95, 87, 94, 93, 86, 79, 71, 78,
  106. 85, 92, 84, 77, 70, 69, 76, 68,
  107. 63, 59, 62, 61, 58, 55, 51, 54,
  108. 57, 60, 56, 53, 50, 49, 52, 48,
  109. 91, 83, 90, 89, 82, 75, 67, 74,
  110. 81, 88, 80, 73, 66, 65, 72, 64,
  111. 112, 120, 113, 114, 121, 128, 136, 129,
  112. 122, 115, 123, 130, 137, 138, 131, 139,
  113. 96, 100, 97, 98, 101, 104, 108, 105,
  114. 102, 99, 103, 106, 109, 110, 107, 111,
  115. 116, 124, 117, 118, 125, 132, 140, 133,
  116. 126, 119, 127, 134, 141, 142, 135, 143,
  117. 191, 183, 190, 189, 182, 175, 167, 174,
  118. 181, 188, 180, 173, 166, 165, 172, 164,
  119. 159, 155, 158, 157, 154, 151, 147, 150,
  120. 153, 156, 152, 149, 146, 145, 148, 144,
  121. 187, 179, 186, 185, 178, 171, 163, 170,
  122. 177, 184, 176, 169, 162, 161, 168, 160,
  123. };
  124. static const uint8_t * const aic_scan[NUM_BANDS] = {
  125. aic_y_scan, aic_c_scan, aic_y_ext_scan, aic_c_ext_scan
  126. };
  127. typedef struct AICContext {
  128. AVCodecContext *avctx;
  129. AVFrame *frame;
  130. IDCTDSPContext idsp;
  131. ScanTable scantable;
  132. int num_x_slices;
  133. int slice_width;
  134. int mb_width, mb_height;
  135. int quant;
  136. int interlaced;
  137. int16_t *slice_data;
  138. int16_t *data_ptr[NUM_BANDS];
  139. DECLARE_ALIGNED(16, int16_t, block)[64];
  140. } AICContext;
  141. static int aic_decode_header(AICContext *ctx, const uint8_t *src, int size)
  142. {
  143. uint32_t frame_size;
  144. int width, height;
  145. if (src[0] != 1) {
  146. av_log(ctx->avctx, AV_LOG_ERROR, "Invalid version %d\n", src[0]);
  147. return AVERROR_INVALIDDATA;
  148. }
  149. if (src[1] != AIC_HDR_SIZE - 2) {
  150. av_log(ctx->avctx, AV_LOG_ERROR, "Invalid header size %d\n", src[1]);
  151. return AVERROR_INVALIDDATA;
  152. }
  153. frame_size = AV_RB32(src + 2);
  154. width = AV_RB16(src + 6);
  155. height = AV_RB16(src + 8);
  156. if (frame_size > size) {
  157. av_log(ctx->avctx, AV_LOG_ERROR, "Frame size should be %"PRIu32" got %d\n",
  158. frame_size, size);
  159. return AVERROR_INVALIDDATA;
  160. }
  161. if (width != ctx->avctx->width || height != ctx->avctx->height) {
  162. av_log(ctx->avctx, AV_LOG_ERROR,
  163. "Picture dimension changed: old: %d x %d, new: %d x %d\n",
  164. ctx->avctx->width, ctx->avctx->height, width, height);
  165. return AVERROR_INVALIDDATA;
  166. }
  167. ctx->quant = src[15];
  168. ctx->interlaced = ((src[16] >> 4) == 3);
  169. return 0;
  170. }
  171. #define GET_CODE(val, type, add_bits) \
  172. do { \
  173. if (type) \
  174. val = get_ue_golomb(bc); \
  175. else \
  176. val = get_unary(bc, 1, 31); \
  177. if (add_bits) \
  178. val = (val << add_bits) + bitstream_read(bc, add_bits); \
  179. } while (0)
  180. static int aic_decode_coeffs(BitstreamContext *bc, int16_t *dst,
  181. int band, int slice_width, int force_chroma)
  182. {
  183. int has_skips, coeff_type, coeff_bits, skip_type, skip_bits;
  184. const int num_coeffs = aic_num_band_coeffs[band];
  185. const uint8_t *scan = aic_scan[band | force_chroma];
  186. int mb, idx, val;
  187. has_skips = bitstream_read_bit(bc);
  188. coeff_type = bitstream_read_bit(bc);
  189. coeff_bits = bitstream_read(bc, 3);
  190. if (has_skips) {
  191. skip_type = bitstream_read_bit(bc);
  192. skip_bits = bitstream_read(bc, 3);
  193. for (mb = 0; mb < slice_width; mb++) {
  194. idx = -1;
  195. do {
  196. GET_CODE(val, skip_type, skip_bits);
  197. if (val < 0)
  198. return AVERROR_INVALIDDATA;
  199. idx += val + 1;
  200. if (idx >= num_coeffs)
  201. break;
  202. GET_CODE(val, coeff_type, coeff_bits);
  203. val++;
  204. if (val >= 0x10000 || val < 0)
  205. return AVERROR_INVALIDDATA;
  206. dst[scan[idx]] = val;
  207. } while (idx < num_coeffs - 1);
  208. dst += num_coeffs;
  209. }
  210. } else {
  211. for (mb = 0; mb < slice_width; mb++) {
  212. for (idx = 0; idx < num_coeffs; idx++) {
  213. GET_CODE(val, coeff_type, coeff_bits);
  214. if (val >= 0x10000 || val < 0)
  215. return AVERROR_INVALIDDATA;
  216. dst[scan[idx]] = val;
  217. }
  218. dst += num_coeffs;
  219. }
  220. }
  221. return 0;
  222. }
  223. static void recombine_block(int16_t *dst, const uint8_t *scan,
  224. int16_t **base, int16_t **ext)
  225. {
  226. int i, j;
  227. for (i = 0; i < 4; i++) {
  228. for (j = 0; j < 4; j++)
  229. dst[scan[i * 8 + j]] = (*base)[j];
  230. for (j = 0; j < 4; j++)
  231. dst[scan[i * 8 + j + 4]] = (*ext)[j];
  232. *base += 4;
  233. *ext += 4;
  234. }
  235. for (; i < 8; i++) {
  236. for (j = 0; j < 8; j++)
  237. dst[scan[i * 8 + j]] = (*ext)[j];
  238. *ext += 8;
  239. }
  240. }
  241. static void recombine_block_il(int16_t *dst, const uint8_t *scan,
  242. int16_t **base, int16_t **ext,
  243. int block_no)
  244. {
  245. int i, j;
  246. if (block_no < 2) {
  247. for (i = 0; i < 8; i++) {
  248. for (j = 0; j < 4; j++)
  249. dst[scan[i * 8 + j]] = (*base)[j];
  250. for (j = 0; j < 4; j++)
  251. dst[scan[i * 8 + j + 4]] = (*ext)[j];
  252. *base += 4;
  253. *ext += 4;
  254. }
  255. } else {
  256. for (i = 0; i < 64; i++)
  257. dst[scan[i]] = (*ext)[i];
  258. *ext += 64;
  259. }
  260. }
  261. static void unquant_block(int16_t *block, int q)
  262. {
  263. int i;
  264. for (i = 0; i < 64; i++) {
  265. int val = (uint16_t)block[i];
  266. int sign = val & 1;
  267. block[i] = (((val >> 1) ^ -sign) * q * aic_quant_matrix[i] >> 4)
  268. + sign;
  269. }
  270. }
  271. static int aic_decode_slice(AICContext *ctx, int mb_x, int mb_y,
  272. const uint8_t *src, int src_size)
  273. {
  274. BitstreamContext bc;
  275. int ret, i, mb, blk;
  276. int slice_width = FFMIN(ctx->slice_width, ctx->mb_width - mb_x);
  277. uint8_t *Y, *C[2];
  278. uint8_t *dst;
  279. int16_t *base_y = ctx->data_ptr[COEFF_LUMA];
  280. int16_t *base_c = ctx->data_ptr[COEFF_CHROMA];
  281. int16_t *ext_y = ctx->data_ptr[COEFF_LUMA_EXT];
  282. int16_t *ext_c = ctx->data_ptr[COEFF_CHROMA_EXT];
  283. const int ystride = ctx->frame->linesize[0];
  284. Y = ctx->frame->data[0] + mb_x * 16 + mb_y * 16 * ystride;
  285. for (i = 0; i < 2; i++)
  286. C[i] = ctx->frame->data[i + 1] + mb_x * 8
  287. + mb_y * 8 * ctx->frame->linesize[i + 1];
  288. bitstream_init8(&bc, src, src_size);
  289. memset(ctx->slice_data, 0,
  290. sizeof(*ctx->slice_data) * slice_width * AIC_BAND_COEFFS);
  291. for (i = 0; i < NUM_BANDS; i++)
  292. if ((ret = aic_decode_coeffs(&bc, ctx->data_ptr[i],
  293. i, slice_width,
  294. !ctx->interlaced)) < 0)
  295. return ret;
  296. for (mb = 0; mb < slice_width; mb++) {
  297. for (blk = 0; blk < 4; blk++) {
  298. if (!ctx->interlaced)
  299. recombine_block(ctx->block, ctx->scantable.permutated,
  300. &base_y, &ext_y);
  301. else
  302. recombine_block_il(ctx->block, ctx->scantable.permutated,
  303. &base_y, &ext_y, blk);
  304. unquant_block(ctx->block, ctx->quant);
  305. ctx->idsp.idct(ctx->block);
  306. if (!ctx->interlaced) {
  307. dst = Y + (blk >> 1) * 8 * ystride + (blk & 1) * 8;
  308. ctx->idsp.put_signed_pixels_clamped(ctx->block, dst, ystride);
  309. } else {
  310. dst = Y + (blk & 1) * 8 + (blk >> 1) * ystride;
  311. ctx->idsp.put_signed_pixels_clamped(ctx->block, dst,
  312. ystride * 2);
  313. }
  314. }
  315. Y += 16;
  316. for (blk = 0; blk < 2; blk++) {
  317. recombine_block(ctx->block, ctx->scantable.permutated,
  318. &base_c, &ext_c);
  319. unquant_block(ctx->block, ctx->quant);
  320. ctx->idsp.idct(ctx->block);
  321. ctx->idsp.put_signed_pixels_clamped(ctx->block, C[blk],
  322. ctx->frame->linesize[blk + 1]);
  323. C[blk] += 8;
  324. }
  325. }
  326. return 0;
  327. }
  328. static int aic_decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
  329. AVPacket *avpkt)
  330. {
  331. AICContext *ctx = avctx->priv_data;
  332. const uint8_t *buf = avpkt->data;
  333. int buf_size = avpkt->size;
  334. GetByteContext gb;
  335. uint32_t off;
  336. int x, y, ret;
  337. int slice_size;
  338. ThreadFrame frame = { .f = data };
  339. ctx->frame = data;
  340. ctx->frame->pict_type = AV_PICTURE_TYPE_I;
  341. ctx->frame->key_frame = 1;
  342. off = FFALIGN(AIC_HDR_SIZE + ctx->num_x_slices * ctx->mb_height * 2, 4);
  343. if (buf_size < off) {
  344. av_log(avctx, AV_LOG_ERROR, "Too small frame\n");
  345. return AVERROR_INVALIDDATA;
  346. }
  347. ret = aic_decode_header(ctx, buf, buf_size);
  348. if (ret < 0) {
  349. av_log(avctx, AV_LOG_ERROR, "Invalid header\n");
  350. return ret;
  351. }
  352. if ((ret = ff_thread_get_buffer(avctx, &frame, 0)) < 0)
  353. return ret;
  354. bytestream2_init(&gb, buf + AIC_HDR_SIZE,
  355. ctx->num_x_slices * ctx->mb_height * 2);
  356. for (y = 0; y < ctx->mb_height; y++) {
  357. for (x = 0; x < ctx->mb_width; x += ctx->slice_width) {
  358. slice_size = bytestream2_get_le16(&gb) * 4;
  359. if (slice_size + off > buf_size || !slice_size) {
  360. av_log(avctx, AV_LOG_ERROR,
  361. "Incorrect slice size %d at %d.%d\n", slice_size, x, y);
  362. return AVERROR_INVALIDDATA;
  363. }
  364. ret = aic_decode_slice(ctx, x, y, buf + off, slice_size);
  365. if (ret < 0) {
  366. av_log(avctx, AV_LOG_ERROR,
  367. "Error decoding slice at %d.%d\n", x, y);
  368. return ret;
  369. }
  370. off += slice_size;
  371. }
  372. }
  373. *got_frame = 1;
  374. return avpkt->size;
  375. }
  376. static av_cold int aic_decode_init(AVCodecContext *avctx)
  377. {
  378. AICContext *ctx = avctx->priv_data;
  379. int i;
  380. uint8_t scan[64];
  381. ctx->avctx = avctx;
  382. avctx->pix_fmt = AV_PIX_FMT_YUV420P;
  383. ff_idctdsp_init(&ctx->idsp, avctx);
  384. for (i = 0; i < 64; i++)
  385. scan[i] = i;
  386. ff_init_scantable(ctx->idsp.idct_permutation, &ctx->scantable, scan);
  387. ctx->mb_width = FFALIGN(avctx->width, 16) >> 4;
  388. ctx->mb_height = FFALIGN(avctx->height, 16) >> 4;
  389. ctx->num_x_slices = (ctx->mb_width + 15) >> 4;
  390. ctx->slice_width = 16;
  391. for (i = 1; i < 32; i++) {
  392. if (!(ctx->mb_width % i) && (ctx->mb_width / i <= 32)) {
  393. ctx->slice_width = ctx->mb_width / i;
  394. ctx->num_x_slices = i;
  395. break;
  396. }
  397. }
  398. ctx->slice_data = av_malloc(ctx->slice_width * AIC_BAND_COEFFS
  399. * sizeof(*ctx->slice_data));
  400. if (!ctx->slice_data) {
  401. av_log(avctx, AV_LOG_ERROR, "Error allocating slice buffer\n");
  402. return AVERROR(ENOMEM);
  403. }
  404. for (i = 0; i < NUM_BANDS; i++)
  405. ctx->data_ptr[i] = ctx->slice_data + ctx->slice_width
  406. * aic_band_off[i];
  407. return 0;
  408. }
  409. static av_cold int aic_decode_close(AVCodecContext *avctx)
  410. {
  411. AICContext *ctx = avctx->priv_data;
  412. av_freep(&ctx->slice_data);
  413. return 0;
  414. }
  415. AVCodec ff_aic_decoder = {
  416. .name = "aic",
  417. .long_name = NULL_IF_CONFIG_SMALL("Apple Intermediate Codec"),
  418. .type = AVMEDIA_TYPE_VIDEO,
  419. .id = AV_CODEC_ID_AIC,
  420. .priv_data_size = sizeof(AICContext),
  421. .init = aic_decode_init,
  422. .close = aic_decode_close,
  423. .decode = aic_decode_frame,
  424. .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
  425. .init_thread_copy = ONLY_IF_THREADS_ENABLED(aic_decode_init),
  426. .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE,
  427. };