You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1139 lines
39KB

  1. /*
  2. * Intel Indeo 3 (IV31, IV32, etc.) video decoder for ffmpeg
  3. * written, produced, and directed by Alan Smithee
  4. *
  5. * This file is part of FFmpeg.
  6. *
  7. * FFmpeg is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU Lesser General Public
  9. * License as published by the Free Software Foundation; either
  10. * version 2.1 of the License, or (at your option) any later version.
  11. *
  12. * FFmpeg is distributed in the hope that it will be useful,
  13. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  15. * Lesser General Public License for more details.
  16. *
  17. * You should have received a copy of the GNU Lesser General Public
  18. * License along with FFmpeg; if not, write to the Free Software
  19. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20. */
  21. #include <stdio.h>
  22. #include <stdlib.h>
  23. #include <string.h>
  24. #include <unistd.h>
  25. #include "avcodec.h"
  26. #include "dsputil.h"
  27. #include "bytestream.h"
  28. #include "indeo3data.h"
  29. typedef struct
  30. {
  31. unsigned char *Ybuf;
  32. unsigned char *Ubuf;
  33. unsigned char *Vbuf;
  34. unsigned char *the_buf;
  35. unsigned int the_buf_size;
  36. unsigned short y_w, y_h;
  37. unsigned short uv_w, uv_h;
  38. } YUVBufs;
  39. typedef struct Indeo3DecodeContext {
  40. AVCodecContext *avctx;
  41. int width, height;
  42. AVFrame frame;
  43. YUVBufs iv_frame[2];
  44. YUVBufs *cur_frame;
  45. YUVBufs *ref_frame;
  46. unsigned char *ModPred;
  47. unsigned short *corrector_type;
  48. } Indeo3DecodeContext;
  49. static const int corrector_type_0[24] = {
  50. 195, 159, 133, 115, 101, 93, 87, 77,
  51. 195, 159, 133, 115, 101, 93, 87, 77,
  52. 128, 79, 79, 79, 79, 79, 79, 79
  53. };
  54. static const int corrector_type_2[8] = { 9, 7, 6, 8, 5, 4, 3, 2 };
  55. static av_cold void build_modpred(Indeo3DecodeContext *s)
  56. {
  57. int i, j;
  58. s->ModPred = (unsigned char *) av_malloc (8 * 128);
  59. for (i=0; i < 128; ++i) {
  60. s->ModPred[i+0*128] = (i > 126) ? 254 : 2*((i + 1) - ((i + 1) % 2));
  61. s->ModPred[i+1*128] = (i == 7) ? 20 : ((i == 119 || i == 120)
  62. ? 236 : 2*((i + 2) - ((i + 1) % 3)));
  63. s->ModPred[i+2*128] = (i > 125) ? 248 : 2*((i + 2) - ((i + 2) % 4));
  64. s->ModPred[i+3*128] = 2*((i + 1) - ((i - 3) % 5));
  65. s->ModPred[i+4*128] = (i == 8) ? 20 : 2*((i + 1) - ((i - 3) % 6));
  66. s->ModPred[i+5*128] = 2*((i + 4) - ((i + 3) % 7));
  67. s->ModPred[i+6*128] = (i > 123) ? 240 : 2*((i + 4) - ((i + 4) % 8));
  68. s->ModPred[i+7*128] = 2*((i + 5) - ((i + 4) % 9));
  69. }
  70. s->corrector_type = (unsigned short *) av_malloc (24 * 256 * sizeof(unsigned short));
  71. for (i=0; i < 24; ++i) {
  72. for (j=0; j < 256; ++j) {
  73. s->corrector_type[i*256+j] = (j < corrector_type_0[i])
  74. ? 1 : ((j < 248 || (i == 16 && j == 248))
  75. ? 0 : corrector_type_2[j - 248]);
  76. }
  77. }
  78. }
  79. static void iv_Decode_Chunk(Indeo3DecodeContext *s, unsigned char *cur,
  80. unsigned char *ref, int width, int height, const unsigned char *buf1,
  81. long fflags2, const unsigned char *hdr,
  82. const unsigned char *buf2, int min_width_160);
  83. /* ---------------------------------------------------------------------- */
  84. static av_cold void iv_alloc_frames(Indeo3DecodeContext *s)
  85. {
  86. int luma_width, luma_height, luma_pixels, chroma_width, chroma_height,
  87. chroma_pixels, i;
  88. unsigned int bufsize;
  89. luma_width = (s->width + 3) & (~3);
  90. luma_height = (s->height + 3) & (~3);
  91. s->iv_frame[0].y_w = s->iv_frame[0].y_h =
  92. s->iv_frame[0].the_buf_size = 0;
  93. s->iv_frame[1].y_w = s->iv_frame[1].y_h =
  94. s->iv_frame[1].the_buf_size = 0;
  95. s->iv_frame[1].the_buf = NULL;
  96. chroma_width = ((luma_width >> 2) + 3) & (~3);
  97. chroma_height = ((luma_height>> 2) + 3) & (~3);
  98. luma_pixels = luma_width * luma_height;
  99. chroma_pixels = chroma_width * chroma_height;
  100. bufsize = luma_pixels * 2 + luma_width * 3 +
  101. (chroma_pixels + chroma_width) * 4;
  102. if((s->iv_frame[0].the_buf =
  103. (s->iv_frame[0].the_buf_size == 0 ? av_malloc(bufsize) :
  104. av_realloc(s->iv_frame[0].the_buf, bufsize))) == NULL)
  105. return;
  106. s->iv_frame[0].y_w = s->iv_frame[1].y_w = luma_width;
  107. s->iv_frame[0].y_h = s->iv_frame[1].y_h = luma_height;
  108. s->iv_frame[0].uv_w = s->iv_frame[1].uv_w = chroma_width;
  109. s->iv_frame[0].uv_h = s->iv_frame[1].uv_h = chroma_height;
  110. s->iv_frame[0].the_buf_size = bufsize;
  111. s->iv_frame[0].Ybuf = s->iv_frame[0].the_buf + luma_width;
  112. i = luma_pixels + luma_width * 2;
  113. s->iv_frame[1].Ybuf = s->iv_frame[0].the_buf + i;
  114. i += (luma_pixels + luma_width);
  115. s->iv_frame[0].Ubuf = s->iv_frame[0].the_buf + i;
  116. i += (chroma_pixels + chroma_width);
  117. s->iv_frame[1].Ubuf = s->iv_frame[0].the_buf + i;
  118. i += (chroma_pixels + chroma_width);
  119. s->iv_frame[0].Vbuf = s->iv_frame[0].the_buf + i;
  120. i += (chroma_pixels + chroma_width);
  121. s->iv_frame[1].Vbuf = s->iv_frame[0].the_buf + i;
  122. for(i = 1; i <= luma_width; i++)
  123. s->iv_frame[0].Ybuf[-i] = s->iv_frame[1].Ybuf[-i] =
  124. s->iv_frame[0].Ubuf[-i] = 0x80;
  125. for(i = 1; i <= chroma_width; i++) {
  126. s->iv_frame[1].Ubuf[-i] = 0x80;
  127. s->iv_frame[0].Vbuf[-i] = 0x80;
  128. s->iv_frame[1].Vbuf[-i] = 0x80;
  129. s->iv_frame[1].Vbuf[chroma_pixels+i-1] = 0x80;
  130. }
  131. }
  132. /* ---------------------------------------------------------------------- */
  133. static av_cold void iv_free_func(Indeo3DecodeContext *s)
  134. {
  135. int i;
  136. for(i = 0 ; i < 2 ; i++) {
  137. if(s->iv_frame[i].the_buf != NULL)
  138. av_free(s->iv_frame[i].the_buf);
  139. s->iv_frame[i].Ybuf = s->iv_frame[i].Ubuf =
  140. s->iv_frame[i].Vbuf = NULL;
  141. s->iv_frame[i].the_buf = NULL;
  142. s->iv_frame[i].the_buf_size = 0;
  143. s->iv_frame[i].y_w = s->iv_frame[i].y_h = 0;
  144. s->iv_frame[i].uv_w = s->iv_frame[i].uv_h = 0;
  145. }
  146. av_free(s->ModPred);
  147. av_free(s->corrector_type);
  148. }
  149. /* ---------------------------------------------------------------------- */
  150. static unsigned long iv_decode_frame(Indeo3DecodeContext *s,
  151. const unsigned char *buf, int buf_size)
  152. {
  153. unsigned int hdr_width, hdr_height,
  154. chroma_width, chroma_height;
  155. unsigned long fflags1, fflags2, fflags3, offs1, offs2, offs3, offs;
  156. const unsigned char *hdr_pos, *buf_pos;
  157. buf_pos = buf;
  158. buf_pos += 18;
  159. fflags1 = bytestream_get_le16(&buf_pos);
  160. fflags3 = bytestream_get_le32(&buf_pos);
  161. fflags2 = *buf_pos++;
  162. buf_pos += 3;
  163. hdr_height = bytestream_get_le16(&buf_pos);
  164. hdr_width = bytestream_get_le16(&buf_pos);
  165. if(avcodec_check_dimensions(NULL, hdr_width, hdr_height))
  166. return -1;
  167. chroma_height = ((hdr_height >> 2) + 3) & 0x7ffc;
  168. chroma_width = ((hdr_width >> 2) + 3) & 0x7ffc;
  169. offs1 = bytestream_get_le32(&buf_pos);
  170. offs2 = bytestream_get_le32(&buf_pos);
  171. offs3 = bytestream_get_le32(&buf_pos);
  172. buf_pos += 4;
  173. hdr_pos = buf_pos;
  174. if(fflags3 == 0x80) return 4;
  175. if(fflags1 & 0x200) {
  176. s->cur_frame = s->iv_frame + 1;
  177. s->ref_frame = s->iv_frame;
  178. } else {
  179. s->cur_frame = s->iv_frame;
  180. s->ref_frame = s->iv_frame + 1;
  181. }
  182. buf_pos = buf + 16 + offs1;
  183. offs = bytestream_get_le32(&buf_pos);
  184. iv_Decode_Chunk(s, s->cur_frame->Ybuf, s->ref_frame->Ybuf, hdr_width,
  185. hdr_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  186. FFMIN(hdr_width, 160));
  187. if (!(s->avctx->flags & CODEC_FLAG_GRAY))
  188. {
  189. buf_pos = buf + 16 + offs2;
  190. offs = bytestream_get_le32(&buf_pos);
  191. iv_Decode_Chunk(s, s->cur_frame->Vbuf, s->ref_frame->Vbuf, chroma_width,
  192. chroma_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  193. FFMIN(chroma_width, 40));
  194. buf_pos = buf + 16 + offs3;
  195. offs = bytestream_get_le32(&buf_pos);
  196. iv_Decode_Chunk(s, s->cur_frame->Ubuf, s->ref_frame->Ubuf, chroma_width,
  197. chroma_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  198. FFMIN(chroma_width, 40));
  199. }
  200. return 8;
  201. }
  202. typedef struct {
  203. long xpos;
  204. long ypos;
  205. long width;
  206. long height;
  207. long split_flag;
  208. long split_direction;
  209. long usl7;
  210. } ustr_t;
  211. /* ---------------------------------------------------------------------- */
  212. #define LV1_CHECK(buf1,rle_v3,lv1,lp2) \
  213. if((lv1 & 0x80) != 0) { \
  214. if(rle_v3 != 0) \
  215. rle_v3 = 0; \
  216. else { \
  217. rle_v3 = 1; \
  218. buf1 -= 2; \
  219. } \
  220. } \
  221. lp2 = 4;
  222. #define RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3) \
  223. if(rle_v3 == 0) { \
  224. rle_v2 = *buf1; \
  225. rle_v1 = 1; \
  226. if(rle_v2 > 32) { \
  227. rle_v2 -= 32; \
  228. rle_v1 = 0; \
  229. } \
  230. rle_v3 = 1; \
  231. } \
  232. buf1--;
  233. #define LP2_CHECK(buf1,rle_v3,lp2) \
  234. if(lp2 == 0 && rle_v3 != 0) \
  235. rle_v3 = 0; \
  236. else { \
  237. buf1--; \
  238. rle_v3 = 1; \
  239. }
  240. #define RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2) \
  241. rle_v2--; \
  242. if(rle_v2 == 0) { \
  243. rle_v3 = 0; \
  244. buf1 += 2; \
  245. } \
  246. lp2 = 4;
  247. static void iv_Decode_Chunk(Indeo3DecodeContext *s,
  248. unsigned char *cur, unsigned char *ref, int width, int height,
  249. const unsigned char *buf1, long fflags2, const unsigned char *hdr,
  250. const unsigned char *buf2, int min_width_160)
  251. {
  252. unsigned char bit_buf;
  253. unsigned long bit_pos, lv, lv1, lv2;
  254. long *width_tbl, width_tbl_arr[10];
  255. const signed char *ref_vectors;
  256. unsigned char *cur_frm_pos, *ref_frm_pos, *cp, *cp2;
  257. uint32_t *cur_lp, *ref_lp;
  258. const uint32_t *correction_lp[2], *correctionloworder_lp[2], *correctionhighorder_lp[2];
  259. unsigned short *correction_type_sp[2];
  260. ustr_t strip_tbl[20], *strip;
  261. int i, j, k, lp1, lp2, flag1, cmd, blks_width, blks_height, region_160_width,
  262. rle_v1, rle_v2, rle_v3;
  263. unsigned short res;
  264. bit_buf = 0;
  265. ref_vectors = NULL;
  266. width_tbl = width_tbl_arr + 1;
  267. i = (width < 0 ? width + 3 : width)/4;
  268. for(j = -1; j < 8; j++)
  269. width_tbl[j] = i * j;
  270. strip = strip_tbl;
  271. for(region_160_width = 0; region_160_width < (width - min_width_160); region_160_width += min_width_160);
  272. strip->ypos = strip->xpos = 0;
  273. for(strip->width = min_width_160; width > strip->width; strip->width *= 2);
  274. strip->height = height;
  275. strip->split_direction = 0;
  276. strip->split_flag = 0;
  277. strip->usl7 = 0;
  278. bit_pos = 0;
  279. rle_v1 = rle_v2 = rle_v3 = 0;
  280. while(strip >= strip_tbl) {
  281. if(bit_pos <= 0) {
  282. bit_pos = 8;
  283. bit_buf = *buf1++;
  284. }
  285. bit_pos -= 2;
  286. cmd = (bit_buf >> bit_pos) & 0x03;
  287. if(cmd == 0) {
  288. strip++;
  289. memcpy(strip, strip-1, sizeof(ustr_t));
  290. strip->split_flag = 1;
  291. strip->split_direction = 0;
  292. strip->height = (strip->height > 8 ? ((strip->height+8)>>4)<<3 : 4);
  293. continue;
  294. } else if(cmd == 1) {
  295. strip++;
  296. memcpy(strip, strip-1, sizeof(ustr_t));
  297. strip->split_flag = 1;
  298. strip->split_direction = 1;
  299. strip->width = (strip->width > 8 ? ((strip->width+8)>>4)<<3 : 4);
  300. continue;
  301. } else if(cmd == 2) {
  302. if(strip->usl7 == 0) {
  303. strip->usl7 = 1;
  304. ref_vectors = NULL;
  305. continue;
  306. }
  307. } else if(cmd == 3) {
  308. if(strip->usl7 == 0) {
  309. strip->usl7 = 1;
  310. ref_vectors = (const signed char*)buf2 + (*buf1 * 2);
  311. buf1++;
  312. continue;
  313. }
  314. }
  315. cur_frm_pos = cur + width * strip->ypos + strip->xpos;
  316. if((blks_width = strip->width) < 0)
  317. blks_width += 3;
  318. blks_width >>= 2;
  319. blks_height = strip->height;
  320. if(ref_vectors != NULL) {
  321. ref_frm_pos = ref + (ref_vectors[0] + strip->ypos) * width +
  322. ref_vectors[1] + strip->xpos;
  323. } else
  324. ref_frm_pos = cur_frm_pos - width_tbl[4];
  325. if(cmd == 2) {
  326. if(bit_pos <= 0) {
  327. bit_pos = 8;
  328. bit_buf = *buf1++;
  329. }
  330. bit_pos -= 2;
  331. cmd = (bit_buf >> bit_pos) & 0x03;
  332. if(cmd == 0 || ref_vectors != NULL) {
  333. for(lp1 = 0; lp1 < blks_width; lp1++) {
  334. for(i = 0, j = 0; i < blks_height; i++, j += width_tbl[1])
  335. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)ref_frm_pos)[j];
  336. cur_frm_pos += 4;
  337. ref_frm_pos += 4;
  338. }
  339. } else if(cmd != 1)
  340. return;
  341. } else {
  342. k = *buf1 >> 4;
  343. j = *buf1 & 0x0f;
  344. buf1++;
  345. lv = j + fflags2;
  346. if((lv - 8) <= 7 && (k == 0 || k == 3 || k == 10)) {
  347. cp2 = s->ModPred + ((lv - 8) << 7);
  348. cp = ref_frm_pos;
  349. for(i = 0; i < blks_width << 2; i++) {
  350. int v = *cp >> 1;
  351. *(cp++) = cp2[v];
  352. }
  353. }
  354. if(k == 1 || k == 4) {
  355. lv = (hdr[j] & 0xf) + fflags2;
  356. correction_type_sp[0] = s->corrector_type + (lv << 8);
  357. correction_lp[0] = correction + (lv << 8);
  358. lv = (hdr[j] >> 4) + fflags2;
  359. correction_lp[1] = correction + (lv << 8);
  360. correction_type_sp[1] = s->corrector_type + (lv << 8);
  361. } else {
  362. correctionloworder_lp[0] = correctionloworder_lp[1] = correctionloworder + (lv << 8);
  363. correctionhighorder_lp[0] = correctionhighorder_lp[1] = correctionhighorder + (lv << 8);
  364. correction_type_sp[0] = correction_type_sp[1] = s->corrector_type + (lv << 8);
  365. correction_lp[0] = correction_lp[1] = correction + (lv << 8);
  366. }
  367. switch(k) {
  368. case 1:
  369. case 0: /********** CASE 0 **********/
  370. for( ; blks_height > 0; blks_height -= 4) {
  371. for(lp1 = 0; lp1 < blks_width; lp1++) {
  372. for(lp2 = 0; lp2 < 4; ) {
  373. k = *buf1++;
  374. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2];
  375. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2];
  376. switch(correction_type_sp[0][k]) {
  377. case 0:
  378. *cur_lp = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  379. lp2++;
  380. break;
  381. case 1:
  382. res = ((le2me_16(((unsigned short *)(ref_lp))[0]) >> 1) + correction_lp[lp2 & 0x01][*buf1]) << 1;
  383. ((unsigned short *)cur_lp)[0] = le2me_16(res);
  384. res = ((le2me_16(((unsigned short *)(ref_lp))[1]) >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  385. ((unsigned short *)cur_lp)[1] = le2me_16(res);
  386. buf1++;
  387. lp2++;
  388. break;
  389. case 2:
  390. if(lp2 == 0) {
  391. for(i = 0, j = 0; i < 2; i++, j += width_tbl[1])
  392. cur_lp[j] = ref_lp[j];
  393. lp2 += 2;
  394. }
  395. break;
  396. case 3:
  397. if(lp2 < 2) {
  398. for(i = 0, j = 0; i < (3 - lp2); i++, j += width_tbl[1])
  399. cur_lp[j] = ref_lp[j];
  400. lp2 = 3;
  401. }
  402. break;
  403. case 8:
  404. if(lp2 == 0) {
  405. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  406. if(rle_v1 == 1 || ref_vectors != NULL) {
  407. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  408. cur_lp[j] = ref_lp[j];
  409. }
  410. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  411. break;
  412. } else {
  413. rle_v1 = 1;
  414. rle_v2 = *buf1 - 1;
  415. }
  416. case 5:
  417. LP2_CHECK(buf1,rle_v3,lp2)
  418. case 4:
  419. for(i = 0, j = 0; i < (4 - lp2); i++, j += width_tbl[1])
  420. cur_lp[j] = ref_lp[j];
  421. lp2 = 4;
  422. break;
  423. case 7:
  424. if(rle_v3 != 0)
  425. rle_v3 = 0;
  426. else {
  427. buf1--;
  428. rle_v3 = 1;
  429. }
  430. case 6:
  431. if(ref_vectors != NULL) {
  432. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  433. cur_lp[j] = ref_lp[j];
  434. }
  435. lp2 = 4;
  436. break;
  437. case 9:
  438. lv1 = *buf1++;
  439. lv = (lv1 & 0x7F) << 1;
  440. lv += (lv << 8);
  441. lv += (lv << 16);
  442. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  443. cur_lp[j] = lv;
  444. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  445. break;
  446. default:
  447. return;
  448. }
  449. }
  450. cur_frm_pos += 4;
  451. ref_frm_pos += 4;
  452. }
  453. cur_frm_pos += ((width - blks_width) * 4);
  454. ref_frm_pos += ((width - blks_width) * 4);
  455. }
  456. break;
  457. case 4:
  458. case 3: /********** CASE 3 **********/
  459. if(ref_vectors != NULL)
  460. return;
  461. flag1 = 1;
  462. for( ; blks_height > 0; blks_height -= 8) {
  463. for(lp1 = 0; lp1 < blks_width; lp1++) {
  464. for(lp2 = 0; lp2 < 4; ) {
  465. k = *buf1++;
  466. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  467. ref_lp = ((uint32_t *)cur_frm_pos) + width_tbl[(lp2 * 2) - 1];
  468. switch(correction_type_sp[lp2 & 0x01][k]) {
  469. case 0:
  470. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  471. if(lp2 > 0 || flag1 == 0 || strip->ypos != 0)
  472. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  473. else
  474. cur_lp[0] = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  475. lp2++;
  476. break;
  477. case 1:
  478. res = ((le2me_16(((unsigned short *)ref_lp)[0]) >> 1) + correction_lp[lp2 & 0x01][*buf1]) << 1;
  479. ((unsigned short *)cur_lp)[width_tbl[2]] = le2me_16(res);
  480. res = ((le2me_16(((unsigned short *)ref_lp)[1]) >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  481. ((unsigned short *)cur_lp)[width_tbl[2]+1] = le2me_16(res);
  482. if(lp2 > 0 || flag1 == 0 || strip->ypos != 0)
  483. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  484. else
  485. cur_lp[0] = cur_lp[width_tbl[1]];
  486. buf1++;
  487. lp2++;
  488. break;
  489. case 2:
  490. if(lp2 == 0) {
  491. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  492. cur_lp[j] = *ref_lp;
  493. lp2 += 2;
  494. }
  495. break;
  496. case 3:
  497. if(lp2 < 2) {
  498. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1])
  499. cur_lp[j] = *ref_lp;
  500. lp2 = 3;
  501. }
  502. break;
  503. case 6:
  504. lp2 = 4;
  505. break;
  506. case 7:
  507. if(rle_v3 != 0)
  508. rle_v3 = 0;
  509. else {
  510. buf1--;
  511. rle_v3 = 1;
  512. }
  513. lp2 = 4;
  514. break;
  515. case 8:
  516. if(lp2 == 0) {
  517. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  518. if(rle_v1 == 1) {
  519. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  520. cur_lp[j] = ref_lp[j];
  521. }
  522. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  523. break;
  524. } else {
  525. rle_v2 = (*buf1) - 1;
  526. rle_v1 = 1;
  527. }
  528. case 5:
  529. LP2_CHECK(buf1,rle_v3,lp2)
  530. case 4:
  531. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1])
  532. cur_lp[j] = *ref_lp;
  533. lp2 = 4;
  534. break;
  535. case 9:
  536. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  537. lv1 = *buf1++;
  538. lv = (lv1 & 0x7F) << 1;
  539. lv += (lv << 8);
  540. lv += (lv << 16);
  541. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  542. cur_lp[j] = lv;
  543. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  544. break;
  545. default:
  546. return;
  547. }
  548. }
  549. cur_frm_pos += 4;
  550. }
  551. cur_frm_pos += (((width * 2) - blks_width) * 4);
  552. flag1 = 0;
  553. }
  554. break;
  555. case 10: /********** CASE 10 **********/
  556. if(ref_vectors == NULL) {
  557. flag1 = 1;
  558. for( ; blks_height > 0; blks_height -= 8) {
  559. for(lp1 = 0; lp1 < blks_width; lp1 += 2) {
  560. for(lp2 = 0; lp2 < 4; ) {
  561. k = *buf1++;
  562. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  563. ref_lp = ((uint32_t *)cur_frm_pos) + width_tbl[(lp2 * 2) - 1];
  564. lv1 = ref_lp[0];
  565. lv2 = ref_lp[1];
  566. if(lp2 == 0 && flag1 != 0) {
  567. #ifdef WORDS_BIGENDIAN
  568. lv1 = lv1 & 0xFF00FF00;
  569. lv1 = (lv1 >> 8) | lv1;
  570. lv2 = lv2 & 0xFF00FF00;
  571. lv2 = (lv2 >> 8) | lv2;
  572. #else
  573. lv1 = lv1 & 0x00FF00FF;
  574. lv1 = (lv1 << 8) | lv1;
  575. lv2 = lv2 & 0x00FF00FF;
  576. lv2 = (lv2 << 8) | lv2;
  577. #endif
  578. }
  579. switch(correction_type_sp[lp2 & 0x01][k]) {
  580. case 0:
  581. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(lv1) >> 1) + correctionloworder_lp[lp2 & 0x01][k]) << 1);
  582. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(lv2) >> 1) + correctionhighorder_lp[lp2 & 0x01][k]) << 1);
  583. if(lp2 > 0 || strip->ypos != 0 || flag1 == 0) {
  584. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  585. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  586. } else {
  587. cur_lp[0] = cur_lp[width_tbl[1]];
  588. cur_lp[1] = cur_lp[width_tbl[1]+1];
  589. }
  590. lp2++;
  591. break;
  592. case 1:
  593. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(lv1) >> 1) + correctionloworder_lp[lp2 & 0x01][*buf1]) << 1);
  594. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(lv2) >> 1) + correctionloworder_lp[lp2 & 0x01][k]) << 1);
  595. if(lp2 > 0 || strip->ypos != 0 || flag1 == 0) {
  596. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  597. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  598. } else {
  599. cur_lp[0] = cur_lp[width_tbl[1]];
  600. cur_lp[1] = cur_lp[width_tbl[1]+1];
  601. }
  602. buf1++;
  603. lp2++;
  604. break;
  605. case 2:
  606. if(lp2 == 0) {
  607. if(flag1 != 0) {
  608. for(i = 0, j = width_tbl[1]; i < 3; i++, j += width_tbl[1]) {
  609. cur_lp[j] = lv1;
  610. cur_lp[j+1] = lv2;
  611. }
  612. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  613. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  614. } else {
  615. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1]) {
  616. cur_lp[j] = lv1;
  617. cur_lp[j+1] = lv2;
  618. }
  619. }
  620. lp2 += 2;
  621. }
  622. break;
  623. case 3:
  624. if(lp2 < 2) {
  625. if(lp2 == 0 && flag1 != 0) {
  626. for(i = 0, j = width_tbl[1]; i < 5; i++, j += width_tbl[1]) {
  627. cur_lp[j] = lv1;
  628. cur_lp[j+1] = lv2;
  629. }
  630. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  631. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  632. } else {
  633. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1]) {
  634. cur_lp[j] = lv1;
  635. cur_lp[j+1] = lv2;
  636. }
  637. }
  638. lp2 = 3;
  639. }
  640. break;
  641. case 8:
  642. if(lp2 == 0) {
  643. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  644. if(rle_v1 == 1) {
  645. if(flag1 != 0) {
  646. for(i = 0, j = width_tbl[1]; i < 7; i++, j += width_tbl[1]) {
  647. cur_lp[j] = lv1;
  648. cur_lp[j+1] = lv2;
  649. }
  650. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  651. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  652. } else {
  653. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1]) {
  654. cur_lp[j] = lv1;
  655. cur_lp[j+1] = lv2;
  656. }
  657. }
  658. }
  659. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  660. break;
  661. } else {
  662. rle_v1 = 1;
  663. rle_v2 = (*buf1) - 1;
  664. }
  665. case 5:
  666. LP2_CHECK(buf1,rle_v3,lp2)
  667. case 4:
  668. if(lp2 == 0 && flag1 != 0) {
  669. for(i = 0, j = width_tbl[1]; i < 7; i++, j += width_tbl[1]) {
  670. cur_lp[j] = lv1;
  671. cur_lp[j+1] = lv2;
  672. }
  673. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  674. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  675. } else {
  676. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1]) {
  677. cur_lp[j] = lv1;
  678. cur_lp[j+1] = lv2;
  679. }
  680. }
  681. lp2 = 4;
  682. break;
  683. case 6:
  684. lp2 = 4;
  685. break;
  686. case 7:
  687. if(lp2 == 0) {
  688. if(rle_v3 != 0)
  689. rle_v3 = 0;
  690. else {
  691. buf1--;
  692. rle_v3 = 1;
  693. }
  694. lp2 = 4;
  695. }
  696. break;
  697. case 9:
  698. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  699. lv1 = *buf1;
  700. lv = (lv1 & 0x7F) << 1;
  701. lv += (lv << 8);
  702. lv += (lv << 16);
  703. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  704. cur_lp[j] = lv;
  705. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  706. break;
  707. default:
  708. return;
  709. }
  710. }
  711. cur_frm_pos += 8;
  712. }
  713. cur_frm_pos += (((width * 2) - blks_width) * 4);
  714. flag1 = 0;
  715. }
  716. } else {
  717. for( ; blks_height > 0; blks_height -= 8) {
  718. for(lp1 = 0; lp1 < blks_width; lp1 += 2) {
  719. for(lp2 = 0; lp2 < 4; ) {
  720. k = *buf1++;
  721. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  722. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2 * 2];
  723. switch(correction_type_sp[lp2 & 0x01][k]) {
  724. case 0:
  725. lv1 = correctionloworder_lp[lp2 & 0x01][k];
  726. lv2 = correctionhighorder_lp[lp2 & 0x01][k];
  727. cur_lp[0] = le2me_32(((le2me_32(ref_lp[0]) >> 1) + lv1) << 1);
  728. cur_lp[1] = le2me_32(((le2me_32(ref_lp[1]) >> 1) + lv2) << 1);
  729. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(ref_lp[width_tbl[1]]) >> 1) + lv1) << 1);
  730. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(ref_lp[width_tbl[1]+1]) >> 1) + lv2) << 1);
  731. lp2++;
  732. break;
  733. case 1:
  734. lv1 = correctionloworder_lp[lp2 & 0x01][*buf1++];
  735. lv2 = correctionloworder_lp[lp2 & 0x01][k];
  736. cur_lp[0] = le2me_32(((le2me_32(ref_lp[0]) >> 1) + lv1) << 1);
  737. cur_lp[1] = le2me_32(((le2me_32(ref_lp[1]) >> 1) + lv2) << 1);
  738. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(ref_lp[width_tbl[1]]) >> 1) + lv1) << 1);
  739. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(ref_lp[width_tbl[1]+1]) >> 1) + lv2) << 1);
  740. lp2++;
  741. break;
  742. case 2:
  743. if(lp2 == 0) {
  744. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1]) {
  745. cur_lp[j] = ref_lp[j];
  746. cur_lp[j+1] = ref_lp[j+1];
  747. }
  748. lp2 += 2;
  749. }
  750. break;
  751. case 3:
  752. if(lp2 < 2) {
  753. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1]) {
  754. cur_lp[j] = ref_lp[j];
  755. cur_lp[j+1] = ref_lp[j+1];
  756. }
  757. lp2 = 3;
  758. }
  759. break;
  760. case 8:
  761. if(lp2 == 0) {
  762. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  763. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1]) {
  764. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)ref_frm_pos)[j];
  765. ((uint32_t *)cur_frm_pos)[j+1] = ((uint32_t *)ref_frm_pos)[j+1];
  766. }
  767. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  768. break;
  769. } else {
  770. rle_v1 = 1;
  771. rle_v2 = (*buf1) - 1;
  772. }
  773. case 5:
  774. case 7:
  775. LP2_CHECK(buf1,rle_v3,lp2)
  776. case 6:
  777. case 4:
  778. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1]) {
  779. cur_lp[j] = ref_lp[j];
  780. cur_lp[j+1] = ref_lp[j+1];
  781. }
  782. lp2 = 4;
  783. break;
  784. case 9:
  785. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  786. lv1 = *buf1;
  787. lv = (lv1 & 0x7F) << 1;
  788. lv += (lv << 8);
  789. lv += (lv << 16);
  790. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  791. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)cur_frm_pos)[j+1] = lv;
  792. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  793. break;
  794. default:
  795. return;
  796. }
  797. }
  798. cur_frm_pos += 8;
  799. ref_frm_pos += 8;
  800. }
  801. cur_frm_pos += (((width * 2) - blks_width) * 4);
  802. ref_frm_pos += (((width * 2) - blks_width) * 4);
  803. }
  804. }
  805. break;
  806. case 11: /********** CASE 11 **********/
  807. if(ref_vectors == NULL)
  808. return;
  809. for( ; blks_height > 0; blks_height -= 8) {
  810. for(lp1 = 0; lp1 < blks_width; lp1++) {
  811. for(lp2 = 0; lp2 < 4; ) {
  812. k = *buf1++;
  813. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  814. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2 * 2];
  815. switch(correction_type_sp[lp2 & 0x01][k]) {
  816. case 0:
  817. cur_lp[0] = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  818. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(ref_lp[width_tbl[1]]) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  819. lp2++;
  820. break;
  821. case 1:
  822. lv1 = (unsigned short)(correction_lp[lp2 & 0x01][*buf1++]);
  823. lv2 = (unsigned short)(correction_lp[lp2 & 0x01][k]);
  824. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[0]) >> 1) + lv1) << 1);
  825. ((unsigned short *)cur_lp)[0] = le2me_16(res);
  826. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[1]) >> 1) + lv2) << 1);
  827. ((unsigned short *)cur_lp)[1] = le2me_16(res);
  828. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[width_tbl[2]]) >> 1) + lv1) << 1);
  829. ((unsigned short *)cur_lp)[width_tbl[2]] = le2me_16(res);
  830. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[width_tbl[2]+1]) >> 1) + lv2) << 1);
  831. ((unsigned short *)cur_lp)[width_tbl[2]+1] = le2me_16(res);
  832. lp2++;
  833. break;
  834. case 2:
  835. if(lp2 == 0) {
  836. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  837. cur_lp[j] = ref_lp[j];
  838. lp2 += 2;
  839. }
  840. break;
  841. case 3:
  842. if(lp2 < 2) {
  843. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1])
  844. cur_lp[j] = ref_lp[j];
  845. lp2 = 3;
  846. }
  847. break;
  848. case 8:
  849. if(lp2 == 0) {
  850. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  851. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  852. cur_lp[j] = ref_lp[j];
  853. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  854. break;
  855. } else {
  856. rle_v1 = 1;
  857. rle_v2 = (*buf1) - 1;
  858. }
  859. case 5:
  860. case 7:
  861. LP2_CHECK(buf1,rle_v3,lp2)
  862. case 4:
  863. case 6:
  864. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1])
  865. cur_lp[j] = ref_lp[j];
  866. lp2 = 4;
  867. break;
  868. case 9:
  869. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  870. lv1 = *buf1++;
  871. lv = (lv1 & 0x7F) << 1;
  872. lv += (lv << 8);
  873. lv += (lv << 16);
  874. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  875. cur_lp[j] = lv;
  876. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  877. break;
  878. default:
  879. return;
  880. }
  881. }
  882. cur_frm_pos += 4;
  883. ref_frm_pos += 4;
  884. }
  885. cur_frm_pos += (((width * 2) - blks_width) * 4);
  886. ref_frm_pos += (((width * 2) - blks_width) * 4);
  887. }
  888. break;
  889. default:
  890. return;
  891. }
  892. }
  893. if(strip < strip_tbl)
  894. return;
  895. for( ; strip >= strip_tbl; strip--) {
  896. if(strip->split_flag != 0) {
  897. strip->split_flag = 0;
  898. strip->usl7 = (strip-1)->usl7;
  899. if(strip->split_direction) {
  900. strip->xpos += strip->width;
  901. strip->width = (strip-1)->width - strip->width;
  902. if(region_160_width <= strip->xpos && width < strip->width + strip->xpos)
  903. strip->width = width - strip->xpos;
  904. } else {
  905. strip->ypos += strip->height;
  906. strip->height = (strip-1)->height - strip->height;
  907. }
  908. break;
  909. }
  910. }
  911. }
  912. }
  913. static av_cold int indeo3_decode_init(AVCodecContext *avctx)
  914. {
  915. Indeo3DecodeContext *s = avctx->priv_data;
  916. s->avctx = avctx;
  917. s->width = avctx->width;
  918. s->height = avctx->height;
  919. avctx->pix_fmt = PIX_FMT_YUV410P;
  920. build_modpred(s);
  921. iv_alloc_frames(s);
  922. return 0;
  923. }
  924. static int indeo3_decode_frame(AVCodecContext *avctx,
  925. void *data, int *data_size,
  926. const unsigned char *buf, int buf_size)
  927. {
  928. Indeo3DecodeContext *s=avctx->priv_data;
  929. unsigned char *src, *dest;
  930. int y;
  931. iv_decode_frame(s, buf, buf_size);
  932. if(s->frame.data[0])
  933. avctx->release_buffer(avctx, &s->frame);
  934. s->frame.reference = 0;
  935. if(avctx->get_buffer(avctx, &s->frame) < 0) {
  936. av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  937. return -1;
  938. }
  939. src = s->cur_frame->Ybuf;
  940. dest = s->frame.data[0];
  941. for (y = 0; y < s->height; y++) {
  942. memcpy(dest, src, s->cur_frame->y_w);
  943. src += s->cur_frame->y_w;
  944. dest += s->frame.linesize[0];
  945. }
  946. if (!(s->avctx->flags & CODEC_FLAG_GRAY))
  947. {
  948. src = s->cur_frame->Ubuf;
  949. dest = s->frame.data[1];
  950. for (y = 0; y < s->height / 4; y++) {
  951. memcpy(dest, src, s->cur_frame->uv_w);
  952. src += s->cur_frame->uv_w;
  953. dest += s->frame.linesize[1];
  954. }
  955. src = s->cur_frame->Vbuf;
  956. dest = s->frame.data[2];
  957. for (y = 0; y < s->height / 4; y++) {
  958. memcpy(dest, src, s->cur_frame->uv_w);
  959. src += s->cur_frame->uv_w;
  960. dest += s->frame.linesize[2];
  961. }
  962. }
  963. *data_size=sizeof(AVFrame);
  964. *(AVFrame*)data= s->frame;
  965. return buf_size;
  966. }
  967. static av_cold int indeo3_decode_end(AVCodecContext *avctx)
  968. {
  969. Indeo3DecodeContext *s = avctx->priv_data;
  970. iv_free_func(s);
  971. return 0;
  972. }
  973. AVCodec indeo3_decoder = {
  974. "indeo3",
  975. CODEC_TYPE_VIDEO,
  976. CODEC_ID_INDEO3,
  977. sizeof(Indeo3DecodeContext),
  978. indeo3_decode_init,
  979. NULL,
  980. indeo3_decode_end,
  981. indeo3_decode_frame,
  982. 0,
  983. NULL
  984. };