You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

1152 lines
39KB

  1. /*
  2. * Intel Indeo 3 (IV31, IV32, etc.) video decoder for ffmpeg
  3. * written, produced, and directed by Alan Smithee
  4. *
  5. * This library is free software; you can redistribute it and/or
  6. * modify it under the terms of the GNU Lesser General Public
  7. * License as published by the Free Software Foundation; either
  8. * version 2 of the License, or (at your option) any later version.
  9. *
  10. * This library is distributed in the hope that it will be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  13. * Lesser General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU Lesser General Public
  16. * License along with this library; if not, write to the Free Software
  17. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  18. */
  19. #include <stdio.h>
  20. #include <stdlib.h>
  21. #include <string.h>
  22. #include <unistd.h>
  23. #include "common.h"
  24. #include "avcodec.h"
  25. #include "dsputil.h"
  26. #include "mpegvideo.h"
  27. #include "indeo3data.h"
  28. typedef struct
  29. {
  30. unsigned char *Ybuf;
  31. unsigned char *Ubuf;
  32. unsigned char *Vbuf;
  33. unsigned char *the_buf;
  34. unsigned int the_buf_size;
  35. unsigned short y_w, y_h;
  36. unsigned short uv_w, uv_h;
  37. } YUVBufs;
  38. typedef struct Indeo3DecodeContext {
  39. AVCodecContext *avctx;
  40. int width, height;
  41. AVFrame frame;
  42. YUVBufs iv_frame[2];
  43. YUVBufs *cur_frame;
  44. YUVBufs *ref_frame;
  45. unsigned char *ModPred;
  46. unsigned short *corrector_type;
  47. } Indeo3DecodeContext;
  48. static int corrector_type_0[24] = {
  49. 195, 159, 133, 115, 101, 93, 87, 77,
  50. 195, 159, 133, 115, 101, 93, 87, 77,
  51. 128, 79, 79, 79, 79, 79, 79, 79
  52. };
  53. static int corrector_type_2[8] = { 9, 7, 6, 8, 5, 4, 3, 2 };
  54. static void build_modpred(Indeo3DecodeContext *s)
  55. {
  56. int i, j;
  57. s->ModPred = (unsigned char *) av_malloc (8 * 128);
  58. for (i=0; i < 128; ++i) {
  59. s->ModPred[i+0*128] = (i > 126) ? 254 : 2*((i + 1) - ((i + 1) % 2));
  60. s->ModPred[i+1*128] = (i == 7) ? 20 : ((i == 119 || i == 120)
  61. ? 236 : 2*((i + 2) - ((i + 1) % 3)));
  62. s->ModPred[i+2*128] = (i > 125) ? 248 : 2*((i + 2) - ((i + 2) % 4));
  63. s->ModPred[i+3*128] = 2*((i + 1) - ((i - 3) % 5));
  64. s->ModPred[i+4*128] = (i == 8) ? 20 : 2*((i + 1) - ((i - 3) % 6));
  65. s->ModPred[i+5*128] = 2*((i + 4) - ((i + 3) % 7));
  66. s->ModPred[i+6*128] = (i > 123) ? 240 : 2*((i + 4) - ((i + 4) % 8));
  67. s->ModPred[i+7*128] = 2*((i + 5) - ((i + 4) % 9));
  68. }
  69. s->corrector_type = (unsigned short *) av_malloc (24 * 256 * sizeof(unsigned short));
  70. for (i=0; i < 24; ++i) {
  71. for (j=0; j < 256; ++j) {
  72. s->corrector_type[i*256+j] = (j < corrector_type_0[i])
  73. ? 1 : ((j < 248 || (i == 16 && j == 248))
  74. ? 0 : corrector_type_2[j - 248]);
  75. }
  76. }
  77. }
  78. static void iv_Decode_Chunk(Indeo3DecodeContext *s, unsigned char *cur,
  79. unsigned char *ref, int width, int height, unsigned char *buf1,
  80. long fflags2, unsigned char *hdr,
  81. unsigned char *buf2, int min_width_160);
  82. #ifndef min
  83. #define min(a,b) ((a) < (b) ? (a) : (b))
  84. #endif
  85. /* ---------------------------------------------------------------------- */
  86. static void iv_alloc_frames(Indeo3DecodeContext *s)
  87. {
  88. int luma_width, luma_height, luma_pixels, chroma_width, chroma_height,
  89. chroma_pixels, i;
  90. unsigned int bufsize;
  91. luma_width = (s->width + 3) & (~3);
  92. luma_height = (s->height + 3) & (~3);
  93. s->iv_frame[0].y_w = s->iv_frame[0].y_h =
  94. s->iv_frame[0].the_buf_size = 0;
  95. s->iv_frame[1].y_w = s->iv_frame[1].y_h =
  96. s->iv_frame[1].the_buf_size = 0;
  97. s->iv_frame[1].the_buf = NULL;
  98. chroma_width = ((luma_width >> 2) + 3) & (~3);
  99. chroma_height = ((luma_height>> 2) + 3) & (~3);
  100. luma_pixels = luma_width * luma_height;
  101. chroma_pixels = chroma_width * chroma_height;
  102. bufsize = luma_pixels * 2 + luma_width * 3 +
  103. (chroma_pixels + chroma_width) * 4;
  104. if((s->iv_frame[0].the_buf =
  105. (s->iv_frame[0].the_buf_size == 0 ? av_malloc(bufsize) :
  106. av_realloc(s->iv_frame[0].the_buf, bufsize))) == NULL)
  107. return;
  108. s->iv_frame[0].y_w = s->iv_frame[1].y_w = luma_width;
  109. s->iv_frame[0].y_h = s->iv_frame[1].y_h = luma_height;
  110. s->iv_frame[0].uv_w = s->iv_frame[1].uv_w = chroma_width;
  111. s->iv_frame[0].uv_h = s->iv_frame[1].uv_h = chroma_height;
  112. s->iv_frame[0].the_buf_size = bufsize;
  113. s->iv_frame[0].Ybuf = s->iv_frame[0].the_buf + luma_width;
  114. i = luma_pixels + luma_width * 2;
  115. s->iv_frame[1].Ybuf = s->iv_frame[0].the_buf + i;
  116. i += (luma_pixels + luma_width);
  117. s->iv_frame[0].Ubuf = s->iv_frame[0].the_buf + i;
  118. i += (chroma_pixels + chroma_width);
  119. s->iv_frame[1].Ubuf = s->iv_frame[0].the_buf + i;
  120. i += (chroma_pixels + chroma_width);
  121. s->iv_frame[0].Vbuf = s->iv_frame[0].the_buf + i;
  122. i += (chroma_pixels + chroma_width);
  123. s->iv_frame[1].Vbuf = s->iv_frame[0].the_buf + i;
  124. for(i = 1; i <= luma_width; i++)
  125. s->iv_frame[0].Ybuf[-i] = s->iv_frame[1].Ybuf[-i] =
  126. s->iv_frame[0].Ubuf[-i] = 0x80;
  127. for(i = 1; i <= chroma_width; i++) {
  128. s->iv_frame[1].Ubuf[-i] = 0x80;
  129. s->iv_frame[0].Vbuf[-i] = 0x80;
  130. s->iv_frame[1].Vbuf[-i] = 0x80;
  131. s->iv_frame[1].Vbuf[chroma_pixels+i-1] = 0x80;
  132. }
  133. }
  134. /* ---------------------------------------------------------------------- */
  135. static void iv_free_func(Indeo3DecodeContext *s)
  136. {
  137. int i;
  138. for(i = 0 ; i < 2 ; i++) {
  139. if(s->iv_frame[i].the_buf != NULL)
  140. av_free(s->iv_frame[i].the_buf);
  141. s->iv_frame[i].Ybuf = s->iv_frame[i].Ubuf =
  142. s->iv_frame[i].Vbuf = NULL;
  143. s->iv_frame[i].the_buf = NULL;
  144. s->iv_frame[i].the_buf_size = 0;
  145. s->iv_frame[i].y_w = s->iv_frame[i].y_h = 0;
  146. s->iv_frame[i].uv_w = s->iv_frame[i].uv_h = 0;
  147. }
  148. av_free(s->ModPred);
  149. av_free(s->corrector_type);
  150. }
  151. /* ---------------------------------------------------------------------- */
  152. static unsigned long iv_decode_frame(Indeo3DecodeContext *s,
  153. unsigned char *buf, int buf_size)
  154. {
  155. unsigned int hdr_width, hdr_height,
  156. chroma_width, chroma_height;
  157. unsigned long fflags1, fflags2, fflags3, offs1, offs2, offs3, offs;
  158. unsigned char *hdr_pos, *buf_pos;
  159. buf_pos = buf;
  160. buf_pos += 18;
  161. fflags1 = le2me_16(*(uint16_t *)buf_pos);
  162. buf_pos += 2;
  163. fflags3 = le2me_32(*(uint32_t *)buf_pos);
  164. buf_pos += 4;
  165. fflags2 = *buf_pos++;
  166. buf_pos += 3;
  167. hdr_height = le2me_16(*(uint16_t *)buf_pos);
  168. buf_pos += 2;
  169. hdr_width = le2me_16(*(uint16_t *)buf_pos);
  170. if(avcodec_check_dimensions(NULL, hdr_width, hdr_height))
  171. return -1;
  172. buf_pos += 2;
  173. chroma_height = ((hdr_height >> 2) + 3) & 0x7ffc;
  174. chroma_width = ((hdr_width >> 2) + 3) & 0x7ffc;
  175. offs1 = le2me_32(*(uint32_t *)buf_pos);
  176. buf_pos += 4;
  177. offs2 = le2me_32(*(uint32_t *)buf_pos);
  178. buf_pos += 4;
  179. offs3 = le2me_32(*(uint32_t *)buf_pos);
  180. buf_pos += 8;
  181. hdr_pos = buf_pos;
  182. if(fflags3 == 0x80) return 4;
  183. if(fflags1 & 0x200) {
  184. s->cur_frame = s->iv_frame + 1;
  185. s->ref_frame = s->iv_frame;
  186. } else {
  187. s->cur_frame = s->iv_frame;
  188. s->ref_frame = s->iv_frame + 1;
  189. }
  190. buf_pos = buf + 16 + offs1;
  191. offs = le2me_32(*(uint32_t *)buf_pos);
  192. buf_pos += 4;
  193. iv_Decode_Chunk(s, s->cur_frame->Ybuf, s->ref_frame->Ybuf, hdr_width,
  194. hdr_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  195. min(hdr_width, 160));
  196. if (!(s->avctx->flags & CODEC_FLAG_GRAY))
  197. {
  198. buf_pos = buf + 16 + offs2;
  199. offs = le2me_32(*(uint32_t *)buf_pos);
  200. buf_pos += 4;
  201. iv_Decode_Chunk(s, s->cur_frame->Vbuf, s->ref_frame->Vbuf, chroma_width,
  202. chroma_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  203. min(chroma_width, 40));
  204. buf_pos = buf + 16 + offs3;
  205. offs = le2me_32(*(uint32_t *)buf_pos);
  206. buf_pos += 4;
  207. iv_Decode_Chunk(s, s->cur_frame->Ubuf, s->ref_frame->Ubuf, chroma_width,
  208. chroma_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  209. min(chroma_width, 40));
  210. }
  211. return 8;
  212. }
  213. typedef struct {
  214. long xpos;
  215. long ypos;
  216. long width;
  217. long height;
  218. long split_flag;
  219. long split_direction;
  220. long usl7;
  221. } ustr_t;
  222. /* ---------------------------------------------------------------------- */
  223. #define LV1_CHECK(buf1,rle_v3,lv1,lp2) \
  224. if((lv1 & 0x80) != 0) { \
  225. if(rle_v3 != 0) \
  226. rle_v3 = 0; \
  227. else { \
  228. rle_v3 = 1; \
  229. buf1 -= 2; \
  230. } \
  231. } \
  232. lp2 = 4;
  233. #define RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3) \
  234. if(rle_v3 == 0) { \
  235. rle_v2 = *buf1; \
  236. rle_v1 = 1; \
  237. if(rle_v2 > 32) { \
  238. rle_v2 -= 32; \
  239. rle_v1 = 0; \
  240. } \
  241. rle_v3 = 1; \
  242. } \
  243. buf1--;
  244. #define LP2_CHECK(buf1,rle_v3,lp2) \
  245. if(lp2 == 0 && rle_v3 != 0) \
  246. rle_v3 = 0; \
  247. else { \
  248. buf1--; \
  249. rle_v3 = 1; \
  250. }
  251. #define RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2) \
  252. rle_v2--; \
  253. if(rle_v2 == 0) { \
  254. rle_v3 = 0; \
  255. buf1 += 2; \
  256. } \
  257. lp2 = 4;
  258. static void iv_Decode_Chunk(Indeo3DecodeContext *s,
  259. unsigned char *cur, unsigned char *ref, int width, int height,
  260. unsigned char *buf1, long fflags2, unsigned char *hdr,
  261. unsigned char *buf2, int min_width_160)
  262. {
  263. unsigned char bit_buf;
  264. unsigned long bit_pos, lv, lv1, lv2;
  265. long *width_tbl, width_tbl_arr[10];
  266. signed char *ref_vectors;
  267. unsigned char *cur_frm_pos, *ref_frm_pos, *cp, *cp2;
  268. uint32_t *cur_lp, *ref_lp;
  269. const uint32_t *correction_lp[2], *correctionloworder_lp[2], *correctionhighorder_lp[2];
  270. unsigned short *correction_type_sp[2];
  271. ustr_t strip_tbl[20], *strip;
  272. int i, j, k, lp1, lp2, flag1, cmd, blks_width, blks_height, region_160_width,
  273. rle_v1, rle_v2, rle_v3;
  274. unsigned short res;
  275. bit_buf = 0;
  276. ref_vectors = NULL;
  277. width_tbl = width_tbl_arr + 1;
  278. i = (width < 0 ? width + 3 : width)/4;
  279. for(j = -1; j < 8; j++)
  280. width_tbl[j] = i * j;
  281. strip = strip_tbl;
  282. for(region_160_width = 0; region_160_width < (width - min_width_160); region_160_width += min_width_160);
  283. strip->ypos = strip->xpos = 0;
  284. for(strip->width = min_width_160; width > strip->width; strip->width *= 2);
  285. strip->height = height;
  286. strip->split_direction = 0;
  287. strip->split_flag = 0;
  288. strip->usl7 = 0;
  289. bit_pos = 0;
  290. rle_v1 = rle_v2 = rle_v3 = 0;
  291. while(strip >= strip_tbl) {
  292. if(bit_pos <= 0) {
  293. bit_pos = 8;
  294. bit_buf = *buf1++;
  295. }
  296. bit_pos -= 2;
  297. cmd = (bit_buf >> bit_pos) & 0x03;
  298. if(cmd == 0) {
  299. strip++;
  300. memcpy(strip, strip-1, sizeof(ustr_t));
  301. strip->split_flag = 1;
  302. strip->split_direction = 0;
  303. strip->height = (strip->height > 8 ? ((strip->height+8)>>4)<<3 : 4);
  304. continue;
  305. } else if(cmd == 1) {
  306. strip++;
  307. memcpy(strip, strip-1, sizeof(ustr_t));
  308. strip->split_flag = 1;
  309. strip->split_direction = 1;
  310. strip->width = (strip->width > 8 ? ((strip->width+8)>>4)<<3 : 4);
  311. continue;
  312. } else if(cmd == 2) {
  313. if(strip->usl7 == 0) {
  314. strip->usl7 = 1;
  315. ref_vectors = NULL;
  316. continue;
  317. }
  318. } else if(cmd == 3) {
  319. if(strip->usl7 == 0) {
  320. strip->usl7 = 1;
  321. ref_vectors = buf2 + (*buf1 * 2);
  322. buf1++;
  323. continue;
  324. }
  325. }
  326. cur_frm_pos = cur + width * strip->ypos + strip->xpos;
  327. if((blks_width = strip->width) < 0)
  328. blks_width += 3;
  329. blks_width >>= 2;
  330. blks_height = strip->height;
  331. if(ref_vectors != NULL) {
  332. ref_frm_pos = ref + (ref_vectors[0] + strip->ypos) * width +
  333. ref_vectors[1] + strip->xpos;
  334. } else
  335. ref_frm_pos = cur_frm_pos - width_tbl[4];
  336. if(cmd == 2) {
  337. if(bit_pos <= 0) {
  338. bit_pos = 8;
  339. bit_buf = *buf1++;
  340. }
  341. bit_pos -= 2;
  342. cmd = (bit_buf >> bit_pos) & 0x03;
  343. if(cmd == 0 || ref_vectors != NULL) {
  344. for(lp1 = 0; lp1 < blks_width; lp1++) {
  345. for(i = 0, j = 0; i < blks_height; i++, j += width_tbl[1])
  346. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)ref_frm_pos)[j];
  347. cur_frm_pos += 4;
  348. ref_frm_pos += 4;
  349. }
  350. } else if(cmd != 1)
  351. return;
  352. } else {
  353. k = *buf1 >> 4;
  354. j = *buf1 & 0x0f;
  355. buf1++;
  356. lv = j + fflags2;
  357. if((lv - 8) <= 7 && (k == 0 || k == 3 || k == 10)) {
  358. cp2 = s->ModPred + ((lv - 8) << 7);
  359. cp = ref_frm_pos;
  360. for(i = 0; i < blks_width << 2; i++) {
  361. int v = *cp >> 1;
  362. *(cp++) = cp2[v];
  363. }
  364. }
  365. if(k == 1 || k == 4) {
  366. lv = (hdr[j] & 0xf) + fflags2;
  367. correction_type_sp[0] = s->corrector_type + (lv << 8);
  368. correction_lp[0] = correction + (lv << 8);
  369. lv = (hdr[j] >> 4) + fflags2;
  370. correction_lp[1] = correction + (lv << 8);
  371. correction_type_sp[1] = s->corrector_type + (lv << 8);
  372. } else {
  373. correctionloworder_lp[0] = correctionloworder_lp[1] = correctionloworder + (lv << 8);
  374. correctionhighorder_lp[0] = correctionhighorder_lp[1] = correctionhighorder + (lv << 8);
  375. correction_type_sp[0] = correction_type_sp[1] = s->corrector_type + (lv << 8);
  376. correction_lp[0] = correction_lp[1] = correction + (lv << 8);
  377. }
  378. switch(k) {
  379. case 1:
  380. case 0: /********** CASE 0 **********/
  381. for( ; blks_height > 0; blks_height -= 4) {
  382. for(lp1 = 0; lp1 < blks_width; lp1++) {
  383. for(lp2 = 0; lp2 < 4; ) {
  384. k = *buf1++;
  385. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2];
  386. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2];
  387. switch(correction_type_sp[0][k]) {
  388. case 0:
  389. *cur_lp = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  390. lp2++;
  391. break;
  392. case 1:
  393. res = ((le2me_16(((unsigned short *)(ref_lp))[0]) >> 1) + correction_lp[lp2 & 0x01][*buf1]) << 1;
  394. ((unsigned short *)cur_lp)[0] = le2me_16(res);
  395. res = ((le2me_16(((unsigned short *)(ref_lp))[1]) >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  396. ((unsigned short *)cur_lp)[1] = le2me_16(res);
  397. buf1++;
  398. lp2++;
  399. break;
  400. case 2:
  401. if(lp2 == 0) {
  402. for(i = 0, j = 0; i < 2; i++, j += width_tbl[1])
  403. cur_lp[j] = ref_lp[j];
  404. lp2 += 2;
  405. }
  406. break;
  407. case 3:
  408. if(lp2 < 2) {
  409. for(i = 0, j = 0; i < (3 - lp2); i++, j += width_tbl[1])
  410. cur_lp[j] = ref_lp[j];
  411. lp2 = 3;
  412. }
  413. break;
  414. case 8:
  415. if(lp2 == 0) {
  416. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  417. if(rle_v1 == 1 || ref_vectors != NULL) {
  418. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  419. cur_lp[j] = ref_lp[j];
  420. }
  421. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  422. break;
  423. } else {
  424. rle_v1 = 1;
  425. rle_v2 = *buf1 - 1;
  426. }
  427. case 5:
  428. LP2_CHECK(buf1,rle_v3,lp2)
  429. case 4:
  430. for(i = 0, j = 0; i < (4 - lp2); i++, j += width_tbl[1])
  431. cur_lp[j] = ref_lp[j];
  432. lp2 = 4;
  433. break;
  434. case 7:
  435. if(rle_v3 != 0)
  436. rle_v3 = 0;
  437. else {
  438. buf1--;
  439. rle_v3 = 1;
  440. }
  441. case 6:
  442. if(ref_vectors != NULL) {
  443. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  444. cur_lp[j] = ref_lp[j];
  445. }
  446. lp2 = 4;
  447. break;
  448. case 9:
  449. lv1 = *buf1++;
  450. lv = (lv1 & 0x7F) << 1;
  451. lv += (lv << 8);
  452. lv += (lv << 16);
  453. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  454. cur_lp[j] = lv;
  455. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  456. break;
  457. default:
  458. return;
  459. }
  460. }
  461. cur_frm_pos += 4;
  462. ref_frm_pos += 4;
  463. }
  464. cur_frm_pos += ((width - blks_width) * 4);
  465. ref_frm_pos += ((width - blks_width) * 4);
  466. }
  467. break;
  468. case 4:
  469. case 3: /********** CASE 3 **********/
  470. if(ref_vectors != NULL)
  471. return;
  472. flag1 = 1;
  473. for( ; blks_height > 0; blks_height -= 8) {
  474. for(lp1 = 0; lp1 < blks_width; lp1++) {
  475. for(lp2 = 0; lp2 < 4; ) {
  476. k = *buf1++;
  477. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  478. ref_lp = ((uint32_t *)cur_frm_pos) + width_tbl[(lp2 * 2) - 1];
  479. switch(correction_type_sp[lp2 & 0x01][k]) {
  480. case 0:
  481. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  482. if(lp2 > 0 || flag1 == 0 || strip->ypos != 0)
  483. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  484. else
  485. cur_lp[0] = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  486. lp2++;
  487. break;
  488. case 1:
  489. res = ((le2me_16(((unsigned short *)ref_lp)[0]) >> 1) + correction_lp[lp2 & 0x01][*buf1]) << 1;
  490. ((unsigned short *)cur_lp)[width_tbl[2]] = le2me_16(res);
  491. res = ((le2me_16(((unsigned short *)ref_lp)[1]) >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  492. ((unsigned short *)cur_lp)[width_tbl[2]+1] = le2me_16(res);
  493. if(lp2 > 0 || flag1 == 0 || strip->ypos != 0)
  494. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  495. else
  496. cur_lp[0] = cur_lp[width_tbl[1]];
  497. buf1++;
  498. lp2++;
  499. break;
  500. case 2:
  501. if(lp2 == 0) {
  502. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  503. cur_lp[j] = *ref_lp;
  504. lp2 += 2;
  505. }
  506. break;
  507. case 3:
  508. if(lp2 < 2) {
  509. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1])
  510. cur_lp[j] = *ref_lp;
  511. lp2 = 3;
  512. }
  513. break;
  514. case 6:
  515. lp2 = 4;
  516. break;
  517. case 7:
  518. if(rle_v3 != 0)
  519. rle_v3 = 0;
  520. else {
  521. buf1--;
  522. rle_v3 = 1;
  523. }
  524. lp2 = 4;
  525. break;
  526. case 8:
  527. if(lp2 == 0) {
  528. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  529. if(rle_v1 == 1) {
  530. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  531. cur_lp[j] = ref_lp[j];
  532. }
  533. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  534. break;
  535. } else {
  536. rle_v2 = (*buf1) - 1;
  537. rle_v1 = 1;
  538. }
  539. case 5:
  540. LP2_CHECK(buf1,rle_v3,lp2)
  541. case 4:
  542. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1])
  543. cur_lp[j] = *ref_lp;
  544. lp2 = 4;
  545. break;
  546. case 9:
  547. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  548. lv1 = *buf1++;
  549. lv = (lv1 & 0x7F) << 1;
  550. lv += (lv << 8);
  551. lv += (lv << 16);
  552. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  553. cur_lp[j] = lv;
  554. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  555. break;
  556. default:
  557. return;
  558. }
  559. }
  560. cur_frm_pos += 4;
  561. }
  562. cur_frm_pos += (((width * 2) - blks_width) * 4);
  563. flag1 = 0;
  564. }
  565. break;
  566. case 10: /********** CASE 10 **********/
  567. if(ref_vectors == NULL) {
  568. flag1 = 1;
  569. for( ; blks_height > 0; blks_height -= 8) {
  570. for(lp1 = 0; lp1 < blks_width; lp1 += 2) {
  571. for(lp2 = 0; lp2 < 4; ) {
  572. k = *buf1++;
  573. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  574. ref_lp = ((uint32_t *)cur_frm_pos) + width_tbl[(lp2 * 2) - 1];
  575. lv1 = ref_lp[0];
  576. lv2 = ref_lp[1];
  577. if(lp2 == 0 && flag1 != 0) {
  578. #ifdef WORDS_BIGENDIAN
  579. lv1 = lv1 & 0xFF00FF00;
  580. lv1 = (lv1 >> 8) | lv1;
  581. lv2 = lv2 & 0xFF00FF00;
  582. lv2 = (lv2 >> 8) | lv2;
  583. #else
  584. lv1 = lv1 & 0x00FF00FF;
  585. lv1 = (lv1 << 8) | lv1;
  586. lv2 = lv2 & 0x00FF00FF;
  587. lv2 = (lv2 << 8) | lv2;
  588. #endif
  589. }
  590. switch(correction_type_sp[lp2 & 0x01][k]) {
  591. case 0:
  592. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(lv1) >> 1) + correctionloworder_lp[lp2 & 0x01][k]) << 1);
  593. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(lv2) >> 1) + correctionhighorder_lp[lp2 & 0x01][k]) << 1);
  594. if(lp2 > 0 || strip->ypos != 0 || flag1 == 0) {
  595. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  596. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  597. } else {
  598. cur_lp[0] = cur_lp[width_tbl[1]];
  599. cur_lp[1] = cur_lp[width_tbl[1]+1];
  600. }
  601. lp2++;
  602. break;
  603. case 1:
  604. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(lv1) >> 1) + correctionloworder_lp[lp2 & 0x01][*buf1]) << 1);
  605. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(lv2) >> 1) + correctionloworder_lp[lp2 & 0x01][k]) << 1);
  606. if(lp2 > 0 || strip->ypos != 0 || flag1 == 0) {
  607. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  608. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  609. } else {
  610. cur_lp[0] = cur_lp[width_tbl[1]];
  611. cur_lp[1] = cur_lp[width_tbl[1]+1];
  612. }
  613. buf1++;
  614. lp2++;
  615. break;
  616. case 2:
  617. if(lp2 == 0) {
  618. if(flag1 != 0) {
  619. for(i = 0, j = width_tbl[1]; i < 3; i++, j += width_tbl[1]) {
  620. cur_lp[j] = lv1;
  621. cur_lp[j+1] = lv2;
  622. }
  623. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  624. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  625. } else {
  626. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1]) {
  627. cur_lp[j] = lv1;
  628. cur_lp[j+1] = lv2;
  629. }
  630. }
  631. lp2 += 2;
  632. }
  633. break;
  634. case 3:
  635. if(lp2 < 2) {
  636. if(lp2 == 0 && flag1 != 0) {
  637. for(i = 0, j = width_tbl[1]; i < 5; i++, j += width_tbl[1]) {
  638. cur_lp[j] = lv1;
  639. cur_lp[j+1] = lv2;
  640. }
  641. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  642. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  643. } else {
  644. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1]) {
  645. cur_lp[j] = lv1;
  646. cur_lp[j+1] = lv2;
  647. }
  648. }
  649. lp2 = 3;
  650. }
  651. break;
  652. case 8:
  653. if(lp2 == 0) {
  654. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  655. if(rle_v1 == 1) {
  656. if(flag1 != 0) {
  657. for(i = 0, j = width_tbl[1]; i < 7; i++, j += width_tbl[1]) {
  658. cur_lp[j] = lv1;
  659. cur_lp[j+1] = lv2;
  660. }
  661. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  662. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  663. } else {
  664. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1]) {
  665. cur_lp[j] = lv1;
  666. cur_lp[j+1] = lv2;
  667. }
  668. }
  669. }
  670. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  671. break;
  672. } else {
  673. rle_v1 = 1;
  674. rle_v2 = (*buf1) - 1;
  675. }
  676. case 5:
  677. LP2_CHECK(buf1,rle_v3,lp2)
  678. case 4:
  679. if(lp2 == 0 && flag1 != 0) {
  680. for(i = 0, j = width_tbl[1]; i < 7; i++, j += width_tbl[1]) {
  681. cur_lp[j] = lv1;
  682. cur_lp[j+1] = lv2;
  683. }
  684. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  685. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  686. } else {
  687. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1]) {
  688. cur_lp[j] = lv1;
  689. cur_lp[j+1] = lv2;
  690. }
  691. }
  692. lp2 = 4;
  693. break;
  694. case 6:
  695. lp2 = 4;
  696. break;
  697. case 7:
  698. if(lp2 == 0) {
  699. if(rle_v3 != 0)
  700. rle_v3 = 0;
  701. else {
  702. buf1--;
  703. rle_v3 = 1;
  704. }
  705. lp2 = 4;
  706. }
  707. break;
  708. case 9:
  709. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  710. lv1 = *buf1;
  711. lv = (lv1 & 0x7F) << 1;
  712. lv += (lv << 8);
  713. lv += (lv << 16);
  714. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  715. cur_lp[j] = lv;
  716. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  717. break;
  718. default:
  719. return;
  720. }
  721. }
  722. cur_frm_pos += 8;
  723. }
  724. cur_frm_pos += (((width * 2) - blks_width) * 4);
  725. flag1 = 0;
  726. }
  727. } else {
  728. for( ; blks_height > 0; blks_height -= 8) {
  729. for(lp1 = 0; lp1 < blks_width; lp1 += 2) {
  730. for(lp2 = 0; lp2 < 4; ) {
  731. k = *buf1++;
  732. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  733. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2 * 2];
  734. switch(correction_type_sp[lp2 & 0x01][k]) {
  735. case 0:
  736. lv1 = correctionloworder_lp[lp2 & 0x01][k];
  737. lv2 = correctionhighorder_lp[lp2 & 0x01][k];
  738. cur_lp[0] = le2me_32(((le2me_32(ref_lp[0]) >> 1) + lv1) << 1);
  739. cur_lp[1] = le2me_32(((le2me_32(ref_lp[1]) >> 1) + lv2) << 1);
  740. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(ref_lp[width_tbl[1]]) >> 1) + lv1) << 1);
  741. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(ref_lp[width_tbl[1]+1]) >> 1) + lv2) << 1);
  742. lp2++;
  743. break;
  744. case 1:
  745. lv1 = correctionloworder_lp[lp2 & 0x01][*buf1++];
  746. lv2 = correctionloworder_lp[lp2 & 0x01][k];
  747. cur_lp[0] = le2me_32(((le2me_32(ref_lp[0]) >> 1) + lv1) << 1);
  748. cur_lp[1] = le2me_32(((le2me_32(ref_lp[1]) >> 1) + lv2) << 1);
  749. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(ref_lp[width_tbl[1]]) >> 1) + lv1) << 1);
  750. cur_lp[width_tbl[1]+1] = le2me_32(((le2me_32(ref_lp[width_tbl[1]+1]) >> 1) + lv2) << 1);
  751. lp2++;
  752. break;
  753. case 2:
  754. if(lp2 == 0) {
  755. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1]) {
  756. cur_lp[j] = ref_lp[j];
  757. cur_lp[j+1] = ref_lp[j+1];
  758. }
  759. lp2 += 2;
  760. }
  761. break;
  762. case 3:
  763. if(lp2 < 2) {
  764. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1]) {
  765. cur_lp[j] = ref_lp[j];
  766. cur_lp[j+1] = ref_lp[j+1];
  767. }
  768. lp2 = 3;
  769. }
  770. break;
  771. case 8:
  772. if(lp2 == 0) {
  773. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  774. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1]) {
  775. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)ref_frm_pos)[j];
  776. ((uint32_t *)cur_frm_pos)[j+1] = ((uint32_t *)ref_frm_pos)[j+1];
  777. }
  778. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  779. break;
  780. } else {
  781. rle_v1 = 1;
  782. rle_v2 = (*buf1) - 1;
  783. }
  784. case 5:
  785. case 7:
  786. LP2_CHECK(buf1,rle_v3,lp2)
  787. case 6:
  788. case 4:
  789. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1]) {
  790. cur_lp[j] = ref_lp[j];
  791. cur_lp[j+1] = ref_lp[j+1];
  792. }
  793. lp2 = 4;
  794. break;
  795. case 9:
  796. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  797. lv1 = *buf1;
  798. lv = (lv1 & 0x7F) << 1;
  799. lv += (lv << 8);
  800. lv += (lv << 16);
  801. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  802. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)cur_frm_pos)[j+1] = lv;
  803. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  804. break;
  805. default:
  806. return;
  807. }
  808. }
  809. cur_frm_pos += 8;
  810. ref_frm_pos += 8;
  811. }
  812. cur_frm_pos += (((width * 2) - blks_width) * 4);
  813. ref_frm_pos += (((width * 2) - blks_width) * 4);
  814. }
  815. }
  816. break;
  817. case 11: /********** CASE 11 **********/
  818. if(ref_vectors == NULL)
  819. return;
  820. for( ; blks_height > 0; blks_height -= 8) {
  821. for(lp1 = 0; lp1 < blks_width; lp1++) {
  822. for(lp2 = 0; lp2 < 4; ) {
  823. k = *buf1++;
  824. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  825. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2 * 2];
  826. switch(correction_type_sp[lp2 & 0x01][k]) {
  827. case 0:
  828. cur_lp[0] = le2me_32(((le2me_32(*ref_lp) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  829. cur_lp[width_tbl[1]] = le2me_32(((le2me_32(ref_lp[width_tbl[1]]) >> 1) + correction_lp[lp2 & 0x01][k]) << 1);
  830. lp2++;
  831. break;
  832. case 1:
  833. lv1 = (unsigned short)(correction_lp[lp2 & 0x01][*buf1++]);
  834. lv2 = (unsigned short)(correction_lp[lp2 & 0x01][k]);
  835. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[0]) >> 1) + lv1) << 1);
  836. ((unsigned short *)cur_lp)[0] = le2me_16(res);
  837. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[1]) >> 1) + lv2) << 1);
  838. ((unsigned short *)cur_lp)[1] = le2me_16(res);
  839. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[width_tbl[2]]) >> 1) + lv1) << 1);
  840. ((unsigned short *)cur_lp)[width_tbl[2]] = le2me_16(res);
  841. res = (unsigned short)(((le2me_16(((unsigned short *)ref_lp)[width_tbl[2]+1]) >> 1) + lv2) << 1);
  842. ((unsigned short *)cur_lp)[width_tbl[2]+1] = le2me_16(res);
  843. lp2++;
  844. break;
  845. case 2:
  846. if(lp2 == 0) {
  847. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  848. cur_lp[j] = ref_lp[j];
  849. lp2 += 2;
  850. }
  851. break;
  852. case 3:
  853. if(lp2 < 2) {
  854. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1])
  855. cur_lp[j] = ref_lp[j];
  856. lp2 = 3;
  857. }
  858. break;
  859. case 8:
  860. if(lp2 == 0) {
  861. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  862. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  863. cur_lp[j] = ref_lp[j];
  864. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  865. break;
  866. } else {
  867. rle_v1 = 1;
  868. rle_v2 = (*buf1) - 1;
  869. }
  870. case 5:
  871. case 7:
  872. LP2_CHECK(buf1,rle_v3,lp2)
  873. case 4:
  874. case 6:
  875. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1])
  876. cur_lp[j] = ref_lp[j];
  877. lp2 = 4;
  878. break;
  879. case 9:
  880. av_log(s->avctx, AV_LOG_ERROR, "UNTESTED.\n");
  881. lv1 = *buf1++;
  882. lv = (lv1 & 0x7F) << 1;
  883. lv += (lv << 8);
  884. lv += (lv << 16);
  885. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  886. cur_lp[j] = lv;
  887. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  888. break;
  889. default:
  890. return;
  891. }
  892. }
  893. cur_frm_pos += 4;
  894. ref_frm_pos += 4;
  895. }
  896. cur_frm_pos += (((width * 2) - blks_width) * 4);
  897. ref_frm_pos += (((width * 2) - blks_width) * 4);
  898. }
  899. break;
  900. default:
  901. return;
  902. }
  903. }
  904. if(strip < strip_tbl)
  905. return;
  906. for( ; strip >= strip_tbl; strip--) {
  907. if(strip->split_flag != 0) {
  908. strip->split_flag = 0;
  909. strip->usl7 = (strip-1)->usl7;
  910. if(strip->split_direction) {
  911. strip->xpos += strip->width;
  912. strip->width = (strip-1)->width - strip->width;
  913. if(region_160_width <= strip->xpos && width < strip->width + strip->xpos)
  914. strip->width = width - strip->xpos;
  915. } else {
  916. strip->ypos += strip->height;
  917. strip->height = (strip-1)->height - strip->height;
  918. }
  919. break;
  920. }
  921. }
  922. }
  923. }
  924. static int indeo3_decode_init(AVCodecContext *avctx)
  925. {
  926. Indeo3DecodeContext *s = avctx->priv_data;
  927. s->avctx = avctx;
  928. s->width = avctx->width;
  929. s->height = avctx->height;
  930. avctx->pix_fmt = PIX_FMT_YUV410P;
  931. avctx->has_b_frames = 0;
  932. build_modpred(s);
  933. iv_alloc_frames(s);
  934. return 0;
  935. }
  936. static int indeo3_decode_frame(AVCodecContext *avctx,
  937. void *data, int *data_size,
  938. unsigned char *buf, int buf_size)
  939. {
  940. Indeo3DecodeContext *s=avctx->priv_data;
  941. unsigned char *src, *dest;
  942. int y;
  943. iv_decode_frame(s, buf, buf_size);
  944. if(s->frame.data[0])
  945. avctx->release_buffer(avctx, &s->frame);
  946. s->frame.reference = 0;
  947. if(avctx->get_buffer(avctx, &s->frame) < 0) {
  948. av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
  949. return -1;
  950. }
  951. src = s->cur_frame->Ybuf;
  952. dest = s->frame.data[0];
  953. for (y = 0; y < s->height; y++) {
  954. memcpy(dest, src, s->cur_frame->y_w);
  955. src += s->cur_frame->y_w;
  956. dest += s->frame.linesize[0];
  957. }
  958. if (!(s->avctx->flags & CODEC_FLAG_GRAY))
  959. {
  960. src = s->cur_frame->Ubuf;
  961. dest = s->frame.data[1];
  962. for (y = 0; y < s->height / 4; y++) {
  963. memcpy(dest, src, s->cur_frame->uv_w);
  964. src += s->cur_frame->uv_w;
  965. dest += s->frame.linesize[1];
  966. }
  967. src = s->cur_frame->Vbuf;
  968. dest = s->frame.data[2];
  969. for (y = 0; y < s->height / 4; y++) {
  970. memcpy(dest, src, s->cur_frame->uv_w);
  971. src += s->cur_frame->uv_w;
  972. dest += s->frame.linesize[2];
  973. }
  974. }
  975. *data_size=sizeof(AVFrame);
  976. *(AVFrame*)data= s->frame;
  977. return buf_size;
  978. }
  979. static int indeo3_decode_end(AVCodecContext *avctx)
  980. {
  981. Indeo3DecodeContext *s = avctx->priv_data;
  982. iv_free_func(s);
  983. return 0;
  984. }
  985. AVCodec indeo3_decoder = {
  986. "indeo3",
  987. CODEC_TYPE_VIDEO,
  988. CODEC_ID_INDEO3,
  989. sizeof(Indeo3DecodeContext),
  990. indeo3_decode_init,
  991. NULL,
  992. indeo3_decode_end,
  993. indeo3_decode_frame,
  994. 0,
  995. NULL
  996. };