You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1121 lines
37KB

  1. /*
  2. * Intel Indeo 3 (IV31, IV32, etc.) video decoder for ffmpeg
  3. * written, produced, and directed by Alan Smithee
  4. *
  5. * This library is free software; you can redistribute it and/or
  6. * modify it under the terms of the GNU Lesser General Public
  7. * License as published by the Free Software Foundation; either
  8. * version 2 of the License, or (at your option) any later version.
  9. *
  10. * This library is distributed in the hope that it will be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  13. * Lesser General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU Lesser General Public
  16. * License along with this library; if not, write to the Free Software
  17. * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  18. */
  19. #include <stdio.h>
  20. #include <stdlib.h>
  21. #include <string.h>
  22. #include <unistd.h>
  23. #include "common.h"
  24. #include "avcodec.h"
  25. #include "dsputil.h"
  26. #include "mpegvideo.h"
  27. #include "indeo3data.h"
  28. typedef struct
  29. {
  30. unsigned char *Ybuf;
  31. unsigned char *Ubuf;
  32. unsigned char *Vbuf;
  33. unsigned char *the_buf;
  34. unsigned int the_buf_size;
  35. unsigned short y_w, y_h;
  36. unsigned short uv_w, uv_h;
  37. } YUVBufs;
  38. typedef struct Indeo3DecodeContext {
  39. AVCodecContext *avctx;
  40. int width, height;
  41. AVFrame frame;
  42. YUVBufs iv_frame[2];
  43. YUVBufs *cur_frame;
  44. YUVBufs *ref_frame;
  45. unsigned char *ModPred;
  46. unsigned short *corrector_type;
  47. } Indeo3DecodeContext;
  48. static int corrector_type_0[24] = {
  49. 195, 159, 133, 115, 101, 93, 87, 77,
  50. 195, 159, 133, 115, 101, 93, 87, 77,
  51. 128, 79, 79, 79, 79, 79, 79, 79
  52. };
  53. static int corrector_type_2[8] = { 9, 7, 6, 8, 5, 4, 3, 2 };
  54. static void build_modpred(Indeo3DecodeContext *s)
  55. {
  56. int i, j;
  57. s->ModPred = (unsigned char *) av_malloc (8 * 128);
  58. for (i=0; i < 128; ++i) {
  59. s->ModPred[i+0*128] = (i > 126) ? 254 : 2*((i + 1) - ((i + 1) % 2));
  60. s->ModPred[i+1*128] = (i == 7) ? 20 : ((i == 119 || i == 120)
  61. ? 236 : 2*((i + 2) - ((i + 1) % 3)));
  62. s->ModPred[i+2*128] = (i > 125) ? 248 : 2*((i + 2) - ((i + 2) % 4));
  63. s->ModPred[i+3*128] = 2*((i + 1) - ((i - 3) % 5));
  64. s->ModPred[i+4*128] = (i == 8) ? 20 : 2*((i + 1) - ((i - 3) % 6));
  65. s->ModPred[i+5*128] = 2*((i + 4) - ((i + 3) % 7));
  66. s->ModPred[i+6*128] = (i > 123) ? 240 : 2*((i + 4) - ((i + 4) % 8));
  67. s->ModPred[i+7*128] = 2*((i + 5) - ((i + 4) % 9));
  68. }
  69. s->corrector_type = (unsigned short *) av_malloc (24 * 256 * sizeof(unsigned short));
  70. for (i=0; i < 24; ++i) {
  71. for (j=0; j < 256; ++j) {
  72. s->corrector_type[i*256+j] = (j < corrector_type_0[i])
  73. ? 1 : ((j < 248 || (i == 16 && j == 248))
  74. ? 0 : corrector_type_2[j - 248]);
  75. }
  76. }
  77. }
  78. static void iv_Decode_Chunk(Indeo3DecodeContext *s, unsigned char *cur,
  79. unsigned char *ref, int width, int height, unsigned char *buf1,
  80. long fflags2, unsigned char *hdr,
  81. unsigned char *buf2, int min_width_160);
  82. #define min(a,b) ((a) < (b) ? (a) : (b))
  83. /* ---------------------------------------------------------------------- */
  84. static void iv_alloc_frames(Indeo3DecodeContext *s)
  85. {
  86. int luma_width, luma_height, luma_pixels, chroma_width, chroma_height,
  87. chroma_pixels, bufsize, i;
  88. luma_width = (s->width + 3) & (~3);
  89. luma_height = (s->height + 3) & (~3);
  90. s->iv_frame[0].y_w = s->iv_frame[0].y_h =
  91. s->iv_frame[0].the_buf_size = 0;
  92. s->iv_frame[1].y_w = s->iv_frame[1].y_h =
  93. s->iv_frame[1].the_buf_size = 0;
  94. s->iv_frame[1].the_buf = NULL;
  95. chroma_width = ((luma_width >> 2) + 3) & (~3);
  96. chroma_height = ((luma_height>> 2) + 3) & (~3);
  97. luma_pixels = luma_width * luma_height;
  98. chroma_pixels = chroma_width * chroma_height;
  99. bufsize = luma_pixels * 2 + luma_width * 3 +
  100. (chroma_pixels + chroma_width) * 4;
  101. if((s->iv_frame[0].the_buf =
  102. (s->iv_frame[0].the_buf_size == 0 ? av_malloc(bufsize) :
  103. av_realloc(s->iv_frame[0].the_buf, bufsize))) == NULL)
  104. return;
  105. s->iv_frame[0].y_w = s->iv_frame[1].y_w = luma_width;
  106. s->iv_frame[0].y_h = s->iv_frame[1].y_h = luma_height;
  107. s->iv_frame[0].uv_w = s->iv_frame[1].uv_w = chroma_width;
  108. s->iv_frame[0].uv_h = s->iv_frame[1].uv_h = chroma_height;
  109. s->iv_frame[0].the_buf_size = bufsize;
  110. s->iv_frame[0].Ybuf = s->iv_frame[0].the_buf + luma_width;
  111. i = luma_pixels + luma_width * 2;
  112. s->iv_frame[1].Ybuf = s->iv_frame[0].the_buf + i;
  113. i += (luma_pixels + luma_width);
  114. s->iv_frame[0].Ubuf = s->iv_frame[0].the_buf + i;
  115. i += (chroma_pixels + chroma_width);
  116. s->iv_frame[1].Ubuf = s->iv_frame[0].the_buf + i;
  117. i += (chroma_pixels + chroma_width);
  118. s->iv_frame[0].Vbuf = s->iv_frame[0].the_buf + i;
  119. i += (chroma_pixels + chroma_width);
  120. s->iv_frame[1].Vbuf = s->iv_frame[0].the_buf + i;
  121. for(i = 1; i <= luma_width; i++)
  122. s->iv_frame[0].Ybuf[-i] = s->iv_frame[1].Ybuf[-i] =
  123. s->iv_frame[0].Ubuf[-i] = 0x80;
  124. for(i = 1; i <= chroma_width; i++) {
  125. s->iv_frame[1].Ubuf[-i] = 0x80;
  126. s->iv_frame[0].Vbuf[-i] = 0x80;
  127. s->iv_frame[1].Vbuf[-i] = 0x80;
  128. s->iv_frame[1].Vbuf[chroma_pixels+i-1] = 0x80;
  129. }
  130. }
  131. /* ---------------------------------------------------------------------- */
  132. static void iv_free_func(Indeo3DecodeContext *s)
  133. {
  134. int i;
  135. for(i = 0 ; i < 2 ; i++) {
  136. if(s->iv_frame[i].the_buf != NULL)
  137. av_free(s->iv_frame[i].the_buf);
  138. s->iv_frame[i].Ybuf = s->iv_frame[i].Ubuf =
  139. s->iv_frame[i].Vbuf = NULL;
  140. s->iv_frame[i].the_buf = NULL;
  141. s->iv_frame[i].the_buf_size = 0;
  142. s->iv_frame[i].y_w = s->iv_frame[i].y_h = 0;
  143. s->iv_frame[i].uv_w = s->iv_frame[i].uv_h = 0;
  144. }
  145. av_free(s->ModPred);
  146. av_free(s->corrector_type);
  147. }
  148. /* ---------------------------------------------------------------------- */
  149. static unsigned long iv_decode_frame(Indeo3DecodeContext *s,
  150. unsigned char *buf, int buf_size)
  151. {
  152. unsigned int hdr_width, hdr_height,
  153. chroma_width, chroma_height;
  154. unsigned long fflags1, fflags2, fflags3, offs1, offs2, offs3, offs;
  155. unsigned char *hdr_pos, *buf_pos;
  156. buf_pos = buf;
  157. buf_pos += 18;
  158. fflags1 = le2me_16(*(uint16_t *)buf_pos);
  159. buf_pos += 2;
  160. fflags3 = le2me_32(*(uint32_t *)buf_pos);
  161. buf_pos += 4;
  162. fflags2 = *buf_pos++;
  163. buf_pos += 3;
  164. hdr_height = le2me_16(*(uint16_t *)buf_pos);
  165. buf_pos += 2;
  166. hdr_width = le2me_16(*(uint16_t *)buf_pos);
  167. buf_pos += 2;
  168. chroma_height = ((hdr_height >> 2) + 3) & 0x7ffc;
  169. chroma_width = ((hdr_width >> 2) + 3) & 0x7ffc;
  170. offs1 = le2me_32(*(uint32_t *)buf_pos);
  171. buf_pos += 4;
  172. offs2 = le2me_32(*(uint32_t *)buf_pos);
  173. buf_pos += 4;
  174. offs3 = le2me_32(*(uint32_t *)buf_pos);
  175. buf_pos += 8;
  176. hdr_pos = buf_pos;
  177. if(fflags3 == 0x80) return 4;
  178. if(fflags1 & 0x200) {
  179. s->cur_frame = s->iv_frame + 1;
  180. s->ref_frame = s->iv_frame;
  181. } else {
  182. s->cur_frame = s->iv_frame;
  183. s->ref_frame = s->iv_frame + 1;
  184. }
  185. buf_pos = buf + 16 + offs1;
  186. offs = le2me_32(*(uint32_t *)buf_pos);
  187. buf_pos += 4;
  188. iv_Decode_Chunk(s, s->cur_frame->Ybuf, s->ref_frame->Ybuf, hdr_width,
  189. hdr_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  190. min(hdr_width, 160));
  191. buf_pos = buf + 16 + offs2;
  192. offs = le2me_32(*(uint32_t *)buf_pos);
  193. buf_pos += 4;
  194. iv_Decode_Chunk(s, s->cur_frame->Vbuf, s->ref_frame->Vbuf, chroma_width,
  195. chroma_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  196. min(chroma_width, 40));
  197. buf_pos = buf + 16 + offs3;
  198. offs = le2me_32(*(uint32_t *)buf_pos);
  199. buf_pos += 4;
  200. iv_Decode_Chunk(s, s->cur_frame->Ubuf, s->ref_frame->Ubuf, chroma_width,
  201. chroma_height, buf_pos + offs * 2, fflags2, hdr_pos, buf_pos,
  202. min(chroma_width, 40));
  203. return 8;
  204. }
  205. typedef struct {
  206. long xpos;
  207. long ypos;
  208. long width;
  209. long height;
  210. long split_flag;
  211. long split_direction;
  212. long usl7;
  213. } ustr_t;
  214. /* ---------------------------------------------------------------------- */
  215. #define LV1_CHECK(buf1,rle_v3,lv1,lp2) \
  216. if((lv1 & 0x80) != 0) { \
  217. if(rle_v3 != 0) \
  218. rle_v3 = 0; \
  219. else { \
  220. rle_v3 = 1; \
  221. buf1 -= 2; \
  222. } \
  223. } \
  224. lp2 = 4;
  225. #define RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3) \
  226. if(rle_v3 == 0) { \
  227. rle_v2 = *buf1; \
  228. rle_v1 = 1; \
  229. if(rle_v2 > 32) { \
  230. rle_v2 -= 32; \
  231. rle_v1 = 0; \
  232. } \
  233. rle_v3 = 1; \
  234. } \
  235. buf1--;
  236. #define LP2_CHECK(buf1,rle_v3,lp2) \
  237. if(lp2 == 0 && rle_v3 != 0) \
  238. rle_v3 = 0; \
  239. else { \
  240. buf1--; \
  241. rle_v3 = 1; \
  242. }
  243. #define RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2) \
  244. rle_v2--; \
  245. if(rle_v2 == 0) { \
  246. rle_v3 = 0; \
  247. buf1 += 2; \
  248. } \
  249. lp2 = 4;
  250. static void iv_Decode_Chunk(Indeo3DecodeContext *s,
  251. unsigned char *cur, unsigned char *ref, int width, int height,
  252. unsigned char *buf1, long fflags2, unsigned char *hdr,
  253. unsigned char *buf2, int min_width_160)
  254. {
  255. unsigned char bit_buf;
  256. unsigned long bit_pos, lv, lv1, lv2;
  257. long *width_tbl, width_tbl_arr[10];
  258. char *ref_vectors;
  259. unsigned char *cur_frm_pos, *ref_frm_pos, *cp, *cp2;
  260. uint32_t *cur_lp, *ref_lp;
  261. const uint32_t *correction_lp[2], *correctionloworder_lp[2], *correctionhighorder_lp[2];
  262. unsigned short *correction_type_sp[2];
  263. ustr_t strip_tbl[20], *strip;
  264. int i, j, k, lp1, lp2, flag1, cmd, blks_width, blks_height, region_160_width,
  265. rle_v1, rle_v2, rle_v3;
  266. bit_buf = 0;
  267. ref_vectors = NULL;
  268. width_tbl = width_tbl_arr + 1;
  269. i = (width < 0 ? width + 3 : width)/4;
  270. for(j = -1; j < 8; j++)
  271. width_tbl[j] = i * j;
  272. strip = strip_tbl;
  273. for(region_160_width = 0; region_160_width < (width - min_width_160); region_160_width += min_width_160);
  274. strip->ypos = strip->xpos = 0;
  275. for(strip->width = min_width_160; width > strip->width; strip->width *= 2);
  276. strip->height = height;
  277. strip->split_direction = 0;
  278. strip->split_flag = 0;
  279. strip->usl7 = 0;
  280. bit_pos = 0;
  281. rle_v1 = rle_v2 = rle_v3 = 0;
  282. while(strip >= strip_tbl) {
  283. if(bit_pos <= 0) {
  284. bit_pos = 8;
  285. bit_buf = *buf1++;
  286. }
  287. bit_pos -= 2;
  288. cmd = (bit_buf >> bit_pos) & 0x03;
  289. if(cmd == 0) {
  290. strip++;
  291. memcpy(strip, strip-1, sizeof(ustr_t));
  292. strip->split_flag = 1;
  293. strip->split_direction = 0;
  294. strip->height = (strip->height > 8 ? ((strip->height+8)>>4)<<3 : 4);
  295. continue;
  296. } else if(cmd == 1) {
  297. strip++;
  298. memcpy(strip, strip-1, sizeof(ustr_t));
  299. strip->split_flag = 1;
  300. strip->split_direction = 1;
  301. strip->width = (strip->width > 8 ? ((strip->width+8)>>4)<<3 : 4);
  302. continue;
  303. } else if(cmd == 2) {
  304. if(strip->usl7 == 0) {
  305. strip->usl7 = 1;
  306. ref_vectors = NULL;
  307. continue;
  308. }
  309. } else if(cmd == 3) {
  310. if(strip->usl7 == 0) {
  311. strip->usl7 = 1;
  312. ref_vectors = buf2 + (*buf1 * 2);
  313. buf1++;
  314. continue;
  315. }
  316. }
  317. cur_frm_pos = cur + width * strip->ypos + strip->xpos;
  318. if((blks_width = strip->width) < 0)
  319. blks_width += 3;
  320. blks_width >>= 2;
  321. blks_height = strip->height;
  322. if(ref_vectors != NULL) {
  323. ref_frm_pos = ref + (ref_vectors[0] + strip->ypos) * width +
  324. ref_vectors[1] + strip->xpos;
  325. } else
  326. ref_frm_pos = cur_frm_pos - width_tbl[4];
  327. if(cmd == 2) {
  328. if(bit_pos <= 0) {
  329. bit_pos = 8;
  330. bit_buf = *buf1++;
  331. }
  332. bit_pos -= 2;
  333. cmd = (bit_buf >> bit_pos) & 0x03;
  334. if(cmd == 0 || ref_vectors != NULL) {
  335. for(lp1 = 0; lp1 < blks_width; lp1++) {
  336. for(i = 0, j = 0; i < blks_height; i++, j += width_tbl[1])
  337. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)ref_frm_pos)[j];
  338. cur_frm_pos += 4;
  339. ref_frm_pos += 4;
  340. }
  341. } else if(cmd != 1)
  342. return;
  343. } else {
  344. k = *buf1 >> 4;
  345. j = *buf1 & 0x0f;
  346. buf1++;
  347. lv = j + fflags2;
  348. if((lv - 8) <= 7 && (k == 0 || k == 3 || k == 10)) {
  349. cp2 = s->ModPred + ((lv - 8) << 7);
  350. cp = ref_frm_pos;
  351. for(i = 0; i < blks_width << 2; i++) {
  352. int v = *cp >> 1;
  353. *(cp++) = cp2[v];
  354. }
  355. }
  356. if(k == 1 || k == 4) {
  357. lv = (hdr[j] & 0xf) + fflags2;
  358. correction_type_sp[0] = s->corrector_type + (lv << 8);
  359. correction_lp[0] = correction + (lv << 8);
  360. lv = (hdr[j] >> 4) + fflags2;
  361. correction_lp[1] = correction + (lv << 8);
  362. correction_type_sp[1] = s->corrector_type + (lv << 8);
  363. } else {
  364. correctionloworder_lp[0] = correctionloworder_lp[1] = correctionloworder + (lv << 8);
  365. correctionhighorder_lp[0] = correctionhighorder_lp[1] = correctionhighorder + (lv << 8);
  366. correction_type_sp[0] = correction_type_sp[1] = s->corrector_type + (lv << 8);
  367. correction_lp[0] = correction_lp[1] = correction + (lv << 8);
  368. }
  369. switch(k) {
  370. case 1:
  371. case 0: /********** CASE 0 **********/
  372. for( ; blks_height > 0; blks_height -= 4) {
  373. for(lp1 = 0; lp1 < blks_width; lp1++) {
  374. for(lp2 = 0; lp2 < 4; ) {
  375. k = *buf1++;
  376. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2];
  377. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2];
  378. switch(correction_type_sp[0][k]) {
  379. case 0:
  380. *cur_lp = ((*ref_lp >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  381. lp2++;
  382. break;
  383. case 1:
  384. ((unsigned short *)cur_lp)[0] = ((((unsigned short *)(ref_lp))[0] >> 1)
  385. + correction_lp[lp2 & 0x01][*buf1++]) << 1;
  386. ((unsigned short *)cur_lp)[1] = ((((unsigned short *)(ref_lp))[1] >> 1)
  387. + correction_lp[lp2 & 0x01][k]) << 1;
  388. lp2++;
  389. break;
  390. case 2:
  391. if(lp2 == 0) {
  392. for(i = 0, j = 0; i < 2; i++, j += width_tbl[1])
  393. cur_lp[j] = ref_lp[j];
  394. lp2 += 2;
  395. }
  396. break;
  397. case 3:
  398. if(lp2 < 2) {
  399. for(i = 0, j = 0; i < (3 - lp2); i++, j += width_tbl[1])
  400. cur_lp[j] = ref_lp[j];
  401. lp2 = 3;
  402. }
  403. break;
  404. case 8:
  405. if(lp2 == 0) {
  406. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  407. if(rle_v1 == 1 || ref_vectors != NULL) {
  408. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  409. cur_lp[j] = ref_lp[j];
  410. }
  411. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  412. break;
  413. } else {
  414. rle_v1 = 1;
  415. rle_v2 = *buf1 - 1;
  416. }
  417. case 5:
  418. LP2_CHECK(buf1,rle_v3,lp2)
  419. case 4:
  420. for(i = 0, j = 0; i < (4 - lp2); i++, j += width_tbl[1])
  421. cur_lp[j] = ref_lp[j];
  422. lp2 = 4;
  423. break;
  424. case 7:
  425. if(rle_v3 != 0)
  426. rle_v3 = 0;
  427. else {
  428. buf1--;
  429. rle_v3 = 1;
  430. }
  431. case 6:
  432. if(ref_vectors != NULL) {
  433. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  434. cur_lp[j] = ref_lp[j];
  435. }
  436. lp2 = 4;
  437. break;
  438. case 9:
  439. lv1 = *buf1++;
  440. lv = (lv1 & 0x7F) << 1;
  441. lv += (lv << 8);
  442. lv += (lv << 16);
  443. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  444. cur_lp[j] = lv;
  445. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  446. break;
  447. default:
  448. return;
  449. }
  450. }
  451. cur_frm_pos += 4;
  452. ref_frm_pos += 4;
  453. }
  454. cur_frm_pos += ((width - blks_width) * 4);
  455. ref_frm_pos += ((width - blks_width) * 4);
  456. }
  457. break;
  458. case 4:
  459. case 3: /********** CASE 3 **********/
  460. if(ref_vectors != NULL)
  461. return;
  462. flag1 = 1;
  463. for( ; blks_height > 0; blks_height -= 8) {
  464. for(lp1 = 0; lp1 < blks_width; lp1++) {
  465. for(lp2 = 0; lp2 < 4; ) {
  466. k = *buf1++;
  467. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  468. ref_lp = ((uint32_t *)cur_frm_pos) + width_tbl[(lp2 * 2) - 1];
  469. switch(correction_type_sp[lp2 & 0x01][k]) {
  470. case 0:
  471. cur_lp[width_tbl[1]] = ((*ref_lp >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  472. if(lp2 > 0 || flag1 == 0 || strip->ypos != 0)
  473. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  474. else
  475. cur_lp[0] = ((*ref_lp >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  476. lp2++;
  477. break;
  478. case 1:
  479. ((unsigned short *)cur_lp)[width_tbl[2]] =
  480. ((((unsigned short *)ref_lp)[0] >> 1) + correction_lp[lp2 & 0x01][*buf1++]) << 1;
  481. ((unsigned short *)cur_lp)[width_tbl[2]+1] =
  482. ((((unsigned short *)ref_lp)[1] >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  483. if(lp2 > 0 || flag1 == 0 || strip->ypos != 0)
  484. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  485. else
  486. cur_lp[0] = cur_lp[width_tbl[1]];
  487. lp2++;
  488. break;
  489. case 2:
  490. if(lp2 == 0) {
  491. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  492. cur_lp[j] = *ref_lp;
  493. lp2 += 2;
  494. }
  495. break;
  496. case 3:
  497. if(lp2 < 2) {
  498. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1])
  499. cur_lp[j] = *ref_lp;
  500. lp2 = 3;
  501. }
  502. break;
  503. case 6:
  504. lp2 = 4;
  505. break;
  506. case 7:
  507. if(rle_v3 != 0)
  508. rle_v3 = 0;
  509. else {
  510. buf1--;
  511. rle_v3 = 1;
  512. }
  513. lp2 = 4;
  514. break;
  515. case 8:
  516. if(lp2 == 0) {
  517. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  518. if(rle_v1 == 1) {
  519. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  520. cur_lp[j] = ref_lp[j];
  521. }
  522. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  523. break;
  524. } else {
  525. rle_v2 = (*buf1) - 1;
  526. rle_v1 = 1;
  527. }
  528. case 5:
  529. LP2_CHECK(buf1,rle_v3,lp2)
  530. case 4:
  531. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1])
  532. cur_lp[j] = *ref_lp;
  533. lp2 = 4;
  534. break;
  535. case 9:
  536. fprintf(stderr, "UNTESTED.\n");
  537. lv1 = *buf1++;
  538. lv = (lv1 & 0x7F) << 1;
  539. lv += (lv << 8);
  540. lv += (lv << 16);
  541. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  542. cur_lp[j] = lv;
  543. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  544. break;
  545. default:
  546. return;
  547. }
  548. }
  549. cur_frm_pos += 4;
  550. }
  551. cur_frm_pos += (((width * 2) - blks_width) * 4);
  552. flag1 = 0;
  553. }
  554. break;
  555. case 10: /********** CASE 10 **********/
  556. if(ref_vectors == NULL) {
  557. flag1 = 1;
  558. for( ; blks_height > 0; blks_height -= 8) {
  559. for(lp1 = 0; lp1 < blks_width; lp1 += 2) {
  560. for(lp2 = 0; lp2 < 4; ) {
  561. k = *buf1++;
  562. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  563. ref_lp = ((uint32_t *)cur_frm_pos) + width_tbl[(lp2 * 2) - 1];
  564. lv1 = ref_lp[0];
  565. lv2 = ref_lp[1];
  566. if(lp2 == 0 && flag1 != 0) {
  567. lv1 = lv1 & 0x00FF00FF;
  568. lv1 = (lv1 << 8) | lv1;
  569. lv2 = lv2 & 0x00FF00FF;
  570. lv2 = (lv2 << 8) | lv2;
  571. }
  572. switch(correction_type_sp[lp2 & 0x01][k]) {
  573. case 0:
  574. cur_lp[width_tbl[1]] = ((lv1 >> 1) + correctionloworder_lp[lp2 & 0x01][k]) << 1;
  575. cur_lp[width_tbl[1]+1] = ((lv2 >> 1) + correctionhighorder_lp[lp2 & 0x01][k]) << 1;
  576. if(lp2 > 0 || strip->ypos != 0 || flag1 == 0) {
  577. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  578. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  579. } else {
  580. cur_lp[0] = cur_lp[width_tbl[1]];
  581. cur_lp[1] = cur_lp[width_tbl[1]+1];
  582. }
  583. lp2++;
  584. break;
  585. case 1:
  586. cur_lp[width_tbl[1]] = ((lv1 >> 1) + correctionloworder_lp[lp2 & 0x01][*buf1++]) << 1;
  587. cur_lp[width_tbl[1]+1] = ((lv2 >> 1) + correctionloworder_lp[lp2 & 0x01][k]) << 1;
  588. if(lp2 > 0 || strip->ypos != 0 || flag1 == 0) {
  589. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  590. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  591. } else {
  592. cur_lp[0] = cur_lp[width_tbl[1]];
  593. cur_lp[1] = cur_lp[width_tbl[1]+1];
  594. }
  595. lp2++;
  596. break;
  597. case 2:
  598. if(lp2 == 0) {
  599. if(flag1 != 0) {
  600. for(i = 0, j = width_tbl[1]; i < 3; i++, j += width_tbl[1]) {
  601. cur_lp[j] = lv1;
  602. cur_lp[j+1] = lv2;
  603. }
  604. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  605. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  606. } else {
  607. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1]) {
  608. cur_lp[j] = lv1;
  609. cur_lp[j+1] = lv2;
  610. }
  611. }
  612. lp2 += 2;
  613. }
  614. break;
  615. case 3:
  616. if(lp2 < 2) {
  617. if(lp2 == 0 && flag1 != 0) {
  618. for(i = 0, j = width_tbl[1]; i < 5; i++, j += width_tbl[1]) {
  619. cur_lp[j] = lv1;
  620. cur_lp[j+1] = lv2;
  621. }
  622. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  623. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  624. } else {
  625. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1]) {
  626. cur_lp[j] = lv1;
  627. cur_lp[j+1] = lv2;
  628. }
  629. }
  630. lp2 = 3;
  631. }
  632. break;
  633. case 8:
  634. if(lp2 == 0) {
  635. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  636. if(rle_v1 == 1) {
  637. if(flag1 != 0) {
  638. for(i = 0, j = width_tbl[1]; i < 7; i++, j += width_tbl[1]) {
  639. cur_lp[j] = lv1;
  640. cur_lp[j+1] = lv2;
  641. }
  642. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  643. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  644. } else {
  645. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1]) {
  646. cur_lp[j] = lv1;
  647. cur_lp[j+1] = lv2;
  648. }
  649. }
  650. }
  651. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  652. break;
  653. } else {
  654. rle_v1 = 1;
  655. rle_v2 = (*buf1) - 1;
  656. }
  657. case 5:
  658. LP2_CHECK(buf1,rle_v3,lp2)
  659. case 4:
  660. if(lp2 == 0 && flag1 != 0) {
  661. for(i = 0, j = width_tbl[1]; i < 7; i++, j += width_tbl[1]) {
  662. cur_lp[j] = lv1;
  663. cur_lp[j+1] = lv2;
  664. }
  665. cur_lp[0] = ((cur_lp[-width_tbl[1]] >> 1) + (cur_lp[width_tbl[1]] >> 1)) & 0xFEFEFEFE;
  666. cur_lp[1] = ((cur_lp[-width_tbl[1]+1] >> 1) + (cur_lp[width_tbl[1]+1] >> 1)) & 0xFEFEFEFE;
  667. } else {
  668. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1]) {
  669. cur_lp[j] = lv1;
  670. cur_lp[j+1] = lv2;
  671. }
  672. }
  673. lp2 = 4;
  674. break;
  675. case 6:
  676. lp2 = 4;
  677. break;
  678. case 7:
  679. if(lp2 == 0) {
  680. if(rle_v3 != 0)
  681. rle_v3 = 0;
  682. else {
  683. buf1--;
  684. rle_v3 = 1;
  685. }
  686. lp2 = 4;
  687. }
  688. break;
  689. case 9:
  690. fprintf(stderr, "UNTESTED.\n");
  691. lv1 = *buf1;
  692. lv = (lv1 & 0x7F) << 1;
  693. lv += (lv << 8);
  694. lv += (lv << 16);
  695. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  696. cur_lp[j] = lv;
  697. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  698. break;
  699. default:
  700. return;
  701. }
  702. }
  703. cur_frm_pos += 8;
  704. }
  705. cur_frm_pos += (((width * 2) - blks_width) * 4);
  706. flag1 = 0;
  707. }
  708. } else {
  709. for( ; blks_height > 0; blks_height -= 8) {
  710. for(lp1 = 0; lp1 < blks_width; lp1 += 2) {
  711. for(lp2 = 0; lp2 < 4; ) {
  712. k = *buf1++;
  713. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  714. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2 * 2];
  715. switch(correction_type_sp[lp2 & 0x01][k]) {
  716. case 0:
  717. lv1 = correctionloworder_lp[lp2 & 0x01][k];
  718. lv2 = correctionhighorder_lp[lp2 & 0x01][k];
  719. cur_lp[0] = ((ref_lp[0] >> 1) + lv1) << 1;
  720. cur_lp[1] = ((ref_lp[1] >> 1) + lv2) << 1;
  721. cur_lp[width_tbl[1]] = ((ref_lp[width_tbl[1]] >> 1) + lv1) << 1;
  722. cur_lp[width_tbl[1]+1] = ((ref_lp[width_tbl[1]+1] >> 1) + lv2) << 1;
  723. lp2++;
  724. break;
  725. case 1:
  726. lv1 = correctionloworder_lp[lp2 & 0x01][*buf1++];
  727. lv2 = correctionloworder_lp[lp2 & 0x01][k];
  728. cur_lp[0] = ((ref_lp[0] >> 1) + lv1) << 1;
  729. cur_lp[1] = ((ref_lp[1] >> 1) + lv2) << 1;
  730. cur_lp[width_tbl[1]] = ((ref_lp[width_tbl[1]] >> 1) + lv1) << 1;
  731. cur_lp[width_tbl[1]+1] = ((ref_lp[width_tbl[1]+1] >> 1) + lv2) << 1;
  732. lp2++;
  733. break;
  734. case 2:
  735. if(lp2 == 0) {
  736. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1]) {
  737. cur_lp[j] = ref_lp[j];
  738. cur_lp[j+1] = ref_lp[j+1];
  739. }
  740. lp2 += 2;
  741. }
  742. break;
  743. case 3:
  744. if(lp2 < 2) {
  745. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1]) {
  746. cur_lp[j] = ref_lp[j];
  747. cur_lp[j+1] = ref_lp[j+1];
  748. }
  749. lp2 = 3;
  750. }
  751. break;
  752. case 8:
  753. if(lp2 == 0) {
  754. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  755. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1]) {
  756. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)ref_frm_pos)[j];
  757. ((uint32_t *)cur_frm_pos)[j+1] = ((uint32_t *)ref_frm_pos)[j+1];
  758. }
  759. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  760. break;
  761. } else {
  762. rle_v1 = 1;
  763. rle_v2 = (*buf1) - 1;
  764. }
  765. case 5:
  766. case 7:
  767. LP2_CHECK(buf1,rle_v3,lp2)
  768. case 6:
  769. case 4:
  770. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1]) {
  771. cur_lp[j] = ref_lp[j];
  772. cur_lp[j+1] = ref_lp[j+1];
  773. }
  774. lp2 = 4;
  775. break;
  776. case 9:
  777. fprintf(stderr, "UNTESTED.\n");
  778. lv1 = *buf1;
  779. lv = (lv1 & 0x7F) << 1;
  780. lv += (lv << 8);
  781. lv += (lv << 16);
  782. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  783. ((uint32_t *)cur_frm_pos)[j] = ((uint32_t *)cur_frm_pos)[j+1] = lv;
  784. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  785. break;
  786. default:
  787. return;
  788. }
  789. }
  790. cur_frm_pos += 8;
  791. ref_frm_pos += 8;
  792. }
  793. cur_frm_pos += (((width * 2) - blks_width) * 4);
  794. ref_frm_pos += (((width * 2) - blks_width) * 4);
  795. }
  796. }
  797. break;
  798. case 11: /********** CASE 11 **********/
  799. if(ref_vectors == NULL)
  800. return;
  801. for( ; blks_height > 0; blks_height -= 8) {
  802. for(lp1 = 0; lp1 < blks_width; lp1++) {
  803. for(lp2 = 0; lp2 < 4; ) {
  804. k = *buf1++;
  805. cur_lp = ((uint32_t *)cur_frm_pos) + width_tbl[lp2 * 2];
  806. ref_lp = ((uint32_t *)ref_frm_pos) + width_tbl[lp2 * 2];
  807. switch(correction_type_sp[lp2 & 0x01][k]) {
  808. case 0:
  809. cur_lp[0] = ((*ref_lp >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  810. cur_lp[width_tbl[1]] = ((ref_lp[width_tbl[1]] >> 1) + correction_lp[lp2 & 0x01][k]) << 1;
  811. lp2++;
  812. break;
  813. case 1:
  814. lv1 = (unsigned short)(correction_lp[lp2 & 0x01][*buf1++]);
  815. lv2 = (unsigned short)(correction_lp[lp2 & 0x01][k]);
  816. ((unsigned short *)cur_lp)[0] = ((((unsigned short *)ref_lp)[0] >> 1) + lv1) << 1;
  817. ((unsigned short *)cur_lp)[1] = ((((unsigned short *)ref_lp)[1] >> 1) + lv2) << 1;
  818. ((unsigned short *)cur_lp)[width_tbl[2]] = ((((unsigned short *)ref_lp)[width_tbl[2]] >> 1) + lv1) << 1;
  819. ((unsigned short *)cur_lp)[width_tbl[2]+1] = ((((unsigned short *)ref_lp)[width_tbl[2]+1] >> 1) + lv2) << 1;
  820. lp2++;
  821. break;
  822. case 2:
  823. if(lp2 == 0) {
  824. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  825. cur_lp[j] = ref_lp[j];
  826. lp2 += 2;
  827. }
  828. break;
  829. case 3:
  830. if(lp2 < 2) {
  831. for(i = 0, j = 0; i < 6 - (lp2 * 2); i++, j += width_tbl[1])
  832. cur_lp[j] = ref_lp[j];
  833. lp2 = 3;
  834. }
  835. break;
  836. case 8:
  837. if(lp2 == 0) {
  838. RLE_V3_CHECK(buf1,rle_v1,rle_v2,rle_v3)
  839. for(i = 0, j = 0; i < 8; i++, j += width_tbl[1])
  840. cur_lp[j] = ref_lp[j];
  841. RLE_V2_CHECK(buf1,rle_v2, rle_v3,lp2)
  842. break;
  843. } else {
  844. rle_v1 = 1;
  845. rle_v2 = (*buf1) - 1;
  846. }
  847. case 5:
  848. case 7:
  849. LP2_CHECK(buf1,rle_v3,lp2)
  850. case 4:
  851. case 6:
  852. for(i = 0, j = 0; i < 8 - (lp2 * 2); i++, j += width_tbl[1])
  853. cur_lp[j] = ref_lp[j];
  854. lp2 = 4;
  855. break;
  856. case 9:
  857. fprintf(stderr, "UNTESTED.\n");
  858. lv1 = *buf1++;
  859. lv = (lv1 & 0x7F) << 1;
  860. lv += (lv << 8);
  861. lv += (lv << 16);
  862. for(i = 0, j = 0; i < 4; i++, j += width_tbl[1])
  863. cur_lp[j] = lv;
  864. LV1_CHECK(buf1,rle_v3,lv1,lp2)
  865. break;
  866. default:
  867. return;
  868. }
  869. }
  870. cur_frm_pos += 4;
  871. ref_frm_pos += 4;
  872. }
  873. cur_frm_pos += (((width * 2) - blks_width) * 4);
  874. ref_frm_pos += (((width * 2) - blks_width) * 4);
  875. }
  876. break;
  877. default:
  878. return;
  879. }
  880. }
  881. if(strip < strip_tbl)
  882. return;
  883. for( ; strip >= strip_tbl; strip--) {
  884. if(strip->split_flag != 0) {
  885. strip->split_flag = 0;
  886. strip->usl7 = (strip-1)->usl7;
  887. if(strip->split_direction) {
  888. strip->xpos += strip->width;
  889. strip->width = (strip-1)->width - strip->width;
  890. if(region_160_width <= strip->xpos && width < strip->width + strip->xpos)
  891. strip->width = width - strip->xpos;
  892. } else {
  893. strip->ypos += strip->height;
  894. strip->height = (strip-1)->height - strip->height;
  895. }
  896. break;
  897. }
  898. }
  899. }
  900. }
  901. static int indeo3_decode_init(AVCodecContext *avctx)
  902. {
  903. Indeo3DecodeContext *s = avctx->priv_data;
  904. s->avctx = avctx;
  905. s->width = avctx->width;
  906. s->height = avctx->height;
  907. avctx->pix_fmt = PIX_FMT_YUV410P;
  908. avctx->has_b_frames = 0;
  909. build_modpred(s);
  910. iv_alloc_frames(s);
  911. return 0;
  912. }
  913. static int indeo3_decode_frame(AVCodecContext *avctx,
  914. void *data, int *data_size,
  915. unsigned char *buf, int buf_size)
  916. {
  917. Indeo3DecodeContext *s=avctx->priv_data;
  918. unsigned char *src, *dest;
  919. int y;
  920. iv_decode_frame(s, buf, buf_size);
  921. if(s->frame.data[0])
  922. avctx->release_buffer(avctx, &s->frame);
  923. s->frame.reference = 0;
  924. if(avctx->get_buffer(avctx, &s->frame) < 0) {
  925. fprintf(stderr, "get_buffer() failed\n");
  926. return -1;
  927. }
  928. src = s->cur_frame->Ybuf;
  929. dest = s->frame.data[0];
  930. for (y = 0; y < s->height; y++) {
  931. memcpy(dest, src, s->cur_frame->y_w);
  932. src += s->cur_frame->y_w;
  933. dest += s->frame.linesize[0];
  934. }
  935. src = s->cur_frame->Ubuf;
  936. dest = s->frame.data[1];
  937. for (y = 0; y < s->height / 4; y++) {
  938. memcpy(dest, src, s->cur_frame->uv_w);
  939. src += s->cur_frame->uv_w;
  940. dest += s->frame.linesize[1];
  941. }
  942. src = s->cur_frame->Vbuf;
  943. dest = s->frame.data[2];
  944. for (y = 0; y < s->height / 4; y++) {
  945. memcpy(dest, src, s->cur_frame->uv_w);
  946. src += s->cur_frame->uv_w;
  947. dest += s->frame.linesize[2];
  948. }
  949. *data_size=sizeof(AVFrame);
  950. *(AVFrame*)data= s->frame;
  951. return buf_size;
  952. }
  953. static int indeo3_decode_end(AVCodecContext *avctx)
  954. {
  955. Indeo3DecodeContext *s = avctx->priv_data;
  956. iv_free_func(s);
  957. return 0;
  958. }
  959. AVCodec indeo3_decoder = {
  960. "indeo3",
  961. CODEC_TYPE_VIDEO,
  962. CODEC_ID_INDEO3,
  963. sizeof(Indeo3DecodeContext),
  964. indeo3_decode_init,
  965. NULL,
  966. indeo3_decode_end,
  967. indeo3_decode_frame,
  968. 0,
  969. NULL
  970. };