You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1290 lines
34KB

  1. /*
  2. * MSMPEG4 backend for ffmpeg encoder and decoder
  3. * Copyright (c) 2001 Gerard Lantau.
  4. *
  5. * This program is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU General Public License as published by
  7. * the Free Software Foundation; either version 2 of the License, or
  8. * (at your option) any later version.
  9. *
  10. * This program is distributed in the hope that it will be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. * GNU General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU General Public License
  16. * along with this program; if not, write to the Free Software
  17. * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  18. */
  19. #include <stdlib.h>
  20. #include <stdio.h>
  21. #include "common.h"
  22. #include "dsputil.h"
  23. #include "mpegvideo.h"
  24. #include "avcodec.h"
  25. /*
  26. * You can also call this codec : MPEG4 with a twist !
  27. *
  28. * TODO:
  29. * - (encoding) select best mv table (two choices)
  30. * - (encoding) select best vlc/dc table
  31. */
  32. //#define DEBUG
  33. /* motion vector table */
  34. typedef struct MVTable {
  35. int n;
  36. const UINT16 *table_mv_code;
  37. const UINT8 *table_mv_bits;
  38. const UINT8 *table_mvx;
  39. const UINT8 *table_mvy;
  40. UINT16 *table_mv_index; /* encoding: convert mv to index in table_mv */
  41. VLC vlc; /* decoding: vlc */
  42. } MVTable;
  43. static UINT32 v2_dc_lum_table[512][2];
  44. static UINT32 v2_dc_chroma_table[512][2];
  45. static void msmpeg4_encode_block(MpegEncContext * s, DCTELEM * block, int n);
  46. static int msmpeg4_decode_block(MpegEncContext * s, DCTELEM * block,
  47. int n, int coded);
  48. static int msmpeg4_decode_dc(MpegEncContext * s, int n, int *dir_ptr);
  49. static int msmpeg4_decode_motion(MpegEncContext * s,
  50. int *mx_ptr, int *my_ptr);
  51. extern UINT32 inverse[256];
  52. #ifdef DEBUG
  53. int intra_count = 0;
  54. int frame_count = 0;
  55. #endif
  56. /* XXX: move it to mpegvideo.h */
  57. static int init_done = 0;
  58. #include "msmpeg4data.h"
  #ifdef STATS

  /* printable name of each of the ST_NB statistics categories */
  const char *st_names[ST_NB] = {
      "unknown",
      "dc",
      "intra_ac",
      "inter_ac",
      "intra_mb",
      "inter_mb",
      "mv",
  };

  /* category selected by the most recent set_stat() */
  int st_current_index = 0;

  /* per-category bit counters for the input and output directions */
  unsigned int st_bit_counts[ST_NB];
  unsigned int st_out_bit_counts[ST_NB];

  #define set_stat(var) st_current_index = var;

  /* Print one table of bit counters: one line per category (size in bytes
   * and share of the total in percent) followed by a "total" line. */
  static void print_stat_counts(const unsigned int *counts)
  {
      unsigned int sum = 0;
      int k;

      for (k = 0; k < ST_NB; k++)
          sum += counts[k];
      /* avoid a division by zero when nothing was counted */
      if (sum == 0)
          sum = 1;

      for (k = 0; k < ST_NB; k++) {
          printf("%-10s : %10.1f %5.1f%%\n",
                 st_names[k],
                 (double)counts[k] / 8.0,
                 (double)counts[k] * 100.0 / sum);
      }
      printf("%-10s : %10.1f %5.1f%%\n",
             "total",
             (double)sum / 8.0,
             100.0);
  }

  /* Dump the input and output bit statistics to stdout. */
  void print_stats(void)
  {
      printf("Input:\n");
      print_stat_counts(st_bit_counts);

      printf("Output:\n");
      print_stat_counts(st_out_bit_counts);
  }

  #else

  /* statistics disabled: set_stat() expands to nothing */
  #define set_stat(var)

  #endif
  113. /* build the table which associate a (x,y) motion vector to a vlc */
  114. static void init_mv_table(MVTable *tab)
  115. {
  116. int i, x, y;
  117. tab->table_mv_index = malloc(sizeof(UINT16) * 4096);
  118. /* mark all entries as not used */
  119. for(i=0;i<4096;i++)
  120. tab->table_mv_index[i] = tab->n;
  121. for(i=0;i<tab->n;i++) {
  122. x = tab->table_mvx[i];
  123. y = tab->table_mvy[i];
  124. tab->table_mv_index[(x << 6) | y] = i;
  125. }
  126. }
  127. static void code012(PutBitContext *pb, int n)
  128. {
  129. if (n == 0) {
  130. put_bits(pb, 1, 0);
  131. } else {
  132. put_bits(pb, 1, 1);
  133. put_bits(pb, 1, (n >= 2));
  134. }
  135. }
  136. /* write MSMPEG4 V3 compatible frame header */
  137. void msmpeg4_encode_picture_header(MpegEncContext * s, int picture_number)
  138. {
  139. int i;
  140. align_put_bits(&s->pb);
  141. put_bits(&s->pb, 2, s->pict_type - 1);
  142. put_bits(&s->pb, 5, s->qscale);
  143. s->rl_table_index = 2;
  144. s->rl_chroma_table_index = 1; /* only for I frame */
  145. s->dc_table_index = 1;
  146. s->mv_table_index = 1; /* only if P frame */
  147. s->use_skip_mb_code = 1; /* only if P frame */
  148. if (s->pict_type == I_TYPE) {
  149. put_bits(&s->pb, 5, 0x17); /* indicate only one "slice" */
  150. code012(&s->pb, s->rl_chroma_table_index);
  151. code012(&s->pb, s->rl_table_index);
  152. put_bits(&s->pb, 1, s->dc_table_index);
  153. s->no_rounding = 1;
  154. } else {
  155. put_bits(&s->pb, 1, s->use_skip_mb_code);
  156. s->rl_chroma_table_index = s->rl_table_index;
  157. code012(&s->pb, s->rl_table_index);
  158. put_bits(&s->pb, 1, s->dc_table_index);
  159. put_bits(&s->pb, 1, s->mv_table_index);
  160. if(s->flipflop_rounding){
  161. s->no_rounding ^= 1;
  162. }else{
  163. s->no_rounding = 0;
  164. }
  165. }
  166. if (!init_done) {
  167. /* init various encoding tables */
  168. init_done = 1;
  169. init_mv_table(&mv_tables[0]);
  170. init_mv_table(&mv_tables[1]);
  171. for(i=0;i<NB_RL_TABLES;i++)
  172. init_rl(&rl_table[i]);
  173. }
  174. #ifdef DEBUG
  175. intra_count = 0;
  176. printf("*****frame %d:\n", frame_count++);
  177. #endif
  178. }
  179. void msmpeg4_encode_ext_header(MpegEncContext * s)
  180. {
  181. s->flipflop_rounding=1;
  182. s->bitrate= 910; // FIXME
  183. put_bits(&s->pb, 5, s->frame_rate / FRAME_RATE_BASE); //yes 29.97 -> 29
  184. put_bits(&s->pb, 11, s->bitrate);
  185. put_bits(&s->pb, 1, s->flipflop_rounding);
  186. }
  187. /* predict coded block */
  188. static inline int coded_block_pred(MpegEncContext * s, int n, UINT8 **coded_block_ptr)
  189. {
  190. int xy, wrap, pred, a, b, c;
  191. xy = s->block_index[n];
  192. wrap = s->block_wrap[0];
  193. /* B C
  194. * A X
  195. */
  196. a = s->coded_block[xy - 1 ];
  197. b = s->coded_block[xy - 1 - wrap];
  198. c = s->coded_block[xy - wrap];
  199. if (b == c) {
  200. pred = a;
  201. } else {
  202. pred = c;
  203. }
  204. /* store value */
  205. *coded_block_ptr = &s->coded_block[xy];
  206. return pred;
  207. }
  208. static void msmpeg4_encode_motion(MpegEncContext * s,
  209. int mx, int my)
  210. {
  211. int code;
  212. MVTable *mv;
  213. /* modulo encoding */
  214. /* WARNING : you cannot reach all the MVs even with the modulo
  215. encoding. This is a somewhat strange compromise they took !!! */
  216. if (mx <= -64)
  217. mx += 64;
  218. else if (mx >= 64)
  219. mx -= 64;
  220. if (my <= -64)
  221. my += 64;
  222. else if (my >= 64)
  223. my -= 64;
  224. mx += 32;
  225. my += 32;
  226. #if 0
  227. if ((unsigned)mx >= 64 ||
  228. (unsigned)my >= 64)
  229. fprintf(stderr, "error mx=%d my=%d\n", mx, my);
  230. #endif
  231. mv = &mv_tables[s->mv_table_index];
  232. code = mv->table_mv_index[(mx << 6) | my];
  233. set_stat(ST_MV);
  234. put_bits(&s->pb,
  235. mv->table_mv_bits[code],
  236. mv->table_mv_code[code]);
  237. if (code == mv->n) {
  238. /* escape : code litterally */
  239. put_bits(&s->pb, 6, mx);
  240. put_bits(&s->pb, 6, my);
  241. }
  242. }
  243. void msmpeg4_encode_mb(MpegEncContext * s,
  244. DCTELEM block[6][64],
  245. int motion_x, int motion_y)
  246. {
  247. int cbp, coded_cbp, i;
  248. int pred_x, pred_y;
  249. UINT8 *coded_block;
  250. if (!s->mb_intra) {
  251. /* compute cbp */
  252. set_stat(ST_INTER_MB);
  253. cbp = 0;
  254. for (i = 0; i < 6; i++) {
  255. if (s->block_last_index[i] >= 0)
  256. cbp |= 1 << (5 - i);
  257. }
  258. if (s->use_skip_mb_code && (cbp | motion_x | motion_y) == 0) {
  259. /* skip macroblock */
  260. put_bits(&s->pb, 1, 1);
  261. return;
  262. }
  263. if (s->use_skip_mb_code)
  264. put_bits(&s->pb, 1, 0); /* mb coded */
  265. put_bits(&s->pb,
  266. table_mb_non_intra[cbp + 64][1],
  267. table_mb_non_intra[cbp + 64][0]);
  268. /* motion vector */
  269. h263_pred_motion(s, 0, &pred_x, &pred_y);
  270. msmpeg4_encode_motion(s, motion_x - pred_x,
  271. motion_y - pred_y);
  272. } else {
  273. /* compute cbp */
  274. cbp = 0;
  275. coded_cbp = 0;
  276. for (i = 0; i < 6; i++) {
  277. int val, pred;
  278. val = (s->block_last_index[i] >= 1);
  279. cbp |= val << (5 - i);
  280. if (i < 4) {
  281. /* predict value for close blocks only for luma */
  282. pred = coded_block_pred(s, i, &coded_block);
  283. *coded_block = val;
  284. val = val ^ pred;
  285. }
  286. coded_cbp |= val << (5 - i);
  287. }
  288. #if 0
  289. if (coded_cbp)
  290. printf("cbp=%x %x\n", cbp, coded_cbp);
  291. #endif
  292. if (s->pict_type == I_TYPE) {
  293. set_stat(ST_INTRA_MB);
  294. put_bits(&s->pb,
  295. table_mb_intra[coded_cbp][1], table_mb_intra[coded_cbp][0]);
  296. } else {
  297. if (s->use_skip_mb_code)
  298. put_bits(&s->pb, 1, 0); /* mb coded */
  299. put_bits(&s->pb,
  300. table_mb_non_intra[cbp][1],
  301. table_mb_non_intra[cbp][0]);
  302. }
  303. set_stat(ST_INTRA_MB);
  304. put_bits(&s->pb, 1, 0); /* no AC prediction yet */
  305. }
  306. for (i = 0; i < 6; i++) {
  307. msmpeg4_encode_block(s, block[i], i);
  308. }
  309. }
  310. /* strongly inspirated from MPEG4, but not exactly the same ! */
  311. void msmpeg4_dc_scale(MpegEncContext * s)
  312. {
  313. if (s->qscale < 5){
  314. s->y_dc_scale = 8;
  315. s->c_dc_scale = 8;
  316. // s->c_dc_scale = (s->qscale + 13)>>1;
  317. }else if (s->qscale < 9){
  318. s->y_dc_scale = 2 * s->qscale;
  319. s->c_dc_scale = (s->qscale + 13)>>1;
  320. }else{
  321. s->y_dc_scale = s->qscale + 8;
  322. s->c_dc_scale = (s->qscale + 13)>>1;
  323. }
  324. // this differs for quant >24 from mpeg4
  325. // if(s->qscale==13) s->c_dc_scale=14;
  326. // if(s->qscale>=6)
  327. // printf("%d", s->qscale);
  328. /* s->c_dc_scale values (found by Michael Nidermayer)
  329. qscale=2 -> 8 (yes iam sure about that)
  330. qscale=3 -> 8
  331. qscale=4 -> 8
  332. qscale=5 -> 9
  333. qscale=6 -> 9
  334. qscale=7 -> 10
  335. qscale=8 -> 10
  336. qscale=9 -> 11
  337. qscale=10-> 11
  338. */
  339. }
  340. /* dir = 0: left, dir = 1: top prediction */
  341. static int msmpeg4_pred_dc(MpegEncContext * s, int n,
  342. INT16 **dc_val_ptr, int *dir_ptr)
  343. {
  344. int a, b, c, wrap, pred, scale;
  345. INT16 *dc_val;
  346. /* find prediction */
  347. if (n < 4) {
  348. scale = s->y_dc_scale;
  349. } else {
  350. scale = s->c_dc_scale;
  351. }
  352. wrap = s->block_wrap[n];
  353. dc_val= s->dc_val[0] + s->block_index[n];
  354. /* B C
  355. * A X
  356. */
  357. a = dc_val[ - 1];
  358. b = dc_val[ - 1 - wrap];
  359. c = dc_val[ - wrap];
  360. /* XXX: the following solution consumes divisions, but it does not
  361. necessitate to modify mpegvideo.c. The problem comes from the
  362. fact they decided to store the quantized DC (which would lead
  363. to problems if Q could vary !) */
  364. #if defined ARCH_X86 && !defined PIC
  365. asm volatile(
  366. "movl %3, %%eax \n\t"
  367. "shrl $1, %%eax \n\t"
  368. "addl %%eax, %2 \n\t"
  369. "addl %%eax, %1 \n\t"
  370. "addl %0, %%eax \n\t"
  371. "mull %4 \n\t"
  372. "movl %%edx, %0 \n\t"
  373. "movl %1, %%eax \n\t"
  374. "mull %4 \n\t"
  375. "movl %%edx, %1 \n\t"
  376. "movl %2, %%eax \n\t"
  377. "mull %4 \n\t"
  378. "movl %%edx, %2 \n\t"
  379. : "+b" (a), "+c" (b), "+D" (c)
  380. : "g" (scale), "S" (inverse[scale])
  381. : "%eax", "%edx"
  382. );
  383. #else
  384. /* #elif defined (ARCH_ALPHA) */
  385. /* Divisions are extremely costly on Alpha; optimize the most
  386. common case. But they are costly everywhere...
  387. */
  388. if (scale == 8) {
  389. a = (a + (8 >> 1)) / 8;
  390. b = (b + (8 >> 1)) / 8;
  391. c = (c + (8 >> 1)) / 8;
  392. } else {
  393. a = (a + (scale >> 1)) / scale;
  394. b = (b + (scale >> 1)) / scale;
  395. c = (c + (scale >> 1)) / scale;
  396. }
  397. #endif
  398. /* XXX: WARNING: they did not choose the same test as MPEG4. This
  399. is very important ! */
  400. if (abs(a - b) <= abs(b - c)) {
  401. pred = c;
  402. *dir_ptr = 1;
  403. } else {
  404. pred = a;
  405. *dir_ptr = 0;
  406. }
  407. /* update predictor */
  408. *dc_val_ptr = &dc_val[0];
  409. return pred;
  410. }
  411. #define DC_MAX 119
  412. static void msmpeg4_encode_dc(MpegEncContext * s, int level, int n, int *dir_ptr)
  413. {
  414. int sign, code;
  415. int pred;
  416. INT16 *dc_val;
  417. pred = msmpeg4_pred_dc(s, n, &dc_val, dir_ptr);
  418. /* update predictor */
  419. if (n < 4) {
  420. *dc_val = level * s->y_dc_scale;
  421. } else {
  422. *dc_val = level * s->c_dc_scale;
  423. }
  424. /* do the prediction */
  425. level -= pred;
  426. sign = 0;
  427. if (level < 0) {
  428. level = -level;
  429. sign = 1;
  430. }
  431. code = level;
  432. if (code > DC_MAX)
  433. code = DC_MAX;
  434. if (s->dc_table_index == 0) {
  435. if (n < 4) {
  436. put_bits(&s->pb, table0_dc_lum[code][1], table0_dc_lum[code][0]);
  437. } else {
  438. put_bits(&s->pb, table0_dc_chroma[code][1], table0_dc_chroma[code][0]);
  439. }
  440. } else {
  441. if (n < 4) {
  442. put_bits(&s->pb, table1_dc_lum[code][1], table1_dc_lum[code][0]);
  443. } else {
  444. put_bits(&s->pb, table1_dc_chroma[code][1], table1_dc_chroma[code][0]);
  445. }
  446. }
  447. if (code == DC_MAX)
  448. put_bits(&s->pb, 8, level);
  449. if (level != 0) {
  450. put_bits(&s->pb, 1, sign);
  451. }
  452. }
  453. /* Encoding of a block. Very similar to MPEG4 except for a different
  454. escape coding (same as H263) and more vlc tables.
  455. */
  456. static void msmpeg4_encode_block(MpegEncContext * s, DCTELEM * block, int n)
  457. {
  458. int level, run, last, i, j, last_index;
  459. int last_non_zero, sign, slevel;
  460. int code, run_diff, dc_pred_dir;
  461. const RLTable *rl;
  462. if (s->mb_intra) {
  463. set_stat(ST_DC);
  464. msmpeg4_encode_dc(s, block[0], n, &dc_pred_dir);
  465. i = 1;
  466. if (n < 4) {
  467. rl = &rl_table[s->rl_table_index];
  468. } else {
  469. rl = &rl_table[3 + s->rl_chroma_table_index];
  470. }
  471. run_diff = 0;
  472. set_stat(ST_INTRA_AC);
  473. } else {
  474. i = 0;
  475. rl = &rl_table[3 + s->rl_table_index];
  476. run_diff = 1;
  477. set_stat(ST_INTER_AC);
  478. }
  479. /* AC coefs */
  480. last_index = s->block_last_index[n];
  481. last_non_zero = i - 1;
  482. for (; i <= last_index; i++) {
  483. j = zigzag_direct[i];
  484. level = block[j];
  485. if (level) {
  486. run = i - last_non_zero - 1;
  487. last = (i == last_index);
  488. sign = 0;
  489. slevel = level;
  490. if (level < 0) {
  491. sign = 1;
  492. level = -level;
  493. }
  494. code = get_rl_index(rl, last, run, level);
  495. put_bits(&s->pb, rl->table_vlc[code][1], rl->table_vlc[code][0]);
  496. if (code == rl->n) {
  497. int level1, run1;
  498. level1 = level - rl->max_level[last][run];
  499. if (level1 < 1)
  500. goto esc2;
  501. code = get_rl_index(rl, last, run, level1);
  502. if (code == rl->n) {
  503. esc2:
  504. put_bits(&s->pb, 1, 0);
  505. if (level > MAX_LEVEL)
  506. goto esc3;
  507. run1 = run - rl->max_run[last][level] - run_diff;
  508. if (run1 < 0)
  509. goto esc3;
  510. code = get_rl_index(rl, last, run1, level);
  511. if (code == rl->n) {
  512. esc3:
  513. /* third escape */
  514. put_bits(&s->pb, 1, 0);
  515. put_bits(&s->pb, 1, last);
  516. put_bits(&s->pb, 6, run);
  517. put_bits(&s->pb, 8, slevel & 0xff);
  518. } else {
  519. /* second escape */
  520. put_bits(&s->pb, 1, 1);
  521. put_bits(&s->pb, rl->table_vlc[code][1], rl->table_vlc[code][0]);
  522. put_bits(&s->pb, 1, sign);
  523. }
  524. } else {
  525. /* first escape */
  526. put_bits(&s->pb, 1, 1);
  527. put_bits(&s->pb, rl->table_vlc[code][1], rl->table_vlc[code][0]);
  528. put_bits(&s->pb, 1, sign);
  529. }
  530. } else {
  531. put_bits(&s->pb, 1, sign);
  532. }
  533. last_non_zero = i;
  534. }
  535. }
  536. }
  537. /****************************************/
  538. /* decoding stuff */
  539. static VLC mb_non_intra_vlc;
  540. static VLC mb_intra_vlc;
  541. static VLC dc_lum_vlc[2];
  542. static VLC dc_chroma_vlc[2];
  543. static VLC v2_dc_lum_vlc;
  544. static VLC v2_dc_chroma_vlc;
  545. static VLC cbpy_vlc;
  546. static VLC v2_intra_cbpc_vlc;
  547. static VLC v2_mb_type_vlc;
  548. static VLC v2_mv_vlc;
  549. /* this table is practically identical to the one from h263 except that its inverted */
  550. static void init_h263_dc_for_msmpeg4()
  551. {
  552. static int inited=0;
  553. if(!inited){
  554. int level, uni_code, uni_len;
  555. inited=1;
  556. for(level=-255; level<256; level++){
  557. int size, v, l;
  558. /* find number of bits */
  559. size = 0;
  560. v = abs(level);
  561. while (v) {
  562. v >>= 1;
  563. size++;
  564. }
  565. if (level < 0)
  566. l= (-level) ^ ((1 << size) - 1);
  567. else
  568. l= level;
  569. /* luminance h263 */
  570. uni_code= DCtab_lum[size][0];
  571. uni_len = DCtab_lum[size][1];
  572. uni_code ^= (1<<uni_len)-1; //M$ doesnt like compatibility
  573. if (size > 0) {
  574. uni_code<<=size; uni_code|=l;
  575. uni_len+=size;
  576. if (size > 8){
  577. uni_code<<=1; uni_code|=1;
  578. uni_len++;
  579. }
  580. }
  581. v2_dc_lum_table[level+256][0]= uni_code;
  582. v2_dc_lum_table[level+256][1]= uni_len;
  583. /* chrominance h263 */
  584. uni_code= DCtab_chrom[size][0];
  585. uni_len = DCtab_chrom[size][1];
  586. uni_code ^= (1<<uni_len)-1; //M$ doesnt like compatibility
  587. if (size > 0) {
  588. uni_code<<=size; uni_code|=l;
  589. uni_len+=size;
  590. if (size > 8){
  591. uni_code<<=1; uni_code|=1;
  592. uni_len++;
  593. }
  594. }
  595. v2_dc_chroma_table[level+256][0]= uni_code;
  596. v2_dc_chroma_table[level+256][1]= uni_len;
  597. }
  598. }
  599. }
  600. /* init all vlc decoding tables */
  601. int msmpeg4_decode_init_vlc(MpegEncContext *s)
  602. {
  603. int i;
  604. MVTable *mv;
  605. for(i=0;i<NB_RL_TABLES;i++) {
  606. init_rl(&rl_table[i]);
  607. init_vlc_rl(&rl_table[i]);
  608. }
  609. for(i=0;i<2;i++) {
  610. mv = &mv_tables[i];
  611. init_vlc(&mv->vlc, 9, mv->n + 1,
  612. mv->table_mv_bits, 1, 1,
  613. mv->table_mv_code, 2, 2);
  614. }
  615. init_vlc(&dc_lum_vlc[0], 9, 120,
  616. &table0_dc_lum[0][1], 8, 4,
  617. &table0_dc_lum[0][0], 8, 4);
  618. init_vlc(&dc_chroma_vlc[0], 9, 120,
  619. &table0_dc_chroma[0][1], 8, 4,
  620. &table0_dc_chroma[0][0], 8, 4);
  621. init_vlc(&dc_lum_vlc[1], 9, 120,
  622. &table1_dc_lum[0][1], 8, 4,
  623. &table1_dc_lum[0][0], 8, 4);
  624. init_vlc(&dc_chroma_vlc[1], 9, 120,
  625. &table1_dc_chroma[0][1], 8, 4,
  626. &table1_dc_chroma[0][0], 8, 4);
  627. init_h263_dc_for_msmpeg4();
  628. init_vlc(&v2_dc_lum_vlc, 9, 512,
  629. &v2_dc_lum_table[0][1], 8, 4,
  630. &v2_dc_lum_table[0][0], 8, 4);
  631. init_vlc(&v2_dc_chroma_vlc, 9, 512,
  632. &v2_dc_chroma_table[0][1], 8, 4,
  633. &v2_dc_chroma_table[0][0], 8, 4);
  634. init_vlc(&cbpy_vlc, 6, 16,
  635. &cbpy_tab[0][1], 2, 1,
  636. &cbpy_tab[0][0], 2, 1);
  637. init_vlc(&v2_intra_cbpc_vlc, 3, 4,
  638. &v2_intra_cbpc[0][1], 2, 1,
  639. &v2_intra_cbpc[0][0], 2, 1);
  640. init_vlc(&v2_mb_type_vlc, 5, 8,
  641. &v2_mb_type[0][1], 2, 1,
  642. &v2_mb_type[0][0], 2, 1);
  643. init_vlc(&v2_mv_vlc, 9, 33,
  644. &mvtab[0][1], 2, 1,
  645. &mvtab[0][0], 2, 1);
  646. init_vlc(&mb_non_intra_vlc, 9, 128,
  647. &table_mb_non_intra[0][1], 8, 4,
  648. &table_mb_non_intra[0][0], 8, 4);
  649. init_vlc(&mb_intra_vlc, 9, 64,
  650. &table_mb_intra[0][1], 4, 2,
  651. &table_mb_intra[0][0], 4, 2);
  652. return 0;
  653. }
  654. static int decode012(GetBitContext *gb)
  655. {
  656. int n;
  657. n = get_bits1(gb);
  658. if (n == 0)
  659. return 0;
  660. else
  661. return get_bits1(gb) + 1;
  662. }
  663. int msmpeg4_decode_picture_header(MpegEncContext * s)
  664. {
  665. int code;
  666. s->pict_type = get_bits(&s->gb, 2) + 1;
  667. if (s->pict_type != I_TYPE &&
  668. s->pict_type != P_TYPE)
  669. return -1;
  670. s->qscale = get_bits(&s->gb, 5);
  671. if (s->pict_type == I_TYPE) {
  672. code = get_bits(&s->gb, 5);
  673. /* 0x17: one slice, 0x18: two slices */
  674. if (code < 0x17)
  675. return -1;
  676. s->slice_height = s->mb_height / (code - 0x16);
  677. if(s->msmpeg4_version==2){
  678. s->rl_chroma_table_index = 2;
  679. s->rl_table_index = 2;
  680. s->dc_table_index = 0; //not used
  681. }else{
  682. s->rl_chroma_table_index = decode012(&s->gb);
  683. s->rl_table_index = decode012(&s->gb);
  684. s->dc_table_index = get_bits1(&s->gb);
  685. }
  686. s->no_rounding = 1;
  687. /* printf(" %d %d %d %d \n",
  688. s->qscale,
  689. s->rl_chroma_table_index,
  690. s->rl_table_index,
  691. s->dc_table_index);*/
  692. } else {
  693. s->use_skip_mb_code = get_bits1(&s->gb);
  694. if(s->msmpeg4_version==2){
  695. s->rl_table_index = 2;
  696. s->rl_chroma_table_index = s->rl_table_index;
  697. s->dc_table_index = 0; //not used
  698. s->mv_table_index = 0;
  699. }else{
  700. s->rl_table_index = decode012(&s->gb);
  701. s->rl_chroma_table_index = s->rl_table_index;
  702. s->dc_table_index = get_bits1(&s->gb);
  703. s->mv_table_index = get_bits1(&s->gb);
  704. }
  705. /* printf(" %d %d %d %d %d \n",
  706. s->use_skip_mb_code,
  707. s->rl_table_index,
  708. s->rl_chroma_table_index,
  709. s->dc_table_index,
  710. s->mv_table_index);*/
  711. if(s->flipflop_rounding){
  712. s->no_rounding ^= 1;
  713. }else{
  714. s->no_rounding = 0;
  715. }
  716. // printf("%d", s->no_rounding);
  717. }
  718. #if 0
  719. if(s->msmpeg4_version==2)
  720. {
  721. int i;
  722. printf("%s q:%d s:%X ", s->pict_type == I_TYPE ? "I" : "P" , s->qscale,
  723. s->pict_type == I_TYPE ? code : s->use_skip_mb_code);
  724. for(i=0; i<s->gb.size*8; i++)
  725. // printf("%d", get_bits1(&s->gb));
  726. get_bits1(&s->gb);
  727. printf("END\n");
  728. return -1;
  729. }
  730. #endif
  731. #ifdef DEBUG
  732. printf("*****frame %d:\n", frame_count++);
  733. #endif
  734. return 0;
  735. }
  736. int msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size)
  737. {
  738. /* the alt_bitstream reader could read over the end so we need to check it */
  739. if(get_bits_count(&s->gb) + 16 < buf_size*8)
  740. {
  741. int fps;
  742. fps= get_bits(&s->gb, 5);
  743. s->bitrate= get_bits(&s->gb, 11);
  744. s->flipflop_rounding= get_bits1(&s->gb);
  745. // printf("fps:%2d bps:%2d roundingType:%1d\n", fps, s->bitrate, s->flipflop_rounding);
  746. }
  747. else
  748. {
  749. s->flipflop_rounding= 0;
  750. s->bitrate= 0;
  751. }
  752. return 0;
  753. }
  /* Store val into the first n elements of tab (nothing is written when
   * n is zero or negative). */
  static inline void memsetw(short *tab, int val, int n)
  {
      short *dst = tab;

      while (n > 0) {
          *dst++ = val;
          n--;
      }
  }
  760. /* this is identical to h263 except that its range is multiplied by 2 */
  761. static int msmpeg4v2_decode_motion(MpegEncContext * s, int pred, int f_code)
  762. {
  763. int code, val, sign, shift;
  764. code = get_vlc(&s->gb, &v2_mv_vlc);
  765. if (code < 0)
  766. return 0xffff;
  767. if (code == 0)
  768. return pred;
  769. sign = get_bits1(&s->gb);
  770. shift = f_code - 1;
  771. val = (code - 1) << shift;
  772. if (shift > 0)
  773. val |= get_bits(&s->gb, shift);
  774. val++;
  775. if (sign)
  776. val = -val;
  777. val += pred;
  778. if (val <= -64)
  779. val += 64;
  780. else if (val >= 64)
  781. val -= 64;
  782. return val;
  783. }
  784. int msmpeg4v2_decode_mb(MpegEncContext *s,
  785. DCTELEM block[6][64])
  786. {
  787. int cbp, code, i;
  788. //printf("M");
  789. //fflush(stderr); fflush(stdout);
  790. if (s->pict_type == P_TYPE) {
  791. if (s->use_skip_mb_code) {
  792. if (get_bits1(&s->gb)) {
  793. /* skip mb */
  794. s->mb_intra = 0;
  795. for(i=0;i<6;i++)
  796. s->block_last_index[i] = -1;
  797. s->mv_dir = MV_DIR_FORWARD;
  798. s->mv_type = MV_TYPE_16X16;
  799. s->mv[0][0][0] = 0;
  800. s->mv[0][0][1] = 0;
  801. s->mb_skiped = 1;
  802. return 0;
  803. }
  804. }
  805. code = get_vlc(&s->gb, &v2_mb_type_vlc);
  806. s->mb_intra = code >>2;
  807. cbp = code & 0x3;
  808. } else {
  809. s->mb_intra = 1;
  810. //printf("%X ", show_bits(&s->gb, 24));
  811. cbp= get_vlc(&s->gb, &v2_intra_cbpc_vlc);
  812. //printf("%X ", show_bits(&s->gb, 24));
  813. //printf("CBP: %X ",cbp);
  814. }
  815. if (!s->mb_intra) {
  816. int mx, my;
  817. cbp|= get_vlc(&s->gb, &cbpy_vlc)<<2;
  818. if((cbp&3) != 3) cbp^= 0x3C;
  819. h263_pred_motion(s, 0, &mx, &my);
  820. mx= msmpeg4v2_decode_motion(s, mx, 1);
  821. my= msmpeg4v2_decode_motion(s, my, 1);
  822. s->mv_dir = MV_DIR_FORWARD;
  823. s->mv_type = MV_TYPE_16X16;
  824. s->mv[0][0][0] = mx;
  825. s->mv[0][0][1] = my;
  826. } else {
  827. //if(s->pict_type == P_TYPE) printf("intra cbp: %X", cbp);
  828. s->ac_pred = get_bits1(&s->gb);
  829. //printf("AC: %d ",s->ac_pred);
  830. cbp|= get_vlc(&s->gb, &cbpy_vlc)<<2;
  831. //printf("cbp: %X ",cbp);
  832. }
  833. for (i = 0; i < 6; i++) {
  834. if (msmpeg4_decode_block(s, block[i], i, (cbp >> (5 - i)) & 1) < 0)
  835. {
  836. //fflush(stderr); fflush(stdout);
  837. fprintf(stderr,"\nIgnoring error while decoding block: %d x %d (%d)\n", s->mb_x, s->mb_y, i);
  838. return -1;
  839. }
  840. }
  841. return 0;
  842. }
  843. int msmpeg4_decode_mb(MpegEncContext *s,
  844. DCTELEM block[6][64])
  845. {
  846. int cbp, code, i;
  847. UINT8 *coded_val;
  848. /* special slice handling */
  849. if (s->mb_x == 0) {
  850. if (s->slice_height && (s->mb_y % s->slice_height) == 0) {
  851. int wrap;
  852. /* reset DC pred (set previous line to 1024) */
  853. wrap = 2 * s->mb_width + 2;
  854. memsetw(&s->dc_val[0][(1) + (2 * s->mb_y) * wrap],
  855. 1024, 2 * s->mb_width);
  856. wrap = s->mb_width + 2;
  857. memsetw(&s->dc_val[1][(1) + (s->mb_y) * wrap],
  858. 1024, s->mb_width);
  859. memsetw(&s->dc_val[2][(1) + (s->mb_y) * wrap],
  860. 1024, s->mb_width);
  861. /* reset AC pred (set previous line to 0) */
  862. wrap = s->mb_width * 2 + 2;
  863. memsetw(s->ac_val[0][0] + (1 + (2 * s->mb_y) * wrap)*16,
  864. 0, 2 * s->mb_width*16);
  865. wrap = s->mb_width + 2;
  866. memsetw(s->ac_val[1][0] + (1 + (s->mb_y) * wrap)*16,
  867. 0, s->mb_width*16);
  868. memsetw(s->ac_val[2][0] + (1 + (s->mb_y) * wrap)*16,
  869. 0, s->mb_width*16);
  870. s->first_slice_line = 1;
  871. } else {
  872. s->first_slice_line = 0;
  873. }
  874. }
  875. if(s->msmpeg4_version==2) return msmpeg4v2_decode_mb(s, block); //FIXME merge if possible
  876. if (s->pict_type == P_TYPE) {
  877. set_stat(ST_INTER_MB);
  878. if (s->use_skip_mb_code) {
  879. if (get_bits1(&s->gb)) {
  880. /* skip mb */
  881. s->mb_intra = 0;
  882. for(i=0;i<6;i++)
  883. s->block_last_index[i] = -1;
  884. s->mv_dir = MV_DIR_FORWARD;
  885. s->mv_type = MV_TYPE_16X16;
  886. s->mv[0][0][0] = 0;
  887. s->mv[0][0][1] = 0;
  888. s->mb_skiped = 1;
  889. return 0;
  890. }
  891. }
  892. code = get_vlc(&s->gb, &mb_non_intra_vlc);
  893. if (code < 0)
  894. return -1;
  895. //s->mb_intra = (code & 0x40) ? 0 : 1;
  896. s->mb_intra = (~code & 0x40) >> 6;
  897. cbp = code & 0x3f;
  898. } else {
  899. set_stat(ST_INTRA_MB);
  900. s->mb_intra = 1;
  901. code = get_vlc(&s->gb, &mb_intra_vlc);
  902. if (code < 0)
  903. return -1;
  904. /* predict coded block pattern */
  905. cbp = 0;
  906. for(i=0;i<6;i++) {
  907. int val = ((code >> (5 - i)) & 1);
  908. if (i < 4) {
  909. int pred = coded_block_pred(s, i, &coded_val);
  910. val = val ^ pred;
  911. *coded_val = val;
  912. }
  913. cbp |= val << (5 - i);
  914. }
  915. }
  916. if (!s->mb_intra) {
  917. int mx, my;
  918. set_stat(ST_MV);
  919. h263_pred_motion(s, 0, &mx, &my);
  920. if (msmpeg4_decode_motion(s, &mx, &my) < 0)
  921. return -1;
  922. s->mv_dir = MV_DIR_FORWARD;
  923. s->mv_type = MV_TYPE_16X16;
  924. s->mv[0][0][0] = mx;
  925. s->mv[0][0][1] = my;
  926. } else {
  927. set_stat(ST_INTRA_MB);
  928. s->ac_pred = get_bits1(&s->gb);
  929. }
  930. for (i = 0; i < 6; i++) {
  931. if (msmpeg4_decode_block(s, block[i], i, (cbp >> (5 - i)) & 1) < 0)
  932. {
  933. fprintf(stderr,"\nIgnoring error while decoding block: %d x %d (%d)\n", s->mb_x, s->mb_y, i);
  934. // return -1;
  935. }
  936. }
  937. return 0;
  938. }
  939. static int msmpeg4_decode_block(MpegEncContext * s, DCTELEM * block,
  940. int n, int coded)
  941. {
  942. int code, level, i, j, last, run, run_diff;
  943. int dc_pred_dir;
  944. RLTable *rl;
  945. const UINT8 *scan_table;
  946. int qmul, qadd;
  947. if (s->mb_intra) {
  948. qmul=1;
  949. qadd=0;
  950. /* DC coef */
  951. set_stat(ST_DC);
  952. level = msmpeg4_decode_dc(s, n, &dc_pred_dir);
  953. if (level < 0)
  954. return -1;
  955. block[0] = level;
  956. if (n < 4) {
  957. rl = &rl_table[s->rl_table_index];
  958. } else {
  959. rl = &rl_table[3 + s->rl_chroma_table_index];
  960. }
  961. run_diff = 0;
  962. i = 1;
  963. if (!coded) {
  964. goto not_coded;
  965. }
  966. if (s->ac_pred) {
  967. if (dc_pred_dir == 0)
  968. scan_table = ff_alternate_vertical_scan; /* left */
  969. else
  970. scan_table = ff_alternate_horizontal_scan; /* top */
  971. } else {
  972. scan_table = zigzag_direct;
  973. }
  974. set_stat(ST_INTRA_AC);
  975. } else {
  976. qmul = s->qscale << 1;
  977. qadd = (s->qscale - 1) | 1;
  978. i = 0;
  979. rl = &rl_table[3 + s->rl_table_index];
  980. if(s->msmpeg4_version==2)
  981. run_diff = 0;
  982. else
  983. run_diff = 1;
  984. if (!coded) {
  985. s->block_last_index[n] = i - 1;
  986. return 0;
  987. }
  988. scan_table = zigzag_direct;
  989. set_stat(ST_INTER_AC);
  990. }
  991. for(;;) {
  992. code = get_vlc(&s->gb, &rl->vlc);
  993. if (code < 0)
  994. return -1;
  995. if (code == rl->n) {
  996. /* escape */
  997. if (get_bits1(&s->gb) == 0) {
  998. if (get_bits1(&s->gb) == 0) {
  999. /* third escape */
  1000. last = get_bits1(&s->gb);
  1001. run = get_bits(&s->gb, 6);
  1002. level = get_bits(&s->gb, 8);
  1003. level = (level << 24) >> 24; /* sign extend */
  1004. //level = level * qmul + (level>0) * qadd - (level<=0) * qadd ;
  1005. if (level>0) level= level * qmul + qadd;
  1006. else level= level * qmul - qadd;
  1007. } else {
  1008. /* second escape */
  1009. code = get_vlc(&s->gb, &rl->vlc);
  1010. if (code < 0 || code >= rl->n)
  1011. return -1;
  1012. run = rl->table_run[code];
  1013. level = rl->table_level[code];
  1014. last = code >= rl->last;
  1015. run += rl->max_run[last][level] + run_diff;
  1016. level= level * qmul + qadd;
  1017. if (get_bits1(&s->gb))
  1018. level = -level;
  1019. }
  1020. } else {
  1021. /* first escape */
  1022. code = get_vlc(&s->gb, &rl->vlc);
  1023. if (code < 0 || code >= rl->n)
  1024. return -1;
  1025. run = rl->table_run[code];
  1026. level = rl->table_level[code];
  1027. last = code >= rl->last;
  1028. level += rl->max_level[last][run];
  1029. level= level * qmul + qadd;
  1030. if (get_bits1(&s->gb))
  1031. level = -level;
  1032. }
  1033. } else {
  1034. run = rl->table_run[code];
  1035. level = rl->table_level[code] * qmul + qadd;
  1036. last = code >= rl->last;
  1037. if (get_bits1(&s->gb))
  1038. level = -level;
  1039. }
  1040. i += run;
  1041. if (i >= 64)
  1042. return -1;
  1043. j = scan_table[i];
  1044. block[j] = level;
  1045. i++;
  1046. if (last)
  1047. break;
  1048. }
  1049. not_coded:
  1050. if (s->mb_intra) {
  1051. mpeg4_pred_ac(s, block, n, dc_pred_dir);
  1052. if (s->ac_pred) {
  1053. i = 64; /* XXX: not optimal */
  1054. }
  1055. }
  1056. s->block_last_index[n] = i - 1;
  1057. return 0;
  1058. }
  1059. static int msmpeg4_decode_dc(MpegEncContext * s, int n, int *dir_ptr)
  1060. {
  1061. int level, pred;
  1062. INT16 *dc_val;
  1063. if(s->msmpeg4_version==2){
  1064. if (n < 4) {
  1065. level = get_vlc(&s->gb, &v2_dc_lum_vlc);
  1066. } else {
  1067. level = get_vlc(&s->gb, &v2_dc_chroma_vlc);
  1068. }
  1069. if (level < 0)
  1070. return -1;
  1071. level-=256;
  1072. }else{ //FIXME optimize use unified tables & index
  1073. if (n < 4) {
  1074. level = get_vlc(&s->gb, &dc_lum_vlc[s->dc_table_index]);
  1075. } else {
  1076. level = get_vlc(&s->gb, &dc_chroma_vlc[s->dc_table_index]);
  1077. }
  1078. if (level < 0)
  1079. return -1;
  1080. if (level == DC_MAX) {
  1081. level = get_bits(&s->gb, 8);
  1082. if (get_bits1(&s->gb))
  1083. level = -level;
  1084. } else if (level != 0) {
  1085. if (get_bits1(&s->gb))
  1086. level = -level;
  1087. }
  1088. }
  1089. pred = msmpeg4_pred_dc(s, n, &dc_val, dir_ptr);
  1090. level += pred;
  1091. /* update predictor */
  1092. if (n < 4) {
  1093. *dc_val = level * s->y_dc_scale;
  1094. } else {
  1095. *dc_val = level * s->c_dc_scale;
  1096. }
  1097. return level;
  1098. }
  1099. static int msmpeg4_decode_motion(MpegEncContext * s,
  1100. int *mx_ptr, int *my_ptr)
  1101. {
  1102. MVTable *mv;
  1103. int code, mx, my;
  1104. mv = &mv_tables[s->mv_table_index];
  1105. code = get_vlc(&s->gb, &mv->vlc);
  1106. if (code < 0)
  1107. return -1;
  1108. if (code == mv->n) {
  1109. mx = get_bits(&s->gb, 6);
  1110. my = get_bits(&s->gb, 6);
  1111. } else {
  1112. mx = mv->table_mvx[code];
  1113. my = mv->table_mvy[code];
  1114. }
  1115. mx += *mx_ptr - 32;
  1116. my += *my_ptr - 32;
  1117. /* WARNING : they do not do exactly modulo encoding */
  1118. if (mx <= -64)
  1119. mx += 64;
  1120. else if (mx >= 64)
  1121. mx -= 64;
  1122. if (my <= -64)
  1123. my += 64;
  1124. else if (my >= 64)
  1125. my -= 64;
  1126. *mx_ptr = mx;
  1127. *my_ptr = my;
  1128. return 0;
  1129. }