You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

595 lines
23KB

  1. /*
  2. * Copyright (c) 2013
  3. * MIPS Technologies, Inc., California.
  4. *
  5. * Redistribution and use in source and binary forms, with or without
  6. * modification, are permitted provided that the following conditions
  7. * are met:
  8. * 1. Redistributions of source code must retain the above copyright
  9. * notice, this list of conditions and the following disclaimer.
  10. * 2. Redistributions in binary form must reproduce the above copyright
  11. * notice, this list of conditions and the following disclaimer in the
  12. * documentation and/or other materials provided with the distribution.
  13. * 3. Neither the name of the MIPS Technologies, Inc., nor the names of its
  14. * contributors may be used to endorse or promote products derived from
  15. * this software without specific prior written permission.
  16. *
  17. * THIS SOFTWARE IS PROVIDED BY THE MIPS TECHNOLOGIES, INC. ``AS IS'' AND
  18. * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  19. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  20. * ARE DISCLAIMED. IN NO EVENT SHALL THE MIPS TECHNOLOGIES, INC. BE LIABLE
  21. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  22. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  23. * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  24. * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  25. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  26. * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  27. * SUCH DAMAGE.
  28. *
  29. * AAC Spectral Band Replication decoding functions (fixed-point)
  30. * Copyright (c) 2008-2009 Robert Swain ( rob opendot cl )
  31. * Copyright (c) 2009-2010 Alex Converse <alex.converse@gmail.com>
  32. *
  33. * This file is part of FFmpeg.
  34. *
  35. * FFmpeg is free software; you can redistribute it and/or
  36. * modify it under the terms of the GNU Lesser General Public
  37. * License as published by the Free Software Foundation; either
  38. * version 2.1 of the License, or (at your option) any later version.
  39. *
  40. * FFmpeg is distributed in the hope that it will be useful,
  41. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  42. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  43. * Lesser General Public License for more details.
  44. *
  45. * You should have received a copy of the GNU Lesser General Public
  46. * License along with FFmpeg; if not, write to the Free Software
  47. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  48. */
  49. /**
  50. * @file
  51. * AAC Spectral Band Replication decoding functions (fixed-point)
  52. * Note: Rounding-to-nearest used unless otherwise stated
  53. * @author Robert Swain ( rob opendot cl )
  54. * @author Stanislav Ocovaj ( stanislav.ocovaj imgtec com )
  55. */
  56. #define USE_FIXED 1
  57. #include "aac.h"
  58. #include "sbr.h"
  59. #include "aacsbr.h"
  60. #include "aacsbrdata.h"
  61. #include "aacsbr_fixed_tablegen.h"
  62. #include "fft.h"
  63. #include "aacps.h"
  64. #include "sbrdsp.h"
  65. #include "libavutil/internal.h"
  66. #include "libavutil/libm.h"
  67. #include "libavutil/avassert.h"
  68. #include <stdint.h>
  69. #include <float.h>
  70. #include <math.h>
  71. static VLC vlc_sbr[10];
  72. static void aacsbr_func_ptr_init(AACSBRContext *c);
  73. static const int CONST_LN2 = Q31(0.6931471806/256); // ln(2)/256
  74. static const int CONST_RECIP_LN2 = Q31(0.7213475204); // 0.5/ln(2)
  75. static const int CONST_076923 = Q31(0.76923076923076923077f);
  76. static const int fixed_log_table[10] =
  77. {
  78. Q31(1.0/2), Q31(1.0/3), Q31(1.0/4), Q31(1.0/5), Q31(1.0/6),
  79. Q31(1.0/7), Q31(1.0/8), Q31(1.0/9), Q31(1.0/10), Q31(1.0/11)
  80. };
  81. static int fixed_log(int x)
  82. {
  83. int i, ret, xpow, tmp;
  84. ret = x;
  85. xpow = x;
  86. for (i=0; i<10; i+=2){
  87. xpow = (int)(((int64_t)xpow * x + 0x40000000) >> 31);
  88. tmp = (int)(((int64_t)xpow * fixed_log_table[i] + 0x40000000) >> 31);
  89. ret -= tmp;
  90. xpow = (int)(((int64_t)xpow * x + 0x40000000) >> 31);
  91. tmp = (int)(((int64_t)xpow * fixed_log_table[i+1] + 0x40000000) >> 31);
  92. ret += tmp;
  93. }
  94. return ret;
  95. }
  96. static const int fixed_exp_table[7] =
  97. {
  98. Q31(1.0/2), Q31(1.0/6), Q31(1.0/24), Q31(1.0/120),
  99. Q31(1.0/720), Q31(1.0/5040), Q31(1.0/40320)
  100. };
  101. static int fixed_exp(int x)
  102. {
  103. int i, ret, xpow, tmp;
  104. ret = 0x800000 + x;
  105. xpow = x;
  106. for (i=0; i<7; i++){
  107. xpow = (int)(((int64_t)xpow * x + 0x400000) >> 23);
  108. tmp = (int)(((int64_t)xpow * fixed_exp_table[i] + 0x40000000) >> 31);
  109. ret += tmp;
  110. }
  111. return ret;
  112. }
  113. static void make_bands(int16_t* bands, int start, int stop, int num_bands)
  114. {
  115. int k, previous, present;
  116. int base, prod, nz = 0;
  117. base = (stop << 23) / start;
  118. while (base < 0x40000000){
  119. base <<= 1;
  120. nz++;
  121. }
  122. base = fixed_log(base - 0x80000000);
  123. base = (((base + 0x80) >> 8) + (8-nz)*CONST_LN2) / num_bands;
  124. base = fixed_exp(base);
  125. previous = start;
  126. prod = start << 23;
  127. for (k = 0; k < num_bands-1; k++) {
  128. prod = (int)(((int64_t)prod * base + 0x400000) >> 23);
  129. present = (prod + 0x400000) >> 23;
  130. bands[k] = present - previous;
  131. previous = present;
  132. }
  133. bands[num_bands-1] = stop - previous;
  134. }
  135. /// Dequantization and stereo decoding (14496-3 sp04 p203)
  136. static void sbr_dequant(SpectralBandReplication *sbr, int id_aac)
  137. {
  138. int k, e;
  139. int ch;
  140. if (id_aac == TYPE_CPE && sbr->bs_coupling) {
  141. int alpha = sbr->data[0].bs_amp_res ? 2 : 1;
  142. int pan_offset = sbr->data[0].bs_amp_res ? 12 : 24;
  143. for (e = 1; e <= sbr->data[0].bs_num_env; e++) {
  144. for (k = 0; k < sbr->n[sbr->data[0].bs_freq_res[e]]; k++) {
  145. SoftFloat temp1, temp2, fac;
  146. temp1.exp = sbr->data[0].env_facs_q[e][k] * alpha + 14;
  147. if (temp1.exp & 1)
  148. temp1.mant = 759250125;
  149. else
  150. temp1.mant = 0x20000000;
  151. temp1.exp = (temp1.exp >> 1) + 1;
  152. if (temp1.exp > 66) { // temp1 > 1E20
  153. av_log(NULL, AV_LOG_ERROR, "envelope scalefactor overflow in dequant\n");
  154. temp1 = FLOAT_1;
  155. }
  156. temp2.exp = (pan_offset - sbr->data[1].env_facs_q[e][k]) * alpha;
  157. if (temp2.exp & 1)
  158. temp2.mant = 759250125;
  159. else
  160. temp2.mant = 0x20000000;
  161. temp2.exp = (temp2.exp >> 1) + 1;
  162. fac = av_div_sf(temp1, av_add_sf(FLOAT_1, temp2));
  163. sbr->data[0].env_facs[e][k] = fac;
  164. sbr->data[1].env_facs[e][k] = av_mul_sf(fac, temp2);
  165. }
  166. }
  167. for (e = 1; e <= sbr->data[0].bs_num_noise; e++) {
  168. for (k = 0; k < sbr->n_q; k++) {
  169. SoftFloat temp1, temp2, fac;
  170. temp1.exp = NOISE_FLOOR_OFFSET - \
  171. sbr->data[0].noise_facs_q[e][k] + 2;
  172. temp1.mant = 0x20000000;
  173. av_assert0(temp1.exp <= 66);
  174. temp2.exp = 12 - sbr->data[1].noise_facs_q[e][k] + 1;
  175. temp2.mant = 0x20000000;
  176. fac = av_div_sf(temp1, av_add_sf(FLOAT_1, temp2));
  177. sbr->data[0].noise_facs[e][k] = fac;
  178. sbr->data[1].noise_facs[e][k] = av_mul_sf(fac, temp2);
  179. }
  180. }
  181. } else { // SCE or one non-coupled CPE
  182. for (ch = 0; ch < (id_aac == TYPE_CPE) + 1; ch++) {
  183. int alpha = sbr->data[ch].bs_amp_res ? 2 : 1;
  184. for (e = 1; e <= sbr->data[ch].bs_num_env; e++)
  185. for (k = 0; k < sbr->n[sbr->data[ch].bs_freq_res[e]]; k++){
  186. SoftFloat temp1;
  187. temp1.exp = alpha * sbr->data[ch].env_facs_q[e][k] + 12;
  188. if (temp1.exp & 1)
  189. temp1.mant = 759250125;
  190. else
  191. temp1.mant = 0x20000000;
  192. temp1.exp = (temp1.exp >> 1) + 1;
  193. if (temp1.exp > 66) { // temp1 > 1E20
  194. av_log(NULL, AV_LOG_ERROR, "envelope scalefactor overflow in dequant\n");
  195. temp1 = FLOAT_1;
  196. }
  197. sbr->data[ch].env_facs[e][k] = temp1;
  198. }
  199. for (e = 1; e <= sbr->data[ch].bs_num_noise; e++)
  200. for (k = 0; k < sbr->n_q; k++){
  201. sbr->data[ch].noise_facs[e][k].exp = NOISE_FLOOR_OFFSET - \
  202. sbr->data[ch].noise_facs_q[e][k] + 1;
  203. sbr->data[ch].noise_facs[e][k].mant = 0x20000000;
  204. }
  205. }
  206. }
  207. }
  208. /** High Frequency Generation (14496-3 sp04 p214+) and Inverse Filtering
  209. * (14496-3 sp04 p214)
  210. * Warning: This routine does not seem numerically stable.
  211. */
  212. static void sbr_hf_inverse_filter(SBRDSPContext *dsp,
  213. int (*alpha0)[2], int (*alpha1)[2],
  214. const int X_low[32][40][2], int k0)
  215. {
  216. int k;
  217. int shift, round;
  218. for (k = 0; k < k0; k++) {
  219. SoftFloat phi[3][2][2];
  220. SoftFloat a00, a01, a10, a11;
  221. SoftFloat dk;
  222. dsp->autocorrelate(X_low[k], phi);
  223. dk = av_sub_sf(av_mul_sf(phi[2][1][0], phi[1][0][0]),
  224. av_mul_sf(av_add_sf(av_mul_sf(phi[1][1][0], phi[1][1][0]),
  225. av_mul_sf(phi[1][1][1], phi[1][1][1])), FLOAT_0999999));
  226. if (!dk.mant) {
  227. a10 = FLOAT_0;
  228. a11 = FLOAT_0;
  229. } else {
  230. SoftFloat temp_real, temp_im;
  231. temp_real = av_sub_sf(av_sub_sf(av_mul_sf(phi[0][0][0], phi[1][1][0]),
  232. av_mul_sf(phi[0][0][1], phi[1][1][1])),
  233. av_mul_sf(phi[0][1][0], phi[1][0][0]));
  234. temp_im = av_sub_sf(av_add_sf(av_mul_sf(phi[0][0][0], phi[1][1][1]),
  235. av_mul_sf(phi[0][0][1], phi[1][1][0])),
  236. av_mul_sf(phi[0][1][1], phi[1][0][0]));
  237. a10 = av_div_sf(temp_real, dk);
  238. a11 = av_div_sf(temp_im, dk);
  239. }
  240. if (!phi[1][0][0].mant) {
  241. a00 = FLOAT_0;
  242. a01 = FLOAT_0;
  243. } else {
  244. SoftFloat temp_real, temp_im;
  245. temp_real = av_add_sf(phi[0][0][0],
  246. av_add_sf(av_mul_sf(a10, phi[1][1][0]),
  247. av_mul_sf(a11, phi[1][1][1])));
  248. temp_im = av_add_sf(phi[0][0][1],
  249. av_sub_sf(av_mul_sf(a11, phi[1][1][0]),
  250. av_mul_sf(a10, phi[1][1][1])));
  251. temp_real.mant = -temp_real.mant;
  252. temp_im.mant = -temp_im.mant;
  253. a00 = av_div_sf(temp_real, phi[1][0][0]);
  254. a01 = av_div_sf(temp_im, phi[1][0][0]);
  255. }
  256. shift = a00.exp;
  257. if (shift >= 3)
  258. alpha0[k][0] = 0x7fffffff;
  259. else {
  260. a00.mant *= 2;
  261. shift = 2-shift;
  262. if (shift == 0)
  263. alpha0[k][0] = a00.mant;
  264. else {
  265. round = 1 << (shift-1);
  266. alpha0[k][0] = (a00.mant + round) >> shift;
  267. }
  268. }
  269. shift = a01.exp;
  270. if (shift >= 3)
  271. alpha0[k][1] = 0x7fffffff;
  272. else {
  273. a01.mant *= 2;
  274. shift = 2-shift;
  275. if (shift == 0)
  276. alpha0[k][1] = a01.mant;
  277. else {
  278. round = 1 << (shift-1);
  279. alpha0[k][1] = (a01.mant + round) >> shift;
  280. }
  281. }
  282. shift = a10.exp;
  283. if (shift >= 3)
  284. alpha1[k][0] = 0x7fffffff;
  285. else {
  286. a10.mant *= 2;
  287. shift = 2-shift;
  288. if (shift == 0)
  289. alpha1[k][0] = a10.mant;
  290. else {
  291. round = 1 << (shift-1);
  292. alpha1[k][0] = (a10.mant + round) >> shift;
  293. }
  294. }
  295. shift = a11.exp;
  296. if (shift >= 3)
  297. alpha1[k][1] = 0x7fffffff;
  298. else {
  299. a11.mant *= 2;
  300. shift = 2-shift;
  301. if (shift == 0)
  302. alpha1[k][1] = a11.mant;
  303. else {
  304. round = 1 << (shift-1);
  305. alpha1[k][1] = (a11.mant + round) >> shift;
  306. }
  307. }
  308. shift = (int)(((int64_t)(alpha1[k][0]>>1) * (alpha1[k][0]>>1) + \
  309. (int64_t)(alpha1[k][1]>>1) * (alpha1[k][1]>>1) + \
  310. 0x40000000) >> 31);
  311. if (shift >= 0x20000000){
  312. alpha1[k][0] = 0;
  313. alpha1[k][1] = 0;
  314. alpha0[k][0] = 0;
  315. alpha0[k][1] = 0;
  316. }
  317. shift = (int)(((int64_t)(alpha0[k][0]>>1) * (alpha0[k][0]>>1) + \
  318. (int64_t)(alpha0[k][1]>>1) * (alpha0[k][1]>>1) + \
  319. 0x40000000) >> 31);
  320. if (shift >= 0x20000000){
  321. alpha1[k][0] = 0;
  322. alpha1[k][1] = 0;
  323. alpha0[k][0] = 0;
  324. alpha0[k][1] = 0;
  325. }
  326. }
  327. }
  328. /// Chirp Factors (14496-3 sp04 p214)
  329. static void sbr_chirp(SpectralBandReplication *sbr, SBRData *ch_data)
  330. {
  331. int i;
  332. int new_bw;
  333. static const int bw_tab[] = { 0, 1610612736, 1932735283, 2104533975 };
  334. int64_t accu;
  335. for (i = 0; i < sbr->n_q; i++) {
  336. if (ch_data->bs_invf_mode[0][i] + ch_data->bs_invf_mode[1][i] == 1)
  337. new_bw = 1288490189;
  338. else
  339. new_bw = bw_tab[ch_data->bs_invf_mode[0][i]];
  340. if (new_bw < ch_data->bw_array[i]){
  341. accu = (int64_t)new_bw * 1610612736;
  342. accu += (int64_t)ch_data->bw_array[i] * 0x20000000;
  343. new_bw = (int)((accu + 0x40000000) >> 31);
  344. } else {
  345. accu = (int64_t)new_bw * 1946157056;
  346. accu += (int64_t)ch_data->bw_array[i] * 201326592;
  347. new_bw = (int)((accu + 0x40000000) >> 31);
  348. }
  349. ch_data->bw_array[i] = new_bw < 0x2000000 ? 0 : new_bw;
  350. }
  351. }
  352. /**
  353. * Calculation of levels of additional HF signal components (14496-3 sp04 p219)
  354. * and Calculation of gain (14496-3 sp04 p219)
  355. */
  356. static void sbr_gain_calc(AACContext *ac, SpectralBandReplication *sbr,
  357. SBRData *ch_data, const int e_a[2])
  358. {
  359. int e, k, m;
  360. // max gain limits : -3dB, 0dB, 3dB, inf dB (limiter off)
  361. static const SoftFloat limgain[4] = { { 760155524, 0 }, { 0x20000000, 1 },
  362. { 758351638, 1 }, { 625000000, 34 } };
  363. for (e = 0; e < ch_data->bs_num_env; e++) {
  364. int delta = !((e == e_a[1]) || (e == e_a[0]));
  365. for (k = 0; k < sbr->n_lim; k++) {
  366. SoftFloat gain_boost, gain_max;
  367. SoftFloat sum[2];
  368. sum[0] = sum[1] = FLOAT_0;
  369. for (m = sbr->f_tablelim[k] - sbr->kx[1]; m < sbr->f_tablelim[k + 1] - sbr->kx[1]; m++) {
  370. const SoftFloat temp = av_div_sf(sbr->e_origmapped[e][m],
  371. av_add_sf(FLOAT_1, sbr->q_mapped[e][m]));
  372. sbr->q_m[e][m] = av_sqrt_sf(av_mul_sf(temp, sbr->q_mapped[e][m]));
  373. sbr->s_m[e][m] = av_sqrt_sf(av_mul_sf(temp, av_int2sf(ch_data->s_indexmapped[e + 1][m], 0)));
  374. if (!sbr->s_mapped[e][m]) {
  375. if (delta) {
  376. sbr->gain[e][m] = av_sqrt_sf(av_div_sf(sbr->e_origmapped[e][m],
  377. av_mul_sf(av_add_sf(FLOAT_1, sbr->e_curr[e][m]),
  378. av_add_sf(FLOAT_1, sbr->q_mapped[e][m]))));
  379. } else {
  380. sbr->gain[e][m] = av_sqrt_sf(av_div_sf(sbr->e_origmapped[e][m],
  381. av_add_sf(FLOAT_1, sbr->e_curr[e][m])));
  382. }
  383. } else {
  384. sbr->gain[e][m] = av_sqrt_sf(
  385. av_div_sf(
  386. av_mul_sf(sbr->e_origmapped[e][m], sbr->q_mapped[e][m]),
  387. av_mul_sf(
  388. av_add_sf(FLOAT_1, sbr->e_curr[e][m]),
  389. av_add_sf(FLOAT_1, sbr->q_mapped[e][m]))));
  390. }
  391. }
  392. for (m = sbr->f_tablelim[k] - sbr->kx[1]; m < sbr->f_tablelim[k + 1] - sbr->kx[1]; m++) {
  393. sum[0] = av_add_sf(sum[0], sbr->e_origmapped[e][m]);
  394. sum[1] = av_add_sf(sum[1], sbr->e_curr[e][m]);
  395. }
  396. gain_max = av_mul_sf(limgain[sbr->bs_limiter_gains],
  397. av_sqrt_sf(
  398. av_div_sf(
  399. av_add_sf(FLOAT_EPSILON, sum[0]),
  400. av_add_sf(FLOAT_EPSILON, sum[1]))));
  401. if (av_gt_sf(gain_max, FLOAT_100000))
  402. gain_max = FLOAT_100000;
  403. for (m = sbr->f_tablelim[k] - sbr->kx[1]; m < sbr->f_tablelim[k + 1] - sbr->kx[1]; m++) {
  404. SoftFloat q_m_max = av_div_sf(
  405. av_mul_sf(sbr->q_m[e][m], gain_max),
  406. sbr->gain[e][m]);
  407. if (av_gt_sf(sbr->q_m[e][m], q_m_max))
  408. sbr->q_m[e][m] = q_m_max;
  409. if (av_gt_sf(sbr->gain[e][m], gain_max))
  410. sbr->gain[e][m] = gain_max;
  411. }
  412. sum[0] = sum[1] = FLOAT_0;
  413. for (m = sbr->f_tablelim[k] - sbr->kx[1]; m < sbr->f_tablelim[k + 1] - sbr->kx[1]; m++) {
  414. sum[0] = av_add_sf(sum[0], sbr->e_origmapped[e][m]);
  415. sum[1] = av_add_sf(sum[1],
  416. av_mul_sf(
  417. av_mul_sf(sbr->e_curr[e][m],
  418. sbr->gain[e][m]),
  419. sbr->gain[e][m]));
  420. sum[1] = av_add_sf(sum[1],
  421. av_mul_sf(sbr->s_m[e][m], sbr->s_m[e][m]));
  422. if (delta && !sbr->s_m[e][m].mant)
  423. sum[1] = av_add_sf(sum[1],
  424. av_mul_sf(sbr->q_m[e][m], sbr->q_m[e][m]));
  425. }
  426. gain_boost = av_sqrt_sf(
  427. av_div_sf(
  428. av_add_sf(FLOAT_EPSILON, sum[0]),
  429. av_add_sf(FLOAT_EPSILON, sum[1])));
  430. if (av_gt_sf(gain_boost, FLOAT_1584893192))
  431. gain_boost = FLOAT_1584893192;
  432. for (m = sbr->f_tablelim[k] - sbr->kx[1]; m < sbr->f_tablelim[k + 1] - sbr->kx[1]; m++) {
  433. sbr->gain[e][m] = av_mul_sf(sbr->gain[e][m], gain_boost);
  434. sbr->q_m[e][m] = av_mul_sf(sbr->q_m[e][m], gain_boost);
  435. sbr->s_m[e][m] = av_mul_sf(sbr->s_m[e][m], gain_boost);
  436. }
  437. }
  438. }
  439. }
  440. /// Assembling HF Signals (14496-3 sp04 p220)
  441. static void sbr_hf_assemble(int Y1[38][64][2],
  442. const int X_high[64][40][2],
  443. SpectralBandReplication *sbr, SBRData *ch_data,
  444. const int e_a[2])
  445. {
  446. int e, i, j, m;
  447. const int h_SL = 4 * !sbr->bs_smoothing_mode;
  448. const int kx = sbr->kx[1];
  449. const int m_max = sbr->m[1];
  450. static const SoftFloat h_smooth[5] = {
  451. { 715827883, -1 },
  452. { 647472402, -1 },
  453. { 937030863, -2 },
  454. { 989249804, -3 },
  455. { 546843842, -4 },
  456. };
  457. SoftFloat (*g_temp)[48] = ch_data->g_temp, (*q_temp)[48] = ch_data->q_temp;
  458. int indexnoise = ch_data->f_indexnoise;
  459. int indexsine = ch_data->f_indexsine;
  460. if (sbr->reset) {
  461. for (i = 0; i < h_SL; i++) {
  462. memcpy(g_temp[i + 2*ch_data->t_env[0]], sbr->gain[0], m_max * sizeof(sbr->gain[0][0]));
  463. memcpy(q_temp[i + 2*ch_data->t_env[0]], sbr->q_m[0], m_max * sizeof(sbr->q_m[0][0]));
  464. }
  465. } else if (h_SL) {
  466. for (i = 0; i < 4; i++) {
  467. memcpy(g_temp[i + 2 * ch_data->t_env[0]],
  468. g_temp[i + 2 * ch_data->t_env_num_env_old],
  469. sizeof(g_temp[0]));
  470. memcpy(q_temp[i + 2 * ch_data->t_env[0]],
  471. q_temp[i + 2 * ch_data->t_env_num_env_old],
  472. sizeof(q_temp[0]));
  473. }
  474. }
  475. for (e = 0; e < ch_data->bs_num_env; e++) {
  476. for (i = 2 * ch_data->t_env[e]; i < 2 * ch_data->t_env[e + 1]; i++) {
  477. memcpy(g_temp[h_SL + i], sbr->gain[e], m_max * sizeof(sbr->gain[0][0]));
  478. memcpy(q_temp[h_SL + i], sbr->q_m[e], m_max * sizeof(sbr->q_m[0][0]));
  479. }
  480. }
  481. for (e = 0; e < ch_data->bs_num_env; e++) {
  482. for (i = 2 * ch_data->t_env[e]; i < 2 * ch_data->t_env[e + 1]; i++) {
  483. SoftFloat g_filt_tab[48];
  484. SoftFloat q_filt_tab[48];
  485. SoftFloat *g_filt, *q_filt;
  486. if (h_SL && e != e_a[0] && e != e_a[1]) {
  487. g_filt = g_filt_tab;
  488. q_filt = q_filt_tab;
  489. for (m = 0; m < m_max; m++) {
  490. const int idx1 = i + h_SL;
  491. g_filt[m].mant = g_filt[m].exp = 0;
  492. q_filt[m].mant = q_filt[m].exp = 0;
  493. for (j = 0; j <= h_SL; j++) {
  494. g_filt[m] = av_add_sf(g_filt[m],
  495. av_mul_sf(g_temp[idx1 - j][m],
  496. h_smooth[j]));
  497. q_filt[m] = av_add_sf(q_filt[m],
  498. av_mul_sf(q_temp[idx1 - j][m],
  499. h_smooth[j]));
  500. }
  501. }
  502. } else {
  503. g_filt = g_temp[i + h_SL];
  504. q_filt = q_temp[i];
  505. }
  506. sbr->dsp.hf_g_filt(Y1[i] + kx, X_high + kx, g_filt, m_max,
  507. i + ENVELOPE_ADJUSTMENT_OFFSET);
  508. if (e != e_a[0] && e != e_a[1]) {
  509. sbr->dsp.hf_apply_noise[indexsine](Y1[i] + kx, sbr->s_m[e],
  510. q_filt, indexnoise,
  511. kx, m_max);
  512. } else {
  513. int idx = indexsine&1;
  514. int A = (1-((indexsine+(kx & 1))&2));
  515. int B = (A^(-idx)) + idx;
  516. int *out = &Y1[i][kx][idx];
  517. int shift, round;
  518. SoftFloat *in = sbr->s_m[e];
  519. for (m = 0; m+1 < m_max; m+=2) {
  520. shift = 22 - in[m ].exp;
  521. round = 1 << (shift-1);
  522. out[2*m ] += (in[m ].mant * A + round) >> shift;
  523. shift = 22 - in[m+1].exp;
  524. round = 1 << (shift-1);
  525. out[2*m+2] += (in[m+1].mant * B + round) >> shift;
  526. }
  527. if(m_max&1)
  528. {
  529. shift = 22 - in[m ].exp;
  530. round = 1 << (shift-1);
  531. out[2*m ] += (in[m ].mant * A + round) >> shift;
  532. }
  533. }
  534. indexnoise = (indexnoise + m_max) & 0x1ff;
  535. indexsine = (indexsine + 1) & 3;
  536. }
  537. }
  538. ch_data->f_indexnoise = indexnoise;
  539. ch_data->f_indexsine = indexsine;
  540. }
  541. #include "aacsbr_template.c"