You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1136 lines
27KB

  1. /* Copyright (C) 2007 Hong Zhiqian */
  2. /**
  3. @file preprocess_tm.h
  4. @author Hong Zhiqian
  5. @brief Various compatibility routines for Speex (TriMedia version)
  6. */
  7. /*
  8. Redistribution and use in source and binary forms, with or without
  9. modification, are permitted provided that the following conditions
  10. are met:
  11. - Redistributions of source code must retain the above copyright
  12. notice, this list of conditions and the following disclaimer.
  13. - Redistributions in binary form must reproduce the above copyright
  14. notice, this list of conditions and the following disclaimer in the
  15. documentation and/or other materials provided with the distribution.
  16. - Neither the name of the Xiph.org Foundation nor the names of its
  17. contributors may be used to endorse or promote products derived from
  18. this software without specific prior written permission.
  19. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  20. ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  21. LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  22. A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR
  23. CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
  24. EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
  25. PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
  26. PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
  27. LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
  28. NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  29. SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  30. */
  31. #include <ops/custom_defs.h>
  32. #include "profile_tm.h"
  33. #ifdef FIXED_POINT
  34. #define OVERRIDE_PREPROCESS_ANALYSIS
  35. static void preprocess_analysis(SpeexPreprocessState * restrict st, spx_int16_t * restrict x)
  36. {
  37. register int i, j, framesize = st->frame_size;
  38. register int N = st->ps_size;
  39. register int N3 = 2*N - framesize;
  40. register int N4 = framesize - N3;
  41. register int * restrict ps = st->ps;
  42. register int * restrict frame;
  43. register int * restrict inbuf;
  44. register int * restrict ptr;
  45. register int max_val;
  46. frame = (int*)(st->frame);
  47. inbuf = (int*)(st->inbuf);
  48. ptr = (int*)(st->frame+N3);
  49. TMDEBUG_ALIGNMEM(x);
  50. TMDEBUG_ALIGNMEM(frame);
  51. TMDEBUG_ALIGNMEM(inbuf);
  52. PREPROCESSANAYLSIS_START();
  53. N3 >>= 1;
  54. framesize >>= 1;
  55. max_val = 0;
  56. for ( i=0,j=0 ; i<N3 ; i+=2,j+=8 )
  57. { register int r1, r2;
  58. r1 = ld32x(inbuf,i);
  59. r2 = ld32x(inbuf,i+1);
  60. st32d(j, frame, r1);
  61. st32d(j+4, frame, r2);
  62. }
  63. for ( i=0,j=0 ; i<framesize ; i+=2,j+=8 )
  64. { register int r1, r2;
  65. r1 = ld32x(x, i);
  66. r2 = ld32x(x, i+1);
  67. st32d(j, ptr, r1);
  68. st32d(j+4,ptr, r2);
  69. }
  70. for ( i=0,j=0,ptr=(int*)(x+N4) ; i<N3 ; i+=2,j+=8 )
  71. { register int r1, r2;
  72. r1 = ld32x(ptr, i);
  73. r2 = ld32x(ptr, i+1);
  74. st32d(j, inbuf, r1);
  75. st32d(j+4,inbuf, r2);
  76. }
  77. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  78. #pragma TCS_unroll=2
  79. #pragma TCS_unrollexact=1
  80. #endif
  81. for ( i=0,j=0,ptr=(int*)st->window ; i<N ; ++i,j+=4 )
  82. { register int f10, w10, r0, r1;
  83. f10 = ld32x(frame, i);
  84. w10 = ld32x(ptr, i);
  85. r0 = (sex16(f10) * sex16(w10)) >> 15;
  86. r1 = (asri(16,f10) * asri(16,w10)) >> 15;
  87. max_val = imax(iabs(sex16(r0)), max_val);
  88. max_val = imax(iabs(sex16(r1)), max_val);
  89. r0 = pack16lsb(r1, r0);
  90. st32d(j, frame, r0);
  91. }
  92. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  93. #pragma TCS_unrollexact=0
  94. #pragma TCS_unroll=0
  95. #endif
  96. max_val = 14 - spx_ilog2(max_val);
  97. st->frame_shift = max_val;
  98. if ( max_val != 0 )
  99. {
  100. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  101. #pragma TCS_unroll=4
  102. #pragma TCS_unrollexact=1
  103. #endif
  104. for ( i=0,j=0 ; i<N ; ++i,j+=4 )
  105. { register int f10;
  106. f10 = ld32x(frame, i);
  107. f10 = dualasl(f10, max_val);
  108. st32d(j, frame, f10);
  109. }
  110. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  111. #pragma TCS_unrollexact=0
  112. #pragma TCS_unroll=0
  113. #endif
  114. }
  115. spx_fft(st->fft_lookup, st->frame, st->ft);
  116. power_spectrum(st->ft, ps, N << 1);
  117. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  118. #pragma TCS_unroll=4
  119. #pragma TCS_unrollexact=1
  120. #endif
  121. for ( i=0,ptr=(int*)st->ps,max_val<<=1,j=((1<<((max_val))>>1)) ;i<N ; ++i )
  122. {
  123. ps[i] = (ps[i] + j) >> max_val;
  124. }
  125. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  126. #pragma TCS_unrollexact=0
  127. #pragma TCS_unroll=0
  128. #endif
  129. filterbank_compute_bank32(st->bank, ps, ps+N);
  130. PREPROCESSANAYLSIS_STOP();
  131. }
  132. #define _MULT16_32_Q15(a,b,c) ADD32(MULT16_16((a),(b)), SHR(MULT16_16((a),(c)),15))
  133. #define OVERRIDE_UPDATE_NOISE_PROB
  134. static void update_noise_prob(SpeexPreprocessState * restrict st)
  135. {
  136. register int i;
  137. register int min_range, nb_adapt;
  138. register int N = st->ps_size;
  139. register int * restrict Smin = (int*)st->Smin;
  140. register int * restrict Stmp = (int*)st->Stmp;
  141. register int * restrict S = (int*)st->S;
  142. UPDATENOISEPROB_START();
  143. {
  144. register int psi_lsb, psi_msb, ips_lsb, ips_msb, psii_lsb, psii_msb;
  145. register int psiii_lsb, psiii_msb;
  146. register int q8, q05, q2, q1;
  147. register int *ps = (int*)st->ps;
  148. register int si_lsb, si_msb, sii_lsb, sii_msb;
  149. q8 = QCONST16(.8f,15);
  150. q05 = QCONST16(.05f,15);
  151. q2 = QCONST16(.2f,15);
  152. q1 = QCONST16(.1f,15);
  153. ips_lsb = ps[0];
  154. psi_lsb = ps[1];
  155. si_lsb = S[0];
  156. ips_msb = ips_lsb >> 15;
  157. psi_msb = psi_lsb >> 15;
  158. si_msb = si_lsb >> 15;
  159. ips_lsb &= 0x00007fff;
  160. psi_lsb &= 0x00007fff;
  161. si_lsb &= 0x00007fff;
  162. S[0] = _MULT16_32_Q15(q8,si_msb,si_lsb) + _MULT16_32_Q15(q2,ips_msb,ips_lsb);
  163. for ( i=1 ; i<N-1 ; i+=2 )
  164. {
  165. psii_lsb = ps[i+1];
  166. si_lsb = S[i];
  167. psii_msb = psii_lsb >> 15;
  168. si_msb = si_lsb >> 15;
  169. si_lsb &= 0x00007fff;
  170. psii_lsb &= 0x00007fff;
  171. S[i]= _MULT16_32_Q15(q8,si_msb,si_lsb) +
  172. _MULT16_32_Q15(q05,ips_msb,ips_lsb) +
  173. _MULT16_32_Q15(q1,psi_msb,psi_lsb) +
  174. _MULT16_32_Q15(q05,psii_msb,psii_lsb);
  175. psiii_lsb = ps[i+2];
  176. sii_lsb = S[i+1];
  177. sii_msb = sii_lsb >> 15;
  178. psiii_msb= psiii_lsb >> 15;
  179. sii_lsb &= 0x00007fff;
  180. psiii_lsb&= 0x00007fff;
  181. S[i+1]= _MULT16_32_Q15(q8,sii_msb,sii_lsb) +
  182. _MULT16_32_Q15(q05,psi_msb,psi_lsb) +
  183. _MULT16_32_Q15(q1,psii_msb,psii_lsb) +
  184. _MULT16_32_Q15(q05,psiii_msb,psiii_lsb);
  185. ips_lsb = psii_lsb;
  186. ips_msb = psii_msb;
  187. psi_lsb = psiii_lsb;
  188. psi_msb = psiii_msb;
  189. }
  190. S[N-1] = MULT16_32_Q15(q8,S[N-1]) + MULT16_32_Q15(q2,ps[N-1]);
  191. }
  192. nb_adapt = st->nb_adapt;
  193. if ( nb_adapt==1 )
  194. { for ( i=0 ; i<N ; ++i )
  195. Smin[i] = Stmp[i] = 0;
  196. }
  197. min_range = mux(nb_adapt < 100, 15,
  198. mux(nb_adapt < 1000, 50,
  199. mux(nb_adapt < 10000, 150, 300)));
  200. if ( st->min_count > min_range )
  201. {
  202. st->min_count = 0;
  203. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  204. #pragma TCS_unroll=2
  205. #pragma TCS_unrollexact=1
  206. #endif
  207. for ( i=0 ; i<N ; ++i )
  208. { register int si, stmpi;
  209. si = S[i];
  210. stmpi = Stmp[i];
  211. Smin[i] = imin(stmpi,si);
  212. Stmp[i] = si;
  213. }
  214. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  215. #pragma TCS_unrollexact=0
  216. #pragma TCS_unroll=0
  217. #endif
  218. } else
  219. {
  220. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  221. #pragma TCS_unroll=2
  222. #pragma TCS_unrollexact=1
  223. #endif
  224. for ( i=0 ; i<N ; ++i )
  225. { register int si, stmpi, smini;
  226. si = S[i];
  227. stmpi = Stmp[i];
  228. smini = Smin[i];
  229. Smin[i] = imin(smini,si);
  230. Stmp[i] = imin(stmpi,si);
  231. }
  232. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  233. #pragma TCS_unrollexact=0
  234. #pragma TCS_unroll=0
  235. #endif
  236. }
  237. {
  238. register int q4;
  239. register int * restrict update_prob = (int*)st->update_prob;
  240. q4 = QCONST16(.4f,15);
  241. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  242. #pragma TCS_unroll=4
  243. #pragma TCS_unrollexact=1
  244. #endif
  245. for ( i=0 ; i<N ; ++i )
  246. { register int si;
  247. register int smini;
  248. si = S[i];
  249. smini = Smin[i];
  250. update_prob[i] = mux(MULT16_32_Q15(q4,si) > ADD32(smini,20), 1, 0);
  251. }
  252. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  253. #pragma TCS_unrollexact=0
  254. #pragma TCS_unroll=0
  255. #endif
  256. }
  257. UPDATENOISEPROB_STOP();
  258. }
  259. #else
  260. #define OVERRIDE_PREPROCESS_ANALYSIS
  261. static void preprocess_analysis(SpeexPreprocessState * restrict st, spx_int16_t * restrict x)
  262. {
  263. register int i;
  264. register int framesize = st->frame_size;
  265. register int N = st->ps_size;
  266. register int N3 = 2*N - framesize;
  267. register int N4 = framesize - N3;
  268. register float * restrict ps = st->ps;
  269. register float * restrict frame = st->frame;
  270. register float * restrict inbuf = st->inbuf;
  271. PREPROCESSANAYLSIS_START();
  272. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  273. #pragma TCS_unroll=4
  274. #pragma TCS_unrollexact=1
  275. #endif
  276. for ( i=0 ; i<N3 ; ++i )
  277. {
  278. frame[i] = inbuf[i];
  279. }
  280. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  281. #pragma TCS_unrollexact=0
  282. #pragma TCS_unroll=0
  283. #endif
  284. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  285. #pragma TCS_unroll=4
  286. #pragma TCS_unrollexact=1
  287. #endif
  288. for ( i=0 ; i<framesize ; ++i )
  289. { frame[N3+i] = x[i];
  290. }
  291. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  292. #pragma TCS_unrollexact=0
  293. #pragma TCS_unroll=0
  294. #endif
  295. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  296. #pragma TCS_unroll=4
  297. #pragma TCS_unrollexact=1
  298. #endif
  299. for ( i=0,x+=N4 ; i<N3 ; ++i )
  300. { inbuf[i] = x[i];
  301. }
  302. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  303. #pragma TCS_unrollexact=0
  304. #pragma TCS_unroll=0
  305. #endif
  306. inbuf = st->window;
  307. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  308. #pragma TCS_unroll=4
  309. #pragma TCS_unrollexact=1
  310. #endif
  311. for ( i=0 ; i<2*N ; ++i )
  312. {
  313. frame[i] = frame[i] * inbuf[i];
  314. }
  315. #if (TM_UNROLL && TM_UNROLL_PREPROCESSANALYSIS)
  316. #pragma TCS_unrollexact=0
  317. #pragma TCS_unroll=0
  318. #endif
  319. spx_fft(st->fft_lookup, frame, st->ft);
  320. power_spectrum(st->ft, ps, N << 1);
  321. filterbank_compute_bank32(st->bank, ps, ps+N);
  322. PREPROCESSANAYLSIS_STOP();
  323. }
  324. #define OVERRIDE_UPDATE_NOISE_PROB
  325. static void update_noise_prob(SpeexPreprocessState * restrict st)
  326. {
  327. register float * restrict S = st->S;
  328. register float * restrict ps = st->ps;
  329. register int N = st->ps_size;
  330. register int min_range;
  331. register int i;
  332. register int nb_adapt;
  333. register float * restrict Smin = st->Smin;
  334. register float * restrict Stmp = st->Stmp;
  335. UPDATENOISEPROB_START();
  336. {
  337. register float ips, psi;
  338. ips = ps[0];
  339. psi = ps[1];
  340. S[0] = .8f * S[0] + .2f * ips;
  341. for ( i=1 ; i<N-1 ; i+=2 )
  342. {
  343. register float psii, psiii;
  344. psii = ps[i+1];
  345. psiii = ps[i+2];
  346. S[i] = .8f * S[i] + .05f * ips + .1f * psi + .05f * psii;
  347. S[i+1] = .8f * S[i+1] + .05f * psi + .1f * psii + .05f * psiii;
  348. ips = psii;
  349. psi = psiii;
  350. }
  351. S[N-1] = .8f * S[N-1] + .2f * ps[N-1];
  352. }
  353. nb_adapt = st->nb_adapt;
  354. if ( nb_adapt==1 )
  355. {
  356. for (i=0;i<N;i++)
  357. Smin[i] = st->Stmp[i] = 0;
  358. }
  359. min_range = mux(nb_adapt < 100, 15,
  360. mux(nb_adapt < 1000, 50,
  361. mux(nb_adapt < 10000, 150, 300)));
  362. if ( st->min_count > min_range )
  363. {
  364. st->min_count = 0;
  365. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  366. #pragma TCS_unroll=4
  367. #pragma TCS_unrollexact=1
  368. #endif
  369. for ( i=0 ; i<N ; ++i )
  370. {
  371. register float stmpi, si;
  372. stmpi = Stmp[i];
  373. si = S[i];
  374. Smin[i] = fmin(stmpi,si);
  375. Stmp[i] = si;
  376. }
  377. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  378. #pragma TCS_unrollexact=0
  379. #pragma TCS_unroll=0
  380. #endif
  381. } else
  382. {
  383. register float * restrict Smin = st->Smin;
  384. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  385. #pragma TCS_unroll=4
  386. #pragma TCS_unrollexact=1
  387. #endif
  388. for ( i=0 ; i<N ; ++i )
  389. {
  390. register float stmpi, si, smini;
  391. stmpi = Stmp[i];
  392. si = S[i];
  393. smini = Smin[i];
  394. Smin[i] = fmin(smini,si);
  395. Stmp[i] = fmin(stmpi,si);
  396. }
  397. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  398. #pragma TCS_unrollexact=0
  399. #pragma TCS_unroll=0
  400. #endif
  401. }
  402. {
  403. register int * restrict update_prob = (int*)st->update_prob;
  404. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  405. #pragma TCS_unroll=4
  406. #pragma TCS_unrollexact=1
  407. #endif
  408. for (i=0;i<N;i++)
  409. { register float si;
  410. register float smini;
  411. si = S[i];
  412. smini = Smin[i];
  413. update_prob[i] = mux( (.4 * si) > (smini + 20.f), 1, 0);
  414. }
  415. #if (TM_UNROLL && TM_UNROLL_UPDATENOISEPROB)
  416. #pragma TCS_unrollexact=0
  417. #pragma TCS_unroll=0
  418. #endif
  419. }
  420. UPDATENOISEPROB_STOP();
  421. }
  422. #define OVERRIDE_COMPUTE_GAIN_FLOOR
  423. static void compute_gain_floor(
  424. int noise_suppress,
  425. int effective_echo_suppress,
  426. float * restrict noise,
  427. float * restrict echo,
  428. float * gain_floor,
  429. int len
  430. )
  431. {
  432. register int i;
  433. register float echo_floor;
  434. register float noise_floor;
  435. COMPUTEGAINFLOOR_START();
  436. noise_floor = exp(.2302585f*noise_suppress);
  437. echo_floor = exp(.2302585f*effective_echo_suppress);
  438. #if (TM_UNROLL && TM_UNROLL_COMPUTEGAINFLOOR)
  439. #pragma TCS_unroll=4
  440. #pragma TCS_unrollexact=1
  441. #endif
  442. for (i=0;i<len;i++)
  443. { register float noisei, echoi;
  444. noisei = noise[i];
  445. echoi = echo[i];
  446. gain_floor[i] = FRAC_SCALING * sqrt(noise_floor * noisei + echo_floor * echoi) / sqrt(1+noisei+echoi);
  447. }
  448. #if (TM_UNROLL && TM_UNROLL_COMPUTEGAINFLOOR)
  449. #pragma TCS_unrollexact=0
  450. #pragma TCS_unroll=0
  451. #endif
  452. COMPUTEGAINFLOOR_STOP();
  453. }
  454. #endif
  455. static inline spx_word32_t hypergeom_gain(spx_word32_t xx);
  456. static inline spx_word16_t qcurve(spx_word16_t x);
  457. static void compute_gain_floor(int noise_suppress, int effective_echo_suppress, spx_word32_t *noise, spx_word32_t *echo, spx_word16_t *gain_floor, int len);
  458. void speex_echo_get_residual(SpeexEchoState *st, spx_word32_t *Yout, int len);
  459. #ifndef FIXED_POINT
  460. static void speex_compute_agc(SpeexPreprocessState *st, spx_word16_t Pframe, spx_word16_t *ft);
  461. #endif
  462. void preprocess_residue_echo(
  463. SpeexPreprocessState * restrict st,
  464. int N,
  465. int NM
  466. )
  467. {
  468. if (st->echo_state)
  469. {
  470. register spx_word32_t * restrict r_echo = st->residual_echo;
  471. register spx_word32_t * restrict e_noise = st->echo_noise;
  472. register int i;
  473. #ifndef FIXED_POINT
  474. register spx_word32_t r;
  475. #endif
  476. speex_echo_get_residual(st->echo_state, r_echo, N);
  477. #ifndef FIXED_POINT
  478. r = r_echo[0];
  479. if (!(r >=0 && r < N*1e9f) )
  480. {
  481. memset(r_echo, 0, N * sizeof(spx_word32_t));
  482. }
  483. #endif
  484. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  485. #pragma TCS_unroll=4
  486. #pragma TCS_unrollexact=1
  487. #endif
  488. for (i=0;i<N;i++)
  489. { register spx_word32_t eni = e_noise[i];
  490. e_noise[i] = MAX32(MULT16_32_Q15(QCONST16(.6f,15),eni), r_echo[i]);
  491. }
  492. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  493. #pragma TCS_unrollexact=0
  494. #pragma TCS_unroll=0
  495. #endif
  496. filterbank_compute_bank32(st->bank, e_noise, e_noise+N);
  497. } else
  498. { memset(st->echo_noise, 0, (NM) * sizeof(spx_word32_t));
  499. }
  500. }
  501. void preprocess_update_noise(
  502. SpeexPreprocessState * restrict st,
  503. spx_word32_t * restrict ps,
  504. int N
  505. )
  506. {
  507. register spx_word16_t beta, beta_1;
  508. register int * restrict up = st->update_prob;
  509. register spx_word32_t * restrict noise = st->noise;
  510. register int i;
  511. beta = MAX16(QCONST16(.03,15),DIV32_16(Q15_ONE,st->nb_adapt));
  512. beta_1 = Q15_ONE-beta;
  513. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  514. #pragma TCS_unroll=4
  515. #pragma TCS_unrollexact=1
  516. #endif
  517. for (i=0;i<N;i++)
  518. { register spx_word32_t ni = noise[i];
  519. register spx_word32_t psi = ps[i];
  520. if ( !up[i] || psi < PSHR32(ni, NOISE_SHIFT) )
  521. { noise[i] = MAX32(EXTEND32(0),MULT16_32_Q15(beta_1,ni) +
  522. MULT16_32_Q15(beta,SHL32(psi,NOISE_SHIFT)));
  523. }
  524. }
  525. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  526. #pragma TCS_unrollexact=0
  527. #pragma TCS_unroll=0
  528. #endif
  529. filterbank_compute_bank32(st->bank, noise, noise+N);
  530. }
  531. void preprocess_compute_SNR(
  532. SpeexPreprocessState * restrict st,
  533. spx_word32_t * restrict ps,
  534. int NM
  535. )
  536. {
  537. register spx_word32_t * restrict noise = st->noise;
  538. register spx_word32_t * restrict echo = st->echo_noise;
  539. register spx_word32_t * restrict reverb = st->reverb_estimate;
  540. register spx_word16_t * restrict post = st->post;
  541. register spx_word32_t * restrict old_ps = st->old_ps;
  542. register spx_word16_t * restrict prior = st->prior;
  543. register int i;
  544. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  545. #pragma TCS_unroll=4
  546. #pragma TCS_unrollexact=1
  547. #endif
  548. for ( i=0 ; i<NM ; i++)
  549. {
  550. register spx_word16_t gamma;
  551. register spx_word32_t tot_noise;
  552. register spx_word16_t posti;
  553. register spx_word32_t opsi;
  554. register spx_word16_t priori;
  555. tot_noise = ADD32(ADD32(ADD32(EXTEND32(1), PSHR32(noise[i],NOISE_SHIFT)), echo[i]) , reverb[i]);
  556. posti = SUB16(DIV32_16_Q8(ps[i],tot_noise), QCONST16(1.f,SNR_SHIFT));
  557. posti = MIN16(posti, QCONST16(100.f,SNR_SHIFT));
  558. post[i] = posti;
  559. opsi = old_ps[i];
  560. gamma = QCONST16(.1f,15)+MULT16_16_Q15(QCONST16(.89f,15),SQR16_Q15(DIV32_16_Q15(opsi,ADD32(opsi,tot_noise))));
  561. priori = EXTRACT16(PSHR32(ADD32(MULT16_16(gamma,MAX16(0,posti)), MULT16_16(Q15_ONE-gamma,DIV32_16_Q8(opsi,tot_noise))), 15));
  562. prior[i]=MIN16(priori, QCONST16(100.f,SNR_SHIFT));
  563. }
  564. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  565. #pragma TCS_unrollexact=0
  566. #pragma TCS_unroll=0
  567. #endif
  568. }
  569. spx_word32_t preprocess_smooth_SNR(
  570. SpeexPreprocessState * restrict st,
  571. int N,
  572. int NM
  573. )
  574. {
  575. register spx_word16_t * restrict zeta = st->zeta;
  576. register spx_word16_t * restrict prior = st->prior;
  577. register spx_word32_t Zframe;
  578. register spx_word16_t iprior, priori;
  579. register int _N = N-1;
  580. register int i;
  581. iprior = prior[0];
  582. priori = prior[1];
  583. zeta[0] = PSHR32(ADD32(MULT16_16(QCONST16(.7f,15),zeta[0]), MULT16_16(QCONST16(.3f,15),iprior)),15);
  584. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  585. #pragma TCS_unroll=2
  586. #pragma TCS_unrollexact=1
  587. #endif
  588. for ( i=1 ; i<_N ; i++)
  589. { register spx_word16_t zetai = zeta[i];
  590. register spx_word16_t priorii = prior[i+1];
  591. zeta[i] = PSHR32(ADD32(ADD32(ADD32(MULT16_16(QCONST16(.7f,15),zetai), MULT16_16(QCONST16(.15f,15),priori)),
  592. MULT16_16(QCONST16(.075f,15),iprior)), MULT16_16(QCONST16(.075f,15),priorii)),15);
  593. iprior = priori;
  594. priori = priorii;
  595. }
  596. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  597. #pragma TCS_unrollexact=0
  598. #pragma TCS_unroll=0
  599. #endif
  600. for (i=_N; i<NM ; i++)
  601. { register spx_word16_t zetai = zeta[i];
  602. priori = prior[i];
  603. zeta[i] = PSHR32(ADD32(MULT16_16(QCONST16(.7f,15),zetai), MULT16_16(QCONST16(.3f,15),priori)),15);
  604. }
  605. Zframe = 0;
  606. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  607. #pragma TCS_unroll=4
  608. #pragma TCS_unrollexact=1
  609. #endif
  610. for ( i=N ; i<NM ; i++ )
  611. { Zframe = ADD32(Zframe, EXTEND32(zeta[i]));
  612. }
  613. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  614. #pragma TCS_unrollexact=0
  615. #pragma TCS_unroll=0
  616. #endif
  617. return Zframe;
  618. }
  619. void preprocess_compute_emgain(
  620. SpeexPreprocessState * restrict st,
  621. spx_word32_t * restrict ps,
  622. spx_word16_t Pframe,
  623. int NM
  624. )
  625. {
  626. register spx_word16_t * restrict zeta = st->zeta;
  627. register spx_word16_t * restrict prior = st->prior;
  628. register spx_word16_t * restrict gain = st->gain;
  629. register spx_word32_t * restrict old_ps = st->old_ps;
  630. register spx_word16_t * restrict post = st->post;
  631. register spx_word16_t * restrict gain2 = st->gain2;
  632. register int i;
  633. register int N=st->ps_size;
  634. for ( i=N ; i<NM ; ++i )
  635. {
  636. register spx_word32_t theta;
  637. register spx_word32_t MM;
  638. register spx_word16_t prior_ratio;
  639. register spx_word16_t P1;
  640. register spx_word16_t q;
  641. #ifdef FIXED_POINT
  642. register spx_word16_t tmp;
  643. #endif
  644. register spx_word16_t priori = prior[i];
  645. prior_ratio = PDIV32_16(SHL32(EXTEND32(priori), 15), ADD16(priori, SHL32(1,SNR_SHIFT)));
  646. theta = MULT16_32_P15(prior_ratio, QCONST32(1.f,EXPIN_SHIFT)+SHL32(EXTEND32(post[i]),EXPIN_SHIFT-SNR_SHIFT));
  647. MM = hypergeom_gain(theta);
  648. gain[i] = EXTRACT16(MIN32(Q15_ONE, MULT16_32_Q15(prior_ratio, MM)));
  649. old_ps[i] = MULT16_32_P15(QCONST16(.2f,15),old_ps[i]) + MULT16_32_P15(MULT16_16_P15(QCONST16(.8f,15),SQR16_Q15(gain[i])),ps[i]);
  650. P1 = QCONST16(.199f,15)+MULT16_16_Q15(QCONST16(.8f,15),qcurve (zeta[i]));
  651. q = Q15_ONE-MULT16_16_Q15(Pframe,P1);
  652. #ifdef FIXED_POINT
  653. theta = MIN32(theta, EXTEND32(32767));
  654. tmp = MULT16_16_Q15((SHL32(1,SNR_SHIFT)+priori),EXTRACT16(MIN32(Q15ONE,SHR32(spx_exp(-EXTRACT16(theta)),1))));
  655. tmp = MIN16(QCONST16(3.,SNR_SHIFT), tmp);
  656. tmp = EXTRACT16(PSHR32(MULT16_16(PDIV32_16(SHL32(EXTEND32(q),8),(Q15_ONE-q)),tmp),8));
  657. gain2[i]=DIV32_16(SHL32(EXTEND32(32767),SNR_SHIFT), ADD16(256,tmp));
  658. #else
  659. gain2[i]=1/(1.f + (q/(1.f-q))*(1+priori)*exp(-theta));
  660. #endif
  661. }
  662. filterbank_compute_psd16(st->bank,gain2+N, gain2);
  663. filterbank_compute_psd16(st->bank,gain+N, gain);
  664. }
  665. void preprocess_compute_linear_gain(
  666. SpeexPreprocessState * restrict st,
  667. spx_word32_t * restrict ps,
  668. int N
  669. )
  670. {
  671. register spx_word16_t * restrict gain_floor = st->gain_floor;
  672. register spx_word16_t * restrict prior = st->prior;
  673. register spx_word16_t * restrict gain = st->gain;
  674. register spx_word32_t * restrict old_ps = st->old_ps;
  675. register spx_word16_t * restrict post = st->post;
  676. register spx_word16_t * restrict gain2 = st->gain2;
  677. register int i;
  678. filterbank_compute_psd16(st->bank,gain_floor+N,gain_floor);
  679. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  680. #pragma TCS_unroll=4
  681. #pragma TCS_unrollexact=1
  682. #endif
  683. for (i=0;i<N;i++)
  684. {
  685. register spx_word32_t MM;
  686. register spx_word32_t theta;
  687. register spx_word16_t prior_ratio;
  688. register spx_word16_t tmp;
  689. register spx_word16_t p;
  690. register spx_word16_t g;
  691. register spx_word16_t gfi = gain_floor[i];
  692. prior_ratio = PDIV32_16(SHL32(EXTEND32(st->prior[i]), 15), ADD16(prior[i], SHL32(1,SNR_SHIFT)));
  693. theta = MULT16_32_P15(prior_ratio, QCONST32(1.f,EXPIN_SHIFT)+SHL32(EXTEND32(post[i]),EXPIN_SHIFT-SNR_SHIFT));
  694. MM = hypergeom_gain(theta);
  695. g = EXTRACT16(MIN32(Q15_ONE, MULT16_32_Q15(prior_ratio, MM)));
  696. p = gain2[i];
  697. g = VMUX( MULT16_16_Q15(QCONST16(.333f,15),g) > gain[i], MULT16_16(3,gain[i]), g);
  698. old_ps[i]= MULT16_32_P15(QCONST16(.2f,15),old_ps[i]) +
  699. MULT16_32_P15(MULT16_16_P15(QCONST16(.8f,15),SQR16_Q15(g)),ps[i]);
  700. g = VMUX( g < gfi, gfi, g );
  701. gain[i] = g;
  702. tmp = MULT16_16_P15(p,spx_sqrt(SHL32(EXTEND32(g),15))) +
  703. MULT16_16_P15(SUB16(Q15_ONE,p),spx_sqrt(SHL32(EXTEND32(gfi),15)));
  704. gain2[i]=SQR16_Q15(tmp);
  705. /* Use this if you want a log-domain MMSE estimator instead */
  706. /* gain2[i] = pow(g, p) * pow(gfi,1.f-p);*/
  707. }
  708. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  709. #pragma TCS_unrollexact=0
  710. #pragma TCS_unroll=0
  711. #endif
  712. }
  713. #if 0
  714. void preprocess_compute_bark_gain(
  715. SpeexPreprocessState * restrict st,
  716. int N,
  717. int NM
  718. )
  719. {
  720. register spx_word16_t * restrict gain_floor = st->gain_floor;
  721. register spx_word16_t * restrict gain = st->gain;
  722. register spx_word16_t * restrict gain2 = st->gain2;
  723. register int i;
  724. for (i=N;i<NM;i++)
  725. {
  726. register spx_word16_t tmp;
  727. register spx_word16_t p = gain2[i];
  728. register spx_word16_t gaini;
  729. register spx_word16_t gfi = gain_floor[i];
  730. gaini = MAX16(gain[i], gfi);
  731. gain[i] = gaini;
  732. tmp = MULT16_16_P15(p,spx_sqrt(SHL32(EXTEND32(gaini),15))) +
  733. MULT16_16_P15(SUB16(Q15_ONE,p),spx_sqrt(SHL32(EXTEND32(gfi),15)));
  734. gain2[i]=SQR16_Q15(tmp);
  735. }
  736. filterbank_compute_psd16(st->bank,gain2+N, gain2);
  737. }
  738. #endif
  739. void preprocess_apply_gain(
  740. SpeexPreprocessState * restrict st,
  741. int N
  742. )
  743. {
  744. register spx_word16_t * restrict ft = st->ft;
  745. register spx_word16_t * restrict gain2 = st->gain2;
  746. register int j, i;
  747. ft[0] = MULT16_16_P15(gain2[0],ft[0]);
  748. for (i=1,j=1; i<N ; i++,j+=2)
  749. {
  750. register spx_word16_t gain2i = gain2[i];
  751. register spx_word16_t ftj = ft[j];
  752. register spx_word16_t ftjj = ft[j+1];
  753. ft[j] = MULT16_16_P15(gain2i,ftj);
  754. ft[j+1] = MULT16_16_P15(gain2i,ftjj);
  755. }
  756. ft[(N<<1)-1] = MULT16_16_P15(gain2[N-1],ft[(N<<1)-1]);
  757. }
  758. #ifdef FIXED_POINT
  759. void preprocess_scale(
  760. SpeexPreprocessState * restrict st,
  761. int N
  762. )
  763. {
  764. register spx_word16_t * restrict frame = st->frame;
  765. register int shift = st->frame_shift;
  766. register int i;
  767. register int N2 = N << 1;
  768. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  769. #pragma TCS_unroll=4
  770. #pragma TCS_unrollexact=1
  771. #endif
  772. for ( i=0 ; i<N2 ;i++)
  773. { register spx_word16_t framei = frame[i];
  774. frame[i] = PSHR16(framei,shift);
  775. }
  776. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  777. #pragma TCS_unrollexact=0
  778. #pragma TCS_unroll=0
  779. #endif
  780. }
  781. #else
  782. void preprocess_apply_agc(
  783. SpeexPreprocessState * restrict st,
  784. int N
  785. )
  786. {
  787. register spx_word16_t max_sample=0;
  788. register spx_word16_t * restrict frame = st->frame;
  789. register int i;
  790. register int N2 = N << 1;
  791. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  792. #pragma TCS_unroll=4
  793. #pragma TCS_unrollexact=1
  794. #endif
  795. for (i=0;i<N2;i++)
  796. { register spx_word16_t framei = VABS(frame[i]);
  797. max_sample = VMUX( framei > max_sample, framei, max_sample);
  798. }
  799. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  800. #pragma TCS_unrollexact=0
  801. #pragma TCS_unroll=0
  802. #endif
  803. if ( max_sample > 28000.f )
  804. {
  805. float damp = 28000.f/max_sample;
  806. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  807. #pragma TCS_unroll=4
  808. #pragma TCS_unrollexact=1
  809. #endif
  810. for ( i=0 ; i< N2 ; i++ )
  811. { frame[i] *= damp;
  812. }
  813. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  814. #pragma TCS_unrollexact=0
  815. #pragma TCS_unroll=0
  816. #endif
  817. }
  818. }
  819. #endif
  820. void preprocess_update(
  821. SpeexPreprocessState * restrict st,
  822. spx_int16_t * restrict x,
  823. int N
  824. )
  825. {
  826. register spx_word16_t * restrict frame = st->frame;
  827. register spx_word16_t * restrict window = st->window;
  828. register spx_word16_t * restrict outbuf = st->outbuf;
  829. register int framesize = st->frame_size;
  830. register int N2 = N << 1;
  831. register int N3 = N2 - framesize;
  832. register int N4 = (framesize) - N3;
  833. register int i;
  834. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  835. #pragma TCS_unroll=4
  836. #pragma TCS_unrollexact=1
  837. #endif
  838. for ( i=0 ; i<N2 ; i++)
  839. { register spx_word16_t fi = frame[i];
  840. register spx_word16_t wi = window[i];
  841. frame[i] = MULT16_16_Q15(fi, wi);
  842. }
  843. for (i=0;i<N3;i++)
  844. { x[i] = outbuf[i] + frame[i];
  845. }
  846. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  847. #pragma TCS_unrollexact=0
  848. #pragma TCS_unroll=0
  849. #endif
  850. for ( i=0;i<N4;i++)
  851. { x[N3+i] = frame[N3+i];
  852. }
  853. memcpy(outbuf, frame+framesize, (N3) * sizeof(spx_word16_t));
  854. }
  855. #define OVERRIDE_SPEEX_PREPROCESS_RUN
  856. int speex_preprocess_run(SpeexPreprocessState * restrict st, spx_int16_t * restrict x)
  857. {
  858. register int i, N, M, NM;
  859. register spx_word32_t * restrict ps=st->ps;
  860. register spx_word32_t Zframe;
  861. register spx_word16_t Pframe;
  862. st->nb_adapt++;
  863. st->min_count++;
  864. N = st->ps_size;
  865. M = st->nbands;
  866. NM = N + M;
  867. preprocess_residue_echo(st, N, NM);
  868. preprocess_analysis(st, x);
  869. update_noise_prob(st);
  870. preprocess_update_noise(st, ps, N);
  871. if ( st->nb_adapt == 1 )
  872. { memcpy(st->old_ps, ps, (NM) * sizeof(spx_word32_t));
  873. }
  874. preprocess_compute_SNR(st, ps, NM);
  875. Zframe = preprocess_smooth_SNR(st, N, NM);
  876. {
  877. register spx_word16_t effective_echo_suppress;
  878. Pframe = QCONST16(.1f,15)+MULT16_16_Q15(QCONST16(.899f,15),qcurve(DIV32_16(Zframe,M)));
  879. effective_echo_suppress = EXTRACT16(PSHR32(ADD32(MULT16_16(SUB16(Q15_ONE,Pframe), st->echo_suppress),
  880. MULT16_16(Pframe, st->echo_suppress_active)),15));
  881. compute_gain_floor(st->noise_suppress, effective_echo_suppress, st->noise+N, st->echo_noise+N, st->gain_floor+N, M);
  882. }
  883. preprocess_compute_emgain(st, ps, Pframe, NM);
  884. preprocess_compute_linear_gain(st, ps, N);
  885. if (!st->denoise_enabled)
  886. {
  887. register spx_word16_t * restrict gain2 = st->gain2;
  888. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  889. #pragma TCS_unroll=4
  890. #pragma TCS_unrollexact=1
  891. #endif
  892. for ( i=0 ; i<NM ; i++ )
  893. { gain2[i] = Q15_ONE;
  894. }
  895. #if (TM_UNROLL && TM_UNROLL_SPEEXPREPROCESSRUN)
  896. #pragma TCS_unrollexact=0
  897. #pragma TCS_unroll=0
  898. #endif
  899. }
  900. preprocess_apply_gain(st, N);
  901. #ifndef FIXED_POINT
  902. if (st->agc_enabled)
  903. { speex_compute_agc(st, Pframe, st->ft);
  904. }
  905. #endif
  906. spx_ifft(st->fft_lookup, st->ft, st->frame);
  907. #ifdef FIXED_POINT
  908. preprocess_scale(st, N);
  909. #endif
  910. #ifndef FIXED_POINT
  911. if ( st->agc_enabled )
  912. { preprocess_apply_agc(st, N);
  913. }
  914. #endif
  915. preprocess_update(st, x, N);
  916. if ( st->vad_enabled )
  917. {
  918. if (Pframe > st->speech_prob_start || (st->was_speech && Pframe > st->speech_prob_continue))
  919. { st->was_speech=1;
  920. return 1;
  921. } else
  922. { st->was_speech=0;
  923. return 0;
  924. }
  925. } else
  926. { return 1;
  927. }
  928. }