You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

390 lines
14KB

  1. /*
  2. * Copyright (C) 2001-2010 Krzysztof Foltman, Markus Schmidt, Thor Harald Johansen
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #include "libavutil/channel_layout.h"
  21. #include "libavutil/opt.h"
  22. #include "avfilter.h"
  23. #include "audio.h"
  24. #include "formats.h"
  25. typedef struct StereoToolsContext {
  26. const AVClass *class;
  27. int softclip;
  28. int mute_l;
  29. int mute_r;
  30. int phase_l;
  31. int phase_r;
  32. int mode;
  33. int bmode_in;
  34. int bmode_out;
  35. double slev;
  36. double sbal;
  37. double mlev;
  38. double mpan;
  39. double phase;
  40. double base;
  41. double delay;
  42. double balance_in;
  43. double balance_out;
  44. double phase_sin_coef;
  45. double phase_cos_coef;
  46. double sc_level;
  47. double inv_atan_shape;
  48. double level_in;
  49. double level_out;
  50. double *buffer;
  51. int length;
  52. int pos;
  53. } StereoToolsContext;
  54. #define OFFSET(x) offsetof(StereoToolsContext, x)
  55. #define A AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_RUNTIME_PARAM
  56. static const AVOption stereotools_options[] = {
  57. { "level_in", "set level in", OFFSET(level_in), AV_OPT_TYPE_DOUBLE, {.dbl=1}, 0.015625, 64, A },
  58. { "level_out", "set level out", OFFSET(level_out), AV_OPT_TYPE_DOUBLE, {.dbl=1}, 0.015625, 64, A },
  59. { "balance_in", "set balance in", OFFSET(balance_in), AV_OPT_TYPE_DOUBLE, {.dbl=0}, -1, 1, A },
  60. { "balance_out", "set balance out", OFFSET(balance_out), AV_OPT_TYPE_DOUBLE, {.dbl=0}, -1, 1, A },
  61. { "softclip", "enable softclip", OFFSET(softclip), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, A },
  62. { "mutel", "mute L", OFFSET(mute_l), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, A },
  63. { "muter", "mute R", OFFSET(mute_r), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, A },
  64. { "phasel", "phase L", OFFSET(phase_l), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, A },
  65. { "phaser", "phase R", OFFSET(phase_r), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, A },
  66. { "mode", "set stereo mode", OFFSET(mode), AV_OPT_TYPE_INT, {.i64=0}, 0, 10, A, "mode" },
  67. { "lr>lr", 0, 0, AV_OPT_TYPE_CONST, {.i64=0}, 0, 0, A, "mode" },
  68. { "lr>ms", 0, 0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, A, "mode" },
  69. { "ms>lr", 0, 0, AV_OPT_TYPE_CONST, {.i64=2}, 0, 0, A, "mode" },
  70. { "lr>ll", 0, 0, AV_OPT_TYPE_CONST, {.i64=3}, 0, 0, A, "mode" },
  71. { "lr>rr", 0, 0, AV_OPT_TYPE_CONST, {.i64=4}, 0, 0, A, "mode" },
  72. { "lr>l+r", 0, 0, AV_OPT_TYPE_CONST, {.i64=5}, 0, 0, A, "mode" },
  73. { "lr>rl", 0, 0, AV_OPT_TYPE_CONST, {.i64=6}, 0, 0, A, "mode" },
  74. { "ms>ll", 0, 0, AV_OPT_TYPE_CONST, {.i64=7}, 0, 0, A, "mode" },
  75. { "ms>rr", 0, 0, AV_OPT_TYPE_CONST, {.i64=8}, 0, 0, A, "mode" },
  76. { "ms>rl", 0, 0, AV_OPT_TYPE_CONST, {.i64=9}, 0, 0, A, "mode" },
  77. { "lr>l-r", 0, 0, AV_OPT_TYPE_CONST, {.i64=10}, 0, 0, A, "mode" },
  78. { "slev", "set side level", OFFSET(slev), AV_OPT_TYPE_DOUBLE, {.dbl=1}, 0.015625, 64, A },
  79. { "sbal", "set side balance", OFFSET(sbal), AV_OPT_TYPE_DOUBLE, {.dbl=0}, -1, 1, A },
  80. { "mlev", "set middle level", OFFSET(mlev), AV_OPT_TYPE_DOUBLE, {.dbl=1}, 0.015625, 64, A },
  81. { "mpan", "set middle pan", OFFSET(mpan), AV_OPT_TYPE_DOUBLE, {.dbl=0}, -1, 1, A },
  82. { "base", "set stereo base", OFFSET(base), AV_OPT_TYPE_DOUBLE, {.dbl=0}, -1, 1, A },
  83. { "delay", "set delay", OFFSET(delay), AV_OPT_TYPE_DOUBLE, {.dbl=0}, -20, 20, A },
  84. { "sclevel", "set S/C level", OFFSET(sc_level), AV_OPT_TYPE_DOUBLE, {.dbl=1}, 1, 100, A },
  85. { "phase", "set stereo phase", OFFSET(phase), AV_OPT_TYPE_DOUBLE, {.dbl=0}, 0, 360, A },
  86. { "bmode_in", "set balance in mode", OFFSET(bmode_in), AV_OPT_TYPE_INT, {.i64=0}, 0, 2, A, "bmode" },
  87. { "balance", 0, 0, AV_OPT_TYPE_CONST, {.i64=0}, 0, 0, A, "bmode" },
  88. { "amplitude", 0, 0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, A, "bmode" },
  89. { "power", 0, 0, AV_OPT_TYPE_CONST, {.i64=2}, 0, 0, A, "bmode" },
  90. { "bmode_out", "set balance out mode", OFFSET(bmode_out), AV_OPT_TYPE_INT, {.i64=0}, 0, 2, A, "bmode" },
  91. { NULL }
  92. };
  93. AVFILTER_DEFINE_CLASS(stereotools);
  94. static int query_formats(AVFilterContext *ctx)
  95. {
  96. AVFilterFormats *formats = NULL;
  97. AVFilterChannelLayouts *layout = NULL;
  98. int ret;
  99. if ((ret = ff_add_format (&formats, AV_SAMPLE_FMT_DBL )) < 0 ||
  100. (ret = ff_set_common_formats (ctx , formats )) < 0 ||
  101. (ret = ff_add_channel_layout (&layout , AV_CH_LAYOUT_STEREO)) < 0 ||
  102. (ret = ff_set_common_channel_layouts (ctx , layout )) < 0)
  103. return ret;
  104. formats = ff_all_samplerates();
  105. return ff_set_common_samplerates(ctx, formats);
  106. }
  107. static int config_input(AVFilterLink *inlink)
  108. {
  109. AVFilterContext *ctx = inlink->dst;
  110. StereoToolsContext *s = ctx->priv;
  111. s->length = FFALIGN(inlink->sample_rate / 10, 2);
  112. if (!s->buffer)
  113. s->buffer = av_calloc(s->length, sizeof(*s->buffer));
  114. if (!s->buffer)
  115. return AVERROR(ENOMEM);
  116. s->inv_atan_shape = 1.0 / atan(s->sc_level);
  117. s->phase_cos_coef = cos(s->phase / 180 * M_PI);
  118. s->phase_sin_coef = sin(s->phase / 180 * M_PI);
  119. return 0;
  120. }
  121. static int filter_frame(AVFilterLink *inlink, AVFrame *in)
  122. {
  123. AVFilterContext *ctx = inlink->dst;
  124. AVFilterLink *outlink = ctx->outputs[0];
  125. StereoToolsContext *s = ctx->priv;
  126. const double *src = (const double *)in->data[0];
  127. const double sb = s->base < 0 ? s->base * 0.5 : s->base;
  128. const double sbal = 1 + s->sbal;
  129. const double mpan = 1 + s->mpan;
  130. const double slev = s->slev;
  131. const double mlev = s->mlev;
  132. const double balance_in = s->balance_in;
  133. const double balance_out = s->balance_out;
  134. const double level_in = s->level_in;
  135. const double level_out = s->level_out;
  136. const double sc_level = s->sc_level;
  137. const double delay = s->delay;
  138. const int length = s->length;
  139. const int mute_l = s->mute_l;
  140. const int mute_r = s->mute_r;
  141. const int phase_l = s->phase_l;
  142. const int phase_r = s->phase_r;
  143. double *buffer = s->buffer;
  144. AVFrame *out;
  145. double *dst;
  146. int nbuf = inlink->sample_rate * (fabs(delay) / 1000.);
  147. int n;
  148. nbuf -= nbuf % 2;
  149. if (av_frame_is_writable(in)) {
  150. out = in;
  151. } else {
  152. out = ff_get_audio_buffer(outlink, in->nb_samples);
  153. if (!out) {
  154. av_frame_free(&in);
  155. return AVERROR(ENOMEM);
  156. }
  157. av_frame_copy_props(out, in);
  158. }
  159. dst = (double *)out->data[0];
  160. for (n = 0; n < in->nb_samples; n++, src += 2, dst += 2) {
  161. double L = src[0], R = src[1], l, r, m, S, gl, gr, gd;
  162. L *= level_in;
  163. R *= level_in;
  164. gl = 1. - FFMAX(0., balance_in);
  165. gr = 1. + FFMIN(0., balance_in);
  166. switch (s->bmode_in) {
  167. case 1:
  168. gd = gl - gr;
  169. gl = 1. + gd;
  170. gr = 1. - gd;
  171. break;
  172. case 2:
  173. if (balance_in < 0.) {
  174. gr = FFMAX(0.5, gr);
  175. gl = 1. / gr;
  176. } else if (balance_in > 0.) {
  177. gl = FFMAX(0.5, gl);
  178. gr = 1. / gl;
  179. }
  180. break;
  181. }
  182. L *= gl;
  183. R *= gr;
  184. if (s->softclip) {
  185. R = s->inv_atan_shape * atan(R * sc_level);
  186. L = s->inv_atan_shape * atan(L * sc_level);
  187. }
  188. switch (s->mode) {
  189. case 0:
  190. m = (L + R) * 0.5;
  191. S = (L - R) * 0.5;
  192. l = m * mlev * FFMIN(1., 2. - mpan) + S * slev * FFMIN(1., 2. - sbal);
  193. r = m * mlev * FFMIN(1., mpan) - S * slev * FFMIN(1., sbal);
  194. L = l;
  195. R = r;
  196. break;
  197. case 1:
  198. l = L * FFMIN(1., 2. - sbal);
  199. r = R * FFMIN(1., sbal);
  200. L = 0.5 * (l + r) * mlev;
  201. R = 0.5 * (l - r) * slev;
  202. break;
  203. case 2:
  204. l = L * mlev * FFMIN(1., 2. - mpan) + R * slev * FFMIN(1., 2. - sbal);
  205. r = L * mlev * FFMIN(1., mpan) - R * slev * FFMIN(1., sbal);
  206. L = l;
  207. R = r;
  208. break;
  209. case 3:
  210. R = L;
  211. break;
  212. case 4:
  213. L = R;
  214. break;
  215. case 5:
  216. L = (L + R) * 0.5;
  217. R = L;
  218. break;
  219. case 6:
  220. l = L;
  221. L = R;
  222. R = l;
  223. m = (L + R) * 0.5;
  224. S = (L - R) * 0.5;
  225. l = m * mlev * FFMIN(1., 2. - mpan) + S * slev * FFMIN(1., 2. - sbal);
  226. r = m * mlev * FFMIN(1., mpan) - S * slev * FFMIN(1., sbal);
  227. L = l;
  228. R = r;
  229. break;
  230. case 7:
  231. l = L * mlev * FFMIN(1., 2. - mpan) + R * slev * FFMIN(1., 2. - sbal);
  232. L = l;
  233. R = l;
  234. break;
  235. case 8:
  236. r = L * mlev * FFMIN(1., mpan) - R * slev * FFMIN(1., sbal);
  237. L = r;
  238. R = r;
  239. break;
  240. case 9:
  241. l = L * mlev * FFMIN(1., 2. - mpan) + R * slev * FFMIN(1., 2. - sbal);
  242. r = L * mlev * FFMIN(1., mpan) - R * slev * FFMIN(1., sbal);
  243. L = r;
  244. R = l;
  245. break;
  246. case 10:
  247. L = (L - R) * 0.5;
  248. R = L;
  249. break;
  250. }
  251. L *= 1. - mute_l;
  252. R *= 1. - mute_r;
  253. L *= (2. * (1. - phase_l)) - 1.;
  254. R *= (2. * (1. - phase_r)) - 1.;
  255. buffer[s->pos ] = L;
  256. buffer[s->pos+1] = R;
  257. if (delay > 0.) {
  258. R = buffer[(s->pos - (int)nbuf + 1 + length) % length];
  259. } else if (delay < 0.) {
  260. L = buffer[(s->pos - (int)nbuf + length) % length];
  261. }
  262. l = L + sb * L - sb * R;
  263. r = R + sb * R - sb * L;
  264. L = l;
  265. R = r;
  266. l = L * s->phase_cos_coef - R * s->phase_sin_coef;
  267. r = L * s->phase_sin_coef + R * s->phase_cos_coef;
  268. L = l;
  269. R = r;
  270. s->pos = (s->pos + 2) % s->length;
  271. gl = 1. - FFMAX(0., balance_out);
  272. gr = 1. + FFMIN(0., balance_out);
  273. switch (s->bmode_out) {
  274. case 1:
  275. gd = gl - gr;
  276. gl = 1. + gd;
  277. gr = 1. - gd;
  278. break;
  279. case 2:
  280. if (balance_out < 0.) {
  281. gr = FFMAX(0.5, gr);
  282. gl = 1. / gr;
  283. } else if (balance_out > 0.) {
  284. gl = FFMAX(0.5, gl);
  285. gr = 1. / gl;
  286. }
  287. break;
  288. }
  289. L *= gl;
  290. R *= gr;
  291. L *= level_out;
  292. R *= level_out;
  293. if (ctx->is_disabled) {
  294. dst[0] = src[0];
  295. dst[1] = src[1];
  296. } else {
  297. dst[0] = L;
  298. dst[1] = R;
  299. }
  300. }
  301. if (out != in)
  302. av_frame_free(&in);
  303. return ff_filter_frame(outlink, out);
  304. }
  305. static int process_command(AVFilterContext *ctx, const char *cmd, const char *args,
  306. char *res, int res_len, int flags)
  307. {
  308. int ret;
  309. ret = ff_filter_process_command(ctx, cmd, args, res, res_len, flags);
  310. if (ret < 0)
  311. return ret;
  312. return config_input(ctx->inputs[0]);
  313. }
  314. static av_cold void uninit(AVFilterContext *ctx)
  315. {
  316. StereoToolsContext *s = ctx->priv;
  317. av_freep(&s->buffer);
  318. }
  319. static const AVFilterPad inputs[] = {
  320. {
  321. .name = "default",
  322. .type = AVMEDIA_TYPE_AUDIO,
  323. .filter_frame = filter_frame,
  324. .config_props = config_input,
  325. },
  326. { NULL }
  327. };
  328. static const AVFilterPad outputs[] = {
  329. {
  330. .name = "default",
  331. .type = AVMEDIA_TYPE_AUDIO,
  332. },
  333. { NULL }
  334. };
  335. AVFilter ff_af_stereotools = {
  336. .name = "stereotools",
  337. .description = NULL_IF_CONFIG_SMALL("Apply various stereo tools."),
  338. .query_formats = query_formats,
  339. .priv_size = sizeof(StereoToolsContext),
  340. .priv_class = &stereotools_class,
  341. .uninit = uninit,
  342. .inputs = inputs,
  343. .outputs = outputs,
  344. .process_command = process_command,
  345. .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,
  346. };