You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

342 lines
11KB

  1. /*
  2. * Copyright (c) 2016 Paul B Mahol
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. /**
  21. * @file
  22. * filter for manipulating frame metadata
  23. */
  24. #include "libavutil/avassert.h"
  25. #include "libavutil/avstring.h"
  26. #include "libavutil/eval.h"
  27. #include "libavutil/fifo.h"
  28. #include "libavutil/internal.h"
  29. #include "libavutil/opt.h"
  30. #include "libavutil/pixelutils.h"
  31. #include "avfilter.h"
  32. #include "audio.h"
  33. #include "formats.h"
  34. #include "internal.h"
  35. #include "video.h"
  36. enum MetadataMode {
  37. METADATA_SELECT,
  38. METADATA_ADD,
  39. METADATA_MODIFY,
  40. METADATA_DELETE,
  41. METADATA_PRINT,
  42. METADATA_NB
  43. };
  44. enum MetadataFunction {
  45. METADATAF_STRING,
  46. METADATAF_LESS,
  47. METADATAF_EQUAL,
  48. METADATAF_GREATER,
  49. METADATAF_EXPR,
  50. METADATAF_NB
  51. };
  52. static const char *const var_names[] = {
  53. "VALUE1",
  54. "VALUE2",
  55. NULL
  56. };
  57. enum var_name {
  58. VAR_VALUE1,
  59. VAR_VALUE2,
  60. VAR_VARS_NB
  61. };
  62. typedef struct MetadataContext {
  63. const AVClass *class;
  64. int mode;
  65. char *key;
  66. char *value;
  67. int length;
  68. int function;
  69. char *expr_str;
  70. AVExpr *expr;
  71. double var_values[VAR_VARS_NB];
  72. int (*compare)(struct MetadataContext *s,
  73. const char *value1, const char *value2, size_t length);
  74. } MetadataContext;
  75. #define OFFSET(x) offsetof(MetadataContext, x)
  76. #define DEFINE_OPTIONS(filt_name, FLAGS) \
  77. static const AVOption filt_name##_options[] = { \
  78. { "mode", "set a mode of operation", OFFSET(mode), AV_OPT_TYPE_INT, {.i64 = 0 }, 0, METADATA_NB-1, FLAGS, "mode" }, \
  79. { "select", "select frame", 0, AV_OPT_TYPE_CONST, {.i64 = METADATA_SELECT }, 0, 0, FLAGS, "mode" }, \
  80. { "add", "add new metadata", 0, AV_OPT_TYPE_CONST, {.i64 = METADATA_ADD }, 0, 0, FLAGS, "mode" }, \
  81. { "modify", "modify metadata", 0, AV_OPT_TYPE_CONST, {.i64 = METADATA_MODIFY }, 0, 0, FLAGS, "mode" }, \
  82. { "delete", "delete metadata", 0, AV_OPT_TYPE_CONST, {.i64 = METADATA_DELETE }, 0, 0, FLAGS, "mode" }, \
  83. { "print", "print metadata", 0, AV_OPT_TYPE_CONST, {.i64 = METADATA_PRINT }, 0, 0, FLAGS, "mode" }, \
  84. { "key", "set metadata key", OFFSET(key), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, FLAGS }, \
  85. { "value", "set metadata value", OFFSET(value), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, FLAGS }, \
  86. { "function", "function for comparing values", OFFSET(function), AV_OPT_TYPE_INT, {.i64 = 0 }, 0, METADATAF_NB-1, FLAGS, "function" }, \
  87. { "string", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = METADATAF_STRING }, 0, 3, FLAGS, "function" }, \
  88. { "less", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = METADATAF_LESS }, 0, 3, FLAGS, "function" }, \
  89. { "equal", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = METADATAF_EQUAL }, 0, 3, FLAGS, "function" }, \
  90. { "greater", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = METADATAF_GREATER }, 0, 3, FLAGS, "function" }, \
  91. { "expr", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = METADATAF_EXPR }, 0, 3, FLAGS, "function" }, \
  92. { "expr", "set expression for expr function", OFFSET(expr_str), AV_OPT_TYPE_STRING, {.str = NULL }, 0, 0, FLAGS }, \
  93. { "length", "compare up to N chars for string function", OFFSET(length), AV_OPT_TYPE_INT, {.i64 = INT_MAX }, 1, INT_MAX, FLAGS }, \
  94. { NULL } \
  95. }
  96. static int string(MetadataContext *s, const char *value1, const char *value2, size_t length)
  97. {
  98. return !strncmp(value1, value2, length);
  99. }
  100. static int equal(MetadataContext *s, const char *value1, const char *value2, size_t length)
  101. {
  102. float f1, f2;
  103. if (sscanf(value1, "%f", &f1) + sscanf(value2, "%f", &f2) != 2)
  104. return 0;
  105. return f1 == f2;
  106. }
  107. static int less(MetadataContext *s, const char *value1, const char *value2, size_t length)
  108. {
  109. float f1, f2;
  110. if (sscanf(value1, "%f", &f1) + sscanf(value2, "%f", &f2) != 2)
  111. return 0;
  112. return f1 < f2;
  113. }
  114. static int greater(MetadataContext *s, const char *value1, const char *value2, size_t length)
  115. {
  116. float f1, f2;
  117. if (sscanf(value1, "%f", &f1) + sscanf(value2, "%f", &f2) != 2)
  118. return 0;
  119. return f1 > f2;
  120. }
  121. static int parse_expr(MetadataContext *s, const char *value1, const char *value2, size_t length)
  122. {
  123. double f1, f2;
  124. if (sscanf(value1, "%lf", &f1) + sscanf(value2, "%lf", &f2) != 2)
  125. return 0;
  126. s->var_values[VAR_VALUE1] = f1;
  127. s->var_values[VAR_VALUE2] = f2;
  128. return av_expr_eval(s->expr, s->var_values, NULL);
  129. }
  130. static av_cold int init(AVFilterContext *ctx)
  131. {
  132. MetadataContext *s = ctx->priv;
  133. int ret;
  134. if (!s->key && s->mode != METADATA_PRINT) {
  135. av_log(ctx, AV_LOG_WARNING, "Metadata key must be set\n");
  136. return AVERROR(EINVAL);
  137. }
  138. if ((s->mode == METADATA_MODIFY ||
  139. s->mode == METADATA_ADD) && !s->value) {
  140. av_log(ctx, AV_LOG_WARNING, "Missing metadata value\n");
  141. return AVERROR(EINVAL);
  142. }
  143. switch (s->function) {
  144. case METADATAF_STRING:
  145. s->compare = string;
  146. break;
  147. case METADATAF_LESS:
  148. s->compare = less;
  149. break;
  150. case METADATAF_EQUAL:
  151. s->compare = equal;
  152. break;
  153. case METADATAF_GREATER:
  154. s->compare = greater;
  155. break;
  156. case METADATAF_EXPR:
  157. s->compare = parse_expr;
  158. break;
  159. default:
  160. av_assert0(0);
  161. };
  162. if (s->function == METADATAF_EXPR) {
  163. if (!s->expr_str) {
  164. av_log(ctx, AV_LOG_WARNING, "expr option not set\n");
  165. return AVERROR(EINVAL);
  166. }
  167. if ((ret = av_expr_parse(&s->expr, s->expr_str,
  168. var_names, NULL, NULL, NULL, NULL, 0, ctx)) < 0) {
  169. av_log(ctx, AV_LOG_ERROR, "Error while parsing expression '%s'\n", s->expr_str);
  170. return ret;
  171. }
  172. }
  173. return 0;
  174. }
  175. static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
  176. {
  177. AVFilterContext *ctx = inlink->dst;
  178. AVFilterLink *outlink = ctx->outputs[0];
  179. MetadataContext *s = ctx->priv;
  180. AVDictionary *metadata = av_frame_get_metadata(frame);
  181. AVDictionaryEntry *e;
  182. if (!metadata)
  183. return ff_filter_frame(outlink, frame);
  184. e = av_dict_get(metadata, !s->key ? "" : s->key, NULL,
  185. !s->key ? AV_DICT_IGNORE_SUFFIX: 0);
  186. switch (s->mode) {
  187. case METADATA_SELECT:
  188. if (!s->value && e && e->value) {
  189. return ff_filter_frame(outlink, frame);
  190. } else if (s->value && e && e->value &&
  191. s->compare(s, e->value, s->value, s->length)) {
  192. return ff_filter_frame(outlink, frame);
  193. }
  194. break;
  195. case METADATA_ADD:
  196. if (e && e->value) {
  197. ;
  198. } else {
  199. av_dict_set(&metadata, s->key, s->value, 0);
  200. }
  201. return ff_filter_frame(outlink, frame);
  202. break;
  203. case METADATA_MODIFY:
  204. if (e && e->value) {
  205. av_dict_set(&metadata, s->key, s->value, 0);
  206. }
  207. return ff_filter_frame(outlink, frame);
  208. break;
  209. case METADATA_PRINT:
  210. if (!s->key && e) {
  211. av_log(ctx, AV_LOG_INFO, "frame %"PRId64" pts %"PRId64"\n", inlink->frame_count, frame->pts);
  212. av_log(ctx, AV_LOG_INFO, "%s=%s\n", e->key, e->value);
  213. while ((e = av_dict_get(metadata, "", e, AV_DICT_IGNORE_SUFFIX)) != NULL) {
  214. av_log(ctx, AV_LOG_INFO, "%s=%s\n", e->key, e->value);
  215. }
  216. } else if (e && e->value && (!s->value || (e->value && s->compare(s, e->value, s->value, s->length)))) {
  217. av_log(ctx, AV_LOG_INFO, "frame %"PRId64" pts %"PRId64"\n", inlink->frame_count, frame->pts);
  218. av_log(ctx, AV_LOG_INFO, "%s=%s\n", s->key, e->value);
  219. }
  220. return ff_filter_frame(outlink, frame);
  221. break;
  222. case METADATA_DELETE:
  223. if (e && e->value && s->value && s->compare(s, e->value, s->value, s->length)) {
  224. av_dict_set(&metadata, s->key, NULL, 0);
  225. } else if (e && e->value) {
  226. av_dict_set(&metadata, s->key, NULL, 0);
  227. }
  228. return ff_filter_frame(outlink, frame);
  229. break;
  230. default:
  231. av_assert0(0);
  232. };
  233. av_frame_free(&frame);
  234. return 0;
  235. }
  236. #if CONFIG_AMETADATA_FILTER
  237. DEFINE_OPTIONS(ametadata, AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM);
  238. AVFILTER_DEFINE_CLASS(ametadata);
  239. static const AVFilterPad ainputs[] = {
  240. {
  241. .name = "default",
  242. .type = AVMEDIA_TYPE_AUDIO,
  243. .filter_frame = filter_frame,
  244. },
  245. { NULL }
  246. };
  247. static const AVFilterPad aoutputs[] = {
  248. {
  249. .name = "default",
  250. .type = AVMEDIA_TYPE_AUDIO,
  251. },
  252. { NULL }
  253. };
  254. AVFilter ff_af_ametadata = {
  255. .name = "ametadata",
  256. .description = NULL_IF_CONFIG_SMALL("Manipulate audio frame metadata."),
  257. .priv_size = sizeof(MetadataContext),
  258. .priv_class = &ametadata_class,
  259. .init = init,
  260. .query_formats = ff_query_formats_all,
  261. .inputs = ainputs,
  262. .outputs = aoutputs,
  263. .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,
  264. };
  265. #endif /* CONFIG_AMETADATA_FILTER */
  266. #if CONFIG_METADATA_FILTER
  267. DEFINE_OPTIONS(metadata, AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM);
  268. AVFILTER_DEFINE_CLASS(metadata);
  269. static const AVFilterPad inputs[] = {
  270. {
  271. .name = "default",
  272. .type = AVMEDIA_TYPE_VIDEO,
  273. .filter_frame = filter_frame,
  274. },
  275. { NULL }
  276. };
  277. static const AVFilterPad outputs[] = {
  278. {
  279. .name = "default",
  280. .type = AVMEDIA_TYPE_VIDEO,
  281. },
  282. { NULL }
  283. };
  284. AVFilter ff_vf_metadata = {
  285. .name = "metadata",
  286. .description = NULL_IF_CONFIG_SMALL("Manipulate video frame metadata."),
  287. .priv_size = sizeof(MetadataContext),
  288. .priv_class = &metadata_class,
  289. .init = init,
  290. .inputs = inputs,
  291. .outputs = outputs,
  292. .flags = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,
  293. };
  294. #endif /* CONFIG_METADATA_FILTER */