You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

344 lines
11KB

  1. /*
  2. * Copyright (c) 2016 Paul B Mahol
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. /**
  21. * @file
  22. * filter for manipulating frame metadata
  23. */
  24. #include <float.h>
  25. #include "libavutil/avassert.h"
  26. #include "libavutil/avstring.h"
  27. #include "libavutil/eval.h"
  28. #include "libavutil/fifo.h"
  29. #include "libavutil/internal.h"
  30. #include "libavutil/opt.h"
  31. #include "libavutil/pixelutils.h"
  32. #include "avfilter.h"
  33. #include "audio.h"
  34. #include "formats.h"
  35. #include "internal.h"
  36. #include "video.h"
  /**
   * Operation selected through the "mode" option.
   * The numeric values are stored in MetadataContext.mode and used as the
   * switch selector in filter_frame().
   */
  enum MetadataMode {
      METADATA_SELECT = 0, /* option constant "select" */
      METADATA_ADD,        /* option constant "add"    */
      METADATA_MODIFY,     /* option constant "modify" */
      METADATA_DELETE,     /* option constant "delete" */
      METADATA_PRINT,      /* option constant "print"  */
      METADATA_NB          /* number of modes; METADATA_NB-1 bounds the option */
  };
  /**
   * Comparison selected through the "function" option.
   * init() maps each value to the callback stored in MetadataContext.compare.
   */
  enum MetadataFunction {
      METADATAF_STRING = 0, /* option constant "string"  -> string()     */
      METADATAF_LESS,       /* option constant "less"    -> less()       */
      METADATAF_EQUAL,      /* option constant "equal"   -> equal()      */
      METADATAF_GREATER,    /* option constant "greater" -> greater()    */
      METADATAF_EXPR,       /* option constant "expr"    -> parse_expr() */
      METADATAF_NB          /* number of functions; bounds the option range */
  };
  /*
   * Variable names handed to av_expr_parse() for the "expr" function.
   * The list is NULL-terminated and its order matches enum var_name.
   */
  static const char *const var_names[] = { "VALUE1", "VALUE2", NULL };
  /* Indices into MetadataContext.var_values, in the same order as var_names[]. */
  enum var_name {
      VAR_VALUE1 = 0, /* slot for "VALUE1" */
      VAR_VALUE2,     /* slot for "VALUE2" */
      VAR_VARS_NB     /* number of variables; sizes var_values[] */
  };
  63. typedef struct MetadataContext {
  64. const AVClass *class;
  65. int mode;
  66. char *key;
  67. char *value;
  68. int length;
  69. int function;
  70. char *expr_str;
  71. AVExpr *expr;
  72. double var_values[VAR_VARS_NB];
  73. int (*compare)(struct MetadataContext *s,
  74. const char *value1, const char *value2, size_t length);
  75. } MetadataContext;
  /* Byte offset of member x inside MetadataContext, used by the option table. */
  #define OFFSET(x) offsetof(MetadataContext, x)

  /**
   * Define the static option table <filt_name>_options.
   *
   * @param filt_name  prefix of the generated array name
   * @param FLAGS      option flags applied to every entry
   *
   * Note that "expr" appears twice: once as a named constant of the
   * "function" unit and once as the string option holding the expression.
   */
  #define DEFINE_OPTIONS(filt_name, FLAGS) \
  static const AVOption filt_name##_options[] = { \
      /* operation performed on each frame */ \
      { "mode",     "set a mode of operation",                   OFFSET(mode),     AV_OPT_TYPE_INT,    {.i64 = 0 },                 0, METADATA_NB-1,  FLAGS, "mode" }, \
      {   "select",   "select frame",                            0,                AV_OPT_TYPE_CONST,  {.i64 = METADATA_SELECT },   0, 0,              FLAGS, "mode" }, \
      {   "add",      "add new metadata",                        0,                AV_OPT_TYPE_CONST,  {.i64 = METADATA_ADD },      0, 0,              FLAGS, "mode" }, \
      {   "modify",   "modify metadata",                         0,                AV_OPT_TYPE_CONST,  {.i64 = METADATA_MODIFY },   0, 0,              FLAGS, "mode" }, \
      {   "delete",   "delete metadata",                         0,                AV_OPT_TYPE_CONST,  {.i64 = METADATA_DELETE },   0, 0,              FLAGS, "mode" }, \
      {   "print",    "print metadata",                          0,                AV_OPT_TYPE_CONST,  {.i64 = METADATA_PRINT },    0, 0,              FLAGS, "mode" }, \
      /* entry to look up and value to set or compare against */ \
      { "key",      "set metadata key",                          OFFSET(key),      AV_OPT_TYPE_STRING, {.str = NULL },              0, 0,              FLAGS }, \
      { "value",    "set metadata value",                        OFFSET(value),    AV_OPT_TYPE_STRING, {.str = NULL },              0, 0,              FLAGS }, \
      /* comparison applied between the frame's value and "value" */ \
      { "function", "function for comparing values",             OFFSET(function), AV_OPT_TYPE_INT,    {.i64 = 0 },                 0, METADATAF_NB-1, FLAGS, "function" }, \
      {   "string",   NULL,                                      0,                AV_OPT_TYPE_CONST,  {.i64 = METADATAF_STRING },  0, 3,              FLAGS, "function" }, \
      {   "less",     NULL,                                      0,                AV_OPT_TYPE_CONST,  {.i64 = METADATAF_LESS },    0, 3,              FLAGS, "function" }, \
      {   "equal",    NULL,                                      0,                AV_OPT_TYPE_CONST,  {.i64 = METADATAF_EQUAL },   0, 3,              FLAGS, "function" }, \
      {   "greater",  NULL,                                      0,                AV_OPT_TYPE_CONST,  {.i64 = METADATAF_GREATER }, 0, 3,              FLAGS, "function" }, \
      {   "expr",     NULL,                                      0,                AV_OPT_TYPE_CONST,  {.i64 = METADATAF_EXPR },    0, 3,              FLAGS, "function" }, \
      /* parameters of individual comparison functions */ \
      { "expr",     "set expression for expr function",          OFFSET(expr_str), AV_OPT_TYPE_STRING, {.str = NULL },              0, 0,              FLAGS }, \
      { "length",   "compare up to N chars for string function", OFFSET(length),   AV_OPT_TYPE_INT,    {.i64 = INT_MAX },           1, INT_MAX,        FLAGS }, \
      { NULL } \
  }
  /**
   * Comparison callback for the "string" function.
   *
   * @param s       filter context (unused)
   * @param value1  first string
   * @param value2  second string
   * @param length  maximum number of characters to compare
   * @return 1 if the strings agree over at most `length` characters, else 0
   */
  static int string(struct MetadataContext *s, const char *value1, const char *value2, size_t length)
  {
      (void)s;

      return strncmp(value1, value2, length) == 0;
  }
  /**
   * Comparison callback for the "equal" function.
   *
   * Both strings are parsed as floats with sscanf("%f").
   *
   * @param s       filter context (unused)
   * @param value1  first number as text
   * @param value2  second number as text
   * @param length  unused
   * @return 1 if both parse and differ by less than FLT_EPSILON in absolute
   *         value, 0 otherwise (including when either string fails to parse)
   */
  static int equal(struct MetadataContext *s, const char *value1, const char *value2, size_t length)
  {
      float lhs, rhs, delta;

      (void)s;
      (void)length;

      if (sscanf(value1, "%f", &lhs) != 1 || sscanf(value2, "%f", &rhs) != 1)
          return 0;

      /* |lhs - rhs| < FLT_EPSILON, written as a two-sided range check */
      delta = lhs - rhs;
      return delta < FLT_EPSILON && delta > -FLT_EPSILON;
  }
  /**
   * Comparison callback for the "less" function.
   *
   * Both strings are parsed as floats with sscanf("%f").
   *
   * The previous test, (f1 - f2) < FLT_EPSILON, was also true for equal
   * values, so "less" behaved like "less or equal". The comparison is now
   * strict: value1 must be smaller than value2 by at least FLT_EPSILON,
   * which keeps it disjoint from the tolerance window used by equal().
   *
   * @param s       filter context (unused)
   * @param value1  first number as text
   * @param value2  second number as text
   * @param length  unused
   * @return 1 if both parse and value1 is less than value2, 0 otherwise
   *         (including when either string fails to parse)
   */
  static int less(struct MetadataContext *s, const char *value1, const char *value2, size_t length)
  {
      float f1, f2;

      (void)s;
      (void)length;

      if (sscanf(value1, "%f", &f1) != 1 || sscanf(value2, "%f", &f2) != 1)
          return 0;

      return (f2 - f1) >= FLT_EPSILON;
  }
  /**
   * Comparison callback for the "greater" function.
   *
   * Both strings are parsed as floats with sscanf("%f").
   *
   * The previous test, (f2 - f1) < FLT_EPSILON, was also true for equal
   * values, so "greater" behaved like "greater or equal". The comparison is
   * now strict: value1 must exceed value2 by at least FLT_EPSILON, which
   * keeps it disjoint from the tolerance window used by equal().
   *
   * @param s       filter context (unused)
   * @param value1  first number as text
   * @param value2  second number as text
   * @param length  unused
   * @return 1 if both parse and value1 is greater than value2, 0 otherwise
   *         (including when either string fails to parse)
   */
  static int greater(struct MetadataContext *s, const char *value1, const char *value2, size_t length)
  {
      float f1, f2;

      (void)s;
      (void)length;

      if (sscanf(value1, "%f", &f1) != 1 || sscanf(value2, "%f", &f2) != 1)
          return 0;

      return (f1 - f2) >= FLT_EPSILON;
  }
  122. static int parse_expr(MetadataContext *s, const char *value1, const char *value2, size_t length)
  123. {
  124. double f1, f2;
  125. if (sscanf(value1, "%lf", &f1) + sscanf(value2, "%lf", &f2) != 2)
  126. return 0;
  127. s->var_values[VAR_VALUE1] = f1;
  128. s->var_values[VAR_VALUE2] = f2;
  129. return av_expr_eval(s->expr, s->var_values, NULL);
  130. }
  131. static av_cold int init(AVFilterContext *ctx)
  132. {
  133. MetadataContext *s = ctx->priv;
  134. int ret;
  135. if (!s->key && s->mode != METADATA_PRINT) {
  136. av_log(ctx, AV_LOG_WARNING, "Metadata key must be set\n");
  137. return AVERROR(EINVAL);
  138. }
  139. if ((s->mode == METADATA_MODIFY ||
  140. s->mode == METADATA_ADD) && !s->value) {
  141. av_log(ctx, AV_LOG_WARNING, "Missing metadata value\n");
  142. return AVERROR(EINVAL);
  143. }
  144. switch (s->function) {
  145. case METADATAF_STRING:
  146. s->compare = string;
  147. break;
  148. case METADATAF_LESS:
  149. s->compare = less;
  150. break;
  151. case METADATAF_EQUAL:
  152. s->compare = equal;
  153. break;
  154. case METADATAF_GREATER:
  155. s->compare = greater;
  156. break;
  157. case METADATAF_EXPR:
  158. s->compare = parse_expr;
  159. break;
  160. default:
  161. av_assert0(0);
  162. };
  163. if (s->function == METADATAF_EXPR) {
  164. if (!s->expr_str) {
  165. av_log(ctx, AV_LOG_WARNING, "expr option not set\n");
  166. return AVERROR(EINVAL);
  167. }
  168. if ((ret = av_expr_parse(&s->expr, s->expr_str,
  169. var_names, NULL, NULL, NULL, NULL, 0, ctx)) < 0) {
  170. av_log(ctx, AV_LOG_ERROR, "Error while parsing expression '%s'\n", s->expr_str);
  171. return ret;
  172. }
  173. }
  174. return 0;
  175. }
  176. static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
  177. {
  178. AVFilterContext *ctx = inlink->dst;
  179. AVFilterLink *outlink = ctx->outputs[0];
  180. MetadataContext *s = ctx->priv;
  181. AVDictionary *metadata = av_frame_get_metadata(frame);
  182. AVDictionaryEntry *e;
  183. if (!metadata)
  184. return ff_filter_frame(outlink, frame);
  185. e = av_dict_get(metadata, !s->key ? "" : s->key, NULL,
  186. !s->key ? AV_DICT_IGNORE_SUFFIX: 0);
  187. switch (s->mode) {
  188. case METADATA_SELECT:
  189. if (!s->value && e && e->value) {
  190. return ff_filter_frame(outlink, frame);
  191. } else if (s->value && e && e->value &&
  192. s->compare(s, e->value, s->value, s->length)) {
  193. return ff_filter_frame(outlink, frame);
  194. }
  195. break;
  196. case METADATA_ADD:
  197. if (e && e->value) {
  198. ;
  199. } else {
  200. av_dict_set(&metadata, s->key, s->value, 0);
  201. }
  202. return ff_filter_frame(outlink, frame);
  203. break;
  204. case METADATA_MODIFY:
  205. if (e && e->value) {
  206. av_dict_set(&metadata, s->key, s->value, 0);
  207. }
  208. return ff_filter_frame(outlink, frame);
  209. break;
  210. case METADATA_PRINT:
  211. if (!s->key && e) {
  212. av_log(ctx, AV_LOG_INFO, "frame %"PRId64" pts %"PRId64"\n", inlink->frame_count, frame->pts);
  213. av_log(ctx, AV_LOG_INFO, "%s=%s\n", e->key, e->value);
  214. while ((e = av_dict_get(metadata, "", e, AV_DICT_IGNORE_SUFFIX)) != NULL) {
  215. av_log(ctx, AV_LOG_INFO, "%s=%s\n", e->key, e->value);
  216. }
  217. } else if (e && e->value && (!s->value || (e->value && s->compare(s, e->value, s->value, s->length)))) {
  218. av_log(ctx, AV_LOG_INFO, "frame %"PRId64" pts %"PRId64"\n", inlink->frame_count, frame->pts);
  219. av_log(ctx, AV_LOG_INFO, "%s=%s\n", s->key, e->value);
  220. }
  221. return ff_filter_frame(outlink, frame);
  222. break;
  223. case METADATA_DELETE:
  224. if (e && e->value && s->value && s->compare(s, e->value, s->value, s->length)) {
  225. av_dict_set(&metadata, s->key, NULL, 0);
  226. } else if (e && e->value) {
  227. av_dict_set(&metadata, s->key, NULL, 0);
  228. }
  229. return ff_filter_frame(outlink, frame);
  230. break;
  231. default:
  232. av_assert0(0);
  233. };
  234. av_frame_free(&frame);
  235. return 0;
  236. }
  #if CONFIG_AMETADATA_FILTER

  /* Option table and class for the audio variant. */
  DEFINE_OPTIONS(ametadata, AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM);
  AVFILTER_DEFINE_CLASS(ametadata);

  /* Single audio input; frames are handled by filter_frame(). */
  static const AVFilterPad ainputs[] = {
      {
          .name         = "default",
          .type         = AVMEDIA_TYPE_AUDIO,
          .filter_frame = filter_frame,
      },
      { NULL }
  };

  /* Single audio output. */
  static const AVFilterPad aoutputs[] = {
      {
          .name = "default",
          .type = AVMEDIA_TYPE_AUDIO,
      },
      { NULL }
  };

  /* Audio filter definition: "ametadata". */
  AVFilter ff_af_ametadata = {
      .name          = "ametadata",
      .description   = NULL_IF_CONFIG_SMALL("Manipulate audio frame metadata."),
      .priv_size     = sizeof(MetadataContext),
      .priv_class    = &ametadata_class,
      .init          = init,
      .query_formats = ff_query_formats_all,
      .inputs        = ainputs,
      .outputs       = aoutputs,
      .flags         = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,
  };

  #endif /* CONFIG_AMETADATA_FILTER */
  #if CONFIG_METADATA_FILTER

  /* Option table and class for the video variant. */
  DEFINE_OPTIONS(metadata, AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM);
  AVFILTER_DEFINE_CLASS(metadata);

  /* Single video input; frames are handled by filter_frame(). */
  static const AVFilterPad inputs[] = {
      {
          .name         = "default",
          .type         = AVMEDIA_TYPE_VIDEO,
          .filter_frame = filter_frame,
      },
      { NULL }
  };

  /* Single video output. */
  static const AVFilterPad outputs[] = {
      {
          .name = "default",
          .type = AVMEDIA_TYPE_VIDEO,
      },
      { NULL }
  };

  /* Video filter definition: "metadata". */
  AVFilter ff_vf_metadata = {
      .name        = "metadata",
      .description = NULL_IF_CONFIG_SMALL("Manipulate video frame metadata."),
      .priv_size   = sizeof(MetadataContext),
      .priv_class  = &metadata_class,
      .init        = init,
      .inputs      = inputs,
      .outputs     = outputs,
      .flags       = AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC,
  };

  #endif /* CONFIG_METADATA_FILTER */