You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

368 lines
13KB

  1. /*
  2. * Copyright (c) 2011 Stefano Sabatini
  3. * This file is part of FFmpeg.
  4. *
  5. * FFmpeg is free software; you can redistribute it and/or
  6. * modify it under the terms of the GNU Lesser General Public
  7. * License as published by the Free Software Foundation; either
  8. * version 2.1 of the License, or (at your option) any later version.
  9. *
  10. * FFmpeg is distributed in the hope that it will be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  13. * Lesser General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU Lesser General Public
  16. * License along with FFmpeg; if not, write to the Free Software
  17. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  18. */
  19. /**
  20. * @file
  21. * filter for showing textual video frame information
  22. */
  23. #include <inttypes.h>
  24. #include "libavutil/adler32.h"
  25. #include "libavutil/display.h"
  26. #include "libavutil/imgutils.h"
  27. #include "libavutil/internal.h"
  28. #include "libavutil/opt.h"
  29. #include "libavutil/pixdesc.h"
  30. #include "libavutil/spherical.h"
  31. #include "libavutil/stereo3d.h"
  32. #include "libavutil/timestamp.h"
  33. #include "libavutil/timecode.h"
  34. #include "libavutil/mastering_display_metadata.h"
  35. #include "avfilter.h"
  36. #include "internal.h"
  37. #include "video.h"
  38. typedef struct ShowInfoContext {
  39. const AVClass *class;
  40. int calculate_checksums;
  41. } ShowInfoContext;
  42. #define OFFSET(x) offsetof(ShowInfoContext, x)
  43. #define VF AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM
  44. static const AVOption showinfo_options[] = {
  45. { "checksum", "calculate checksums", OFFSET(calculate_checksums), AV_OPT_TYPE_BOOL, {.i64=1}, 0, 1, VF },
  46. { NULL }
  47. };
  48. AVFILTER_DEFINE_CLASS(showinfo);
  49. static void dump_spherical(AVFilterContext *ctx, AVFrame *frame, AVFrameSideData *sd)
  50. {
  51. AVSphericalMapping *spherical = (AVSphericalMapping *)sd->data;
  52. double yaw, pitch, roll;
  53. av_log(ctx, AV_LOG_INFO, "spherical information: ");
  54. if (sd->size < sizeof(*spherical)) {
  55. av_log(ctx, AV_LOG_ERROR, "invalid data");
  56. return;
  57. }
  58. if (spherical->projection == AV_SPHERICAL_EQUIRECTANGULAR)
  59. av_log(ctx, AV_LOG_INFO, "equirectangular ");
  60. else if (spherical->projection == AV_SPHERICAL_CUBEMAP)
  61. av_log(ctx, AV_LOG_INFO, "cubemap ");
  62. else if (spherical->projection == AV_SPHERICAL_EQUIRECTANGULAR_TILE)
  63. av_log(ctx, AV_LOG_INFO, "tiled equirectangular ");
  64. else {
  65. av_log(ctx, AV_LOG_WARNING, "unknown");
  66. return;
  67. }
  68. yaw = ((double)spherical->yaw) / (1 << 16);
  69. pitch = ((double)spherical->pitch) / (1 << 16);
  70. roll = ((double)spherical->roll) / (1 << 16);
  71. av_log(ctx, AV_LOG_INFO, "(%f/%f/%f) ", yaw, pitch, roll);
  72. if (spherical->projection == AV_SPHERICAL_EQUIRECTANGULAR_TILE) {
  73. size_t l, t, r, b;
  74. av_spherical_tile_bounds(spherical, frame->width, frame->height,
  75. &l, &t, &r, &b);
  76. av_log(ctx, AV_LOG_INFO,
  77. "[%"SIZE_SPECIFIER", %"SIZE_SPECIFIER", %"SIZE_SPECIFIER", %"SIZE_SPECIFIER"] ",
  78. l, t, r, b);
  79. } else if (spherical->projection == AV_SPHERICAL_CUBEMAP) {
  80. av_log(ctx, AV_LOG_INFO, "[pad %"PRIu32"] ", spherical->padding);
  81. }
  82. }
  83. static void dump_stereo3d(AVFilterContext *ctx, AVFrameSideData *sd)
  84. {
  85. AVStereo3D *stereo;
  86. av_log(ctx, AV_LOG_INFO, "stereoscopic information: ");
  87. if (sd->size < sizeof(*stereo)) {
  88. av_log(ctx, AV_LOG_ERROR, "invalid data");
  89. return;
  90. }
  91. stereo = (AVStereo3D *)sd->data;
  92. av_log(ctx, AV_LOG_INFO, "type - %s", av_stereo3d_type_name(stereo->type));
  93. if (stereo->flags & AV_STEREO3D_FLAG_INVERT)
  94. av_log(ctx, AV_LOG_INFO, " (inverted)");
  95. }
  96. static void dump_roi(AVFilterContext *ctx, AVFrameSideData *sd)
  97. {
  98. int nb_rois;
  99. const AVRegionOfInterest *roi;
  100. uint32_t roi_size;
  101. roi = (const AVRegionOfInterest *)sd->data;
  102. roi_size = roi->self_size;
  103. if (!roi_size || sd->size % roi_size != 0) {
  104. av_log(ctx, AV_LOG_ERROR, "Invalid AVRegionOfInterest.self_size.");
  105. return;
  106. }
  107. nb_rois = sd->size / roi_size;
  108. av_log(ctx, AV_LOG_INFO, "Regions Of Interest(RoI) information: ");
  109. for (int i = 0; i < nb_rois; i++) {
  110. roi = (const AVRegionOfInterest *)(sd->data + roi_size * i);
  111. av_log(ctx, AV_LOG_INFO, "index: %d, region: (%d, %d)/(%d, %d), qp offset: %d/%d.\n",
  112. i, roi->left, roi->top, roi->right, roi->bottom, roi->qoffset.num, roi->qoffset.den);
  113. }
  114. }
  115. static void dump_mastering_display(AVFilterContext *ctx, AVFrameSideData *sd)
  116. {
  117. AVMasteringDisplayMetadata *mastering_display;
  118. av_log(ctx, AV_LOG_INFO, "mastering display: ");
  119. if (sd->size < sizeof(*mastering_display)) {
  120. av_log(ctx, AV_LOG_ERROR, "invalid data");
  121. return;
  122. }
  123. mastering_display = (AVMasteringDisplayMetadata *)sd->data;
  124. av_log(ctx, AV_LOG_INFO, "has_primaries:%d has_luminance:%d "
  125. "r(%5.4f,%5.4f) g(%5.4f,%5.4f) b(%5.4f %5.4f) wp(%5.4f, %5.4f) "
  126. "min_luminance=%f, max_luminance=%f",
  127. mastering_display->has_primaries, mastering_display->has_luminance,
  128. av_q2d(mastering_display->display_primaries[0][0]),
  129. av_q2d(mastering_display->display_primaries[0][1]),
  130. av_q2d(mastering_display->display_primaries[1][0]),
  131. av_q2d(mastering_display->display_primaries[1][1]),
  132. av_q2d(mastering_display->display_primaries[2][0]),
  133. av_q2d(mastering_display->display_primaries[2][1]),
  134. av_q2d(mastering_display->white_point[0]), av_q2d(mastering_display->white_point[1]),
  135. av_q2d(mastering_display->min_luminance), av_q2d(mastering_display->max_luminance));
  136. }
  137. static void dump_color_property(AVFilterContext *ctx, AVFrame *frame)
  138. {
  139. const char *color_range_str = av_color_range_name(frame->color_range);
  140. const char *colorspace_str = av_color_space_name(frame->colorspace);
  141. const char *color_primaries_str = av_color_primaries_name(frame->color_primaries);
  142. const char *color_trc_str = av_color_transfer_name(frame->color_trc);
  143. if (!color_range_str || frame->color_range == AVCOL_RANGE_UNSPECIFIED) {
  144. av_log(ctx, AV_LOG_INFO, "color_range:unknown");
  145. } else {
  146. av_log(ctx, AV_LOG_INFO, "color_range:%s", color_range_str);
  147. }
  148. if (!colorspace_str || frame->colorspace == AVCOL_SPC_UNSPECIFIED) {
  149. av_log(ctx, AV_LOG_INFO, " color_space:unknown");
  150. } else {
  151. av_log(ctx, AV_LOG_INFO, " color_space:%s", colorspace_str);
  152. }
  153. if (!color_primaries_str || frame->color_primaries == AVCOL_PRI_UNSPECIFIED) {
  154. av_log(ctx, AV_LOG_INFO, " color_primaries:unknown");
  155. } else {
  156. av_log(ctx, AV_LOG_INFO, " color_primaries:%s", color_primaries_str);
  157. }
  158. if (!color_trc_str || frame->color_trc == AVCOL_TRC_UNSPECIFIED) {
  159. av_log(ctx, AV_LOG_INFO, " color_trc:unknown");
  160. } else {
  161. av_log(ctx, AV_LOG_INFO, " color_trc:%s", color_trc_str);
  162. }
  163. av_log(ctx, AV_LOG_INFO, "\n");
  164. }
  165. static void update_sample_stats(const uint8_t *src, int len, int64_t *sum, int64_t *sum2)
  166. {
  167. int i;
  168. for (i = 0; i < len; i++) {
  169. *sum += src[i];
  170. *sum2 += src[i] * src[i];
  171. }
  172. }
  173. static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
  174. {
  175. AVFilterContext *ctx = inlink->dst;
  176. ShowInfoContext *s = ctx->priv;
  177. const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(inlink->format);
  178. uint32_t plane_checksum[4] = {0}, checksum = 0;
  179. int64_t sum[4] = {0}, sum2[4] = {0};
  180. int32_t pixelcount[4] = {0};
  181. int i, plane, vsub = desc->log2_chroma_h;
  182. for (plane = 0; plane < 4 && s->calculate_checksums && frame->data[plane] && frame->linesize[plane]; plane++) {
  183. uint8_t *data = frame->data[plane];
  184. int h = plane == 1 || plane == 2 ? AV_CEIL_RSHIFT(inlink->h, vsub) : inlink->h;
  185. int linesize = av_image_get_linesize(frame->format, frame->width, plane);
  186. if (linesize < 0)
  187. return linesize;
  188. for (i = 0; i < h; i++) {
  189. plane_checksum[plane] = av_adler32_update(plane_checksum[plane], data, linesize);
  190. checksum = av_adler32_update(checksum, data, linesize);
  191. update_sample_stats(data, linesize, sum+plane, sum2+plane);
  192. pixelcount[plane] += linesize;
  193. data += frame->linesize[plane];
  194. }
  195. }
  196. av_log(ctx, AV_LOG_INFO,
  197. "n:%4"PRId64" pts:%7s pts_time:%-7s pos:%9"PRId64" "
  198. "fmt:%s sar:%d/%d s:%dx%d i:%c iskey:%d type:%c ",
  199. inlink->frame_count_out,
  200. av_ts2str(frame->pts), av_ts2timestr(frame->pts, &inlink->time_base), frame->pkt_pos,
  201. desc->name,
  202. frame->sample_aspect_ratio.num, frame->sample_aspect_ratio.den,
  203. frame->width, frame->height,
  204. !frame->interlaced_frame ? 'P' : /* Progressive */
  205. frame->top_field_first ? 'T' : 'B', /* Top / Bottom */
  206. frame->key_frame,
  207. av_get_picture_type_char(frame->pict_type));
  208. if (s->calculate_checksums) {
  209. av_log(ctx, AV_LOG_INFO,
  210. "checksum:%08"PRIX32" plane_checksum:[%08"PRIX32,
  211. checksum, plane_checksum[0]);
  212. for (plane = 1; plane < 4 && frame->data[plane] && frame->linesize[plane]; plane++)
  213. av_log(ctx, AV_LOG_INFO, " %08"PRIX32, plane_checksum[plane]);
  214. av_log(ctx, AV_LOG_INFO, "] mean:[");
  215. for (plane = 0; plane < 4 && frame->data[plane] && frame->linesize[plane]; plane++)
  216. av_log(ctx, AV_LOG_INFO, "%"PRId64" ", (sum[plane] + pixelcount[plane]/2) / pixelcount[plane]);
  217. av_log(ctx, AV_LOG_INFO, "\b] stdev:[");
  218. for (plane = 0; plane < 4 && frame->data[plane] && frame->linesize[plane]; plane++)
  219. av_log(ctx, AV_LOG_INFO, "%3.1f ",
  220. sqrt((sum2[plane] - sum[plane]*(double)sum[plane]/pixelcount[plane])/pixelcount[plane]));
  221. av_log(ctx, AV_LOG_INFO, "\b]");
  222. }
  223. av_log(ctx, AV_LOG_INFO, "\n");
  224. for (i = 0; i < frame->nb_side_data; i++) {
  225. AVFrameSideData *sd = frame->side_data[i];
  226. av_log(ctx, AV_LOG_INFO, " side data - ");
  227. switch (sd->type) {
  228. case AV_FRAME_DATA_PANSCAN:
  229. av_log(ctx, AV_LOG_INFO, "pan/scan");
  230. break;
  231. case AV_FRAME_DATA_A53_CC:
  232. av_log(ctx, AV_LOG_INFO, "A/53 closed captions (%d bytes)", sd->size);
  233. break;
  234. case AV_FRAME_DATA_SPHERICAL:
  235. dump_spherical(ctx, frame, sd);
  236. break;
  237. case AV_FRAME_DATA_STEREO3D:
  238. dump_stereo3d(ctx, sd);
  239. break;
  240. case AV_FRAME_DATA_S12M_TIMECODE: {
  241. uint32_t *tc = (uint32_t*)sd->data;
  242. for (int j = 1; j <= tc[0]; j++) {
  243. char tcbuf[AV_TIMECODE_STR_SIZE];
  244. av_timecode_make_smpte_tc_string(tcbuf, tc[j], 0);
  245. av_log(ctx, AV_LOG_INFO, "timecode - %s%s", tcbuf, j != tc[0] ? ", " : "");
  246. }
  247. break;
  248. }
  249. case AV_FRAME_DATA_DISPLAYMATRIX:
  250. av_log(ctx, AV_LOG_INFO, "displaymatrix: rotation of %.2f degrees",
  251. av_display_rotation_get((int32_t *)sd->data));
  252. break;
  253. case AV_FRAME_DATA_AFD:
  254. av_log(ctx, AV_LOG_INFO, "afd: value of %"PRIu8, sd->data[0]);
  255. break;
  256. case AV_FRAME_DATA_REGIONS_OF_INTEREST:
  257. dump_roi(ctx, sd);
  258. break;
  259. case AV_FRAME_DATA_MASTERING_DISPLAY_METADATA:
  260. dump_mastering_display(ctx, sd);
  261. break;
  262. default:
  263. av_log(ctx, AV_LOG_WARNING, "unknown side data type %d (%d bytes)",
  264. sd->type, sd->size);
  265. break;
  266. }
  267. av_log(ctx, AV_LOG_INFO, "\n");
  268. }
  269. dump_color_property(ctx, frame);
  270. return ff_filter_frame(inlink->dst->outputs[0], frame);
  271. }
  272. static int config_props(AVFilterContext *ctx, AVFilterLink *link, int is_out)
  273. {
  274. av_log(ctx, AV_LOG_INFO, "config %s time_base: %d/%d, frame_rate: %d/%d\n",
  275. is_out ? "out" : "in",
  276. link->time_base.num, link->time_base.den,
  277. link->frame_rate.num, link->frame_rate.den);
  278. return 0;
  279. }
  280. static int config_props_in(AVFilterLink *link)
  281. {
  282. AVFilterContext *ctx = link->dst;
  283. return config_props(ctx, link, 0);
  284. }
  285. static int config_props_out(AVFilterLink *link)
  286. {
  287. AVFilterContext *ctx = link->src;
  288. return config_props(ctx, link, 1);
  289. }
  290. static const AVFilterPad avfilter_vf_showinfo_inputs[] = {
  291. {
  292. .name = "default",
  293. .type = AVMEDIA_TYPE_VIDEO,
  294. .filter_frame = filter_frame,
  295. .config_props = config_props_in,
  296. },
  297. { NULL }
  298. };
  299. static const AVFilterPad avfilter_vf_showinfo_outputs[] = {
  300. {
  301. .name = "default",
  302. .type = AVMEDIA_TYPE_VIDEO,
  303. .config_props = config_props_out,
  304. },
  305. { NULL }
  306. };
  307. AVFilter ff_vf_showinfo = {
  308. .name = "showinfo",
  309. .description = NULL_IF_CONFIG_SMALL("Show textual information for each video frame."),
  310. .inputs = avfilter_vf_showinfo_inputs,
  311. .outputs = avfilter_vf_showinfo_outputs,
  312. .priv_size = sizeof(ShowInfoContext),
  313. .priv_class = &showinfo_class,
  314. };