FFmpeg  4.0
vf_showinfo.c
Go to the documentation of this file.
/*
 * Copyright (c) 2011 Stefano Sabatini
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * filter for showing textual video frame information
 */
24 
25 #include <inttypes.h>
26 
27 #include "libavutil/adler32.h"
28 #include "libavutil/display.h"
29 #include "libavutil/imgutils.h"
30 #include "libavutil/internal.h"
31 #include "libavutil/pixdesc.h"
32 #include "libavutil/spherical.h"
33 #include "libavutil/stereo3d.h"
34 #include "libavutil/timestamp.h"
35 
36 #include "avfilter.h"
37 #include "internal.h"
38 #include "video.h"
39 
41 {
42  AVSphericalMapping *spherical = (AVSphericalMapping *)sd->data;
43  double yaw, pitch, roll;
44 
45  av_log(ctx, AV_LOG_INFO, "spherical information: ");
46  if (sd->size < sizeof(*spherical)) {
47  av_log(ctx, AV_LOG_INFO, "invalid data");
48  return;
49  }
50 
51  if (spherical->projection == AV_SPHERICAL_EQUIRECTANGULAR)
52  av_log(ctx, AV_LOG_INFO, "equirectangular ");
53  else if (spherical->projection == AV_SPHERICAL_CUBEMAP)
54  av_log(ctx, AV_LOG_INFO, "cubemap ");
55  else if (spherical->projection == AV_SPHERICAL_EQUIRECTANGULAR_TILE)
56  av_log(ctx, AV_LOG_INFO, "tiled equirectangular ");
57  else {
58  av_log(ctx, AV_LOG_WARNING, "unknown");
59  return;
60  }
61 
62  yaw = ((double)spherical->yaw) / (1 << 16);
63  pitch = ((double)spherical->pitch) / (1 << 16);
64  roll = ((double)spherical->roll) / (1 << 16);
65  av_log(ctx, AV_LOG_INFO, "(%f/%f/%f) ", yaw, pitch, roll);
66 
68  size_t l, t, r, b;
69  av_spherical_tile_bounds(spherical, frame->width, frame->height,
70  &l, &t, &r, &b);
71  av_log(ctx, AV_LOG_INFO,
73  l, t, r, b);
74  } else if (spherical->projection == AV_SPHERICAL_CUBEMAP) {
75  av_log(ctx, AV_LOG_INFO, "[pad %"PRIu32"] ", spherical->padding);
76  }
77 }
78 
80 {
81  AVStereo3D *stereo;
82 
83  av_log(ctx, AV_LOG_INFO, "stereoscopic information: ");
84  if (sd->size < sizeof(*stereo)) {
85  av_log(ctx, AV_LOG_INFO, "invalid data");
86  return;
87  }
88 
89  stereo = (AVStereo3D *)sd->data;
90 
91  av_log(ctx, AV_LOG_INFO, "type - %s", av_stereo3d_type_name(stereo->type));
92 
93  if (stereo->flags & AV_STEREO3D_FLAG_INVERT)
94  av_log(ctx, AV_LOG_INFO, " (inverted)");
95 }
96 
/**
 * Accumulate the sum and the sum of squares of a run of bytes.
 *
 * The totals are added to the values already stored in *sum and *sum2, so
 * the function can be called once per image line to build plane-wide
 * statistics.
 *
 * @param src  bytes to accumulate
 * @param len  number of bytes to read from src; nothing is read when <= 0
 * @param sum  running sum of the byte values, updated in place
 * @param sum2 running sum of the squared byte values, updated in place
 */
static void update_sample_stats(const uint8_t *src, int len, int64_t *sum, int64_t *sum2)
{
    int i;

    for (i = 0; i < len; i++) {
        *sum  += src[i];
        /* uint8_t promotes to int, so the product is at most 255 * 255. */
        *sum2 += src[i] * src[i];
    }
}
106 
107 static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
108 {
109  AVFilterContext *ctx = inlink->dst;
111  uint32_t plane_checksum[4] = {0}, checksum = 0;
112  int64_t sum[4] = {0}, sum2[4] = {0};
113  int32_t pixelcount[4] = {0};
114  int i, plane, vsub = desc->log2_chroma_h;
115 
116  for (plane = 0; plane < 4 && frame->data[plane] && frame->linesize[plane]; plane++) {
117  uint8_t *data = frame->data[plane];
118  int h = plane == 1 || plane == 2 ? AV_CEIL_RSHIFT(inlink->h, vsub) : inlink->h;
119  int linesize = av_image_get_linesize(frame->format, frame->width, plane);
120 
121  if (linesize < 0)
122  return linesize;
123 
124  for (i = 0; i < h; i++) {
125  plane_checksum[plane] = av_adler32_update(plane_checksum[plane], data, linesize);
126  checksum = av_adler32_update(checksum, data, linesize);
127 
128  update_sample_stats(data, linesize, sum+plane, sum2+plane);
129  pixelcount[plane] += linesize;
130  data += frame->linesize[plane];
131  }
132  }
133 
134  av_log(ctx, AV_LOG_INFO,
135  "n:%4"PRId64" pts:%7s pts_time:%-7s pos:%9"PRId64" "
136  "fmt:%s sar:%d/%d s:%dx%d i:%c iskey:%d type:%c "
137  "checksum:%08"PRIX32" plane_checksum:[%08"PRIX32,
138  inlink->frame_count_out,
139  av_ts2str(frame->pts), av_ts2timestr(frame->pts, &inlink->time_base), frame->pkt_pos,
140  desc->name,
142  frame->width, frame->height,
143  !frame->interlaced_frame ? 'P' : /* Progressive */
144  frame->top_field_first ? 'T' : 'B', /* Top / Bottom */
145  frame->key_frame,
147  checksum, plane_checksum[0]);
148 
149  for (plane = 1; plane < 4 && frame->data[plane] && frame->linesize[plane]; plane++)
150  av_log(ctx, AV_LOG_INFO, " %08"PRIX32, plane_checksum[plane]);
151  av_log(ctx, AV_LOG_INFO, "] mean:[");
152  for (plane = 0; plane < 4 && frame->data[plane] && frame->linesize[plane]; plane++)
153  av_log(ctx, AV_LOG_INFO, "%"PRId64" ", (sum[plane] + pixelcount[plane]/2) / pixelcount[plane]);
154  av_log(ctx, AV_LOG_INFO, "\b] stdev:[");
155  for (plane = 0; plane < 4 && frame->data[plane] && frame->linesize[plane]; plane++)
156  av_log(ctx, AV_LOG_INFO, "%3.1f ",
157  sqrt((sum2[plane] - sum[plane]*(double)sum[plane]/pixelcount[plane])/pixelcount[plane]));
158  av_log(ctx, AV_LOG_INFO, "\b]\n");
159 
160  for (i = 0; i < frame->nb_side_data; i++) {
161  AVFrameSideData *sd = frame->side_data[i];
162 
163  av_log(ctx, AV_LOG_INFO, " side data - ");
164  switch (sd->type) {
166  av_log(ctx, AV_LOG_INFO, "pan/scan");
167  break;
169  av_log(ctx, AV_LOG_INFO, "A/53 closed captions (%d bytes)", sd->size);
170  break;
172  dump_spherical(ctx, frame, sd);
173  break;
175  dump_stereo3d(ctx, sd);
176  break;
178  av_log(ctx, AV_LOG_INFO, "displaymatrix: rotation of %.2f degrees",
180  break;
181  case AV_FRAME_DATA_AFD:
182  av_log(ctx, AV_LOG_INFO, "afd: value of %"PRIu8, sd->data[0]);
183  break;
184  default:
185  av_log(ctx, AV_LOG_WARNING, "unknown side data type %d (%d bytes)",
186  sd->type, sd->size);
187  break;
188  }
189 
190  av_log(ctx, AV_LOG_INFO, "\n");
191  }
192 
193  return ff_filter_frame(inlink->dst->outputs[0], frame);
194 }
195 
196 static int config_props(AVFilterContext *ctx, AVFilterLink *link, int is_out)
197 {
198 
199  av_log(ctx, AV_LOG_INFO, "config %s time_base: %d/%d, frame_rate: %d/%d\n",
200  is_out ? "out" : "in",
201  link->time_base.num, link->time_base.den,
202  link->frame_rate.num, link->frame_rate.den);
203 
204  return 0;
205 }
206 
207 static int config_props_in(AVFilterLink *link)
208 {
209  AVFilterContext *ctx = link->dst;
210  return config_props(ctx, link, 0);
211 }
212 
214 {
215  AVFilterContext *ctx = link->src;
216  return config_props(ctx, link, 1);
217 }
218 
220  {
221  .name = "default",
222  .type = AVMEDIA_TYPE_VIDEO,
223  .filter_frame = filter_frame,
224  .config_props = config_props_in,
225  },
226  { NULL }
227 };
228 
230  {
231  .name = "default",
232  .type = AVMEDIA_TYPE_VIDEO,
233  .config_props = config_props_out,
234  },
235  { NULL }
236 };
237 
239  .name = "showinfo",
240  .description = NULL_IF_CONFIG_SMALL("Show textual information for each video frame."),
241  .inputs = avfilter_vf_showinfo_inputs,
242  .outputs = avfilter_vf_showinfo_outputs,
243 };
int32_t pitch
Rotation around the right vector [-90, 90].
Definition: spherical.h:127
int plane
Definition: avisynth_c.h:422
#define AV_STEREO3D_FLAG_INVERT
Inverted views, Right/Bottom represents the left view.
Definition: stereo3d.h:167
#define NULL
Definition: coverity.c:32
static int config_props_out(AVFilterLink *link)
Definition: vf_showinfo.c:213
int av_image_get_linesize(enum AVPixelFormat pix_fmt, int width, int plane)
Compute the size of an image line with format pix_fmt and width width for the plane plane...
Definition: imgutils.c:76
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2363
This structure describes decoded (raw) audio or video data.
Definition: frame.h:218
static void dump_spherical(AVFilterContext *ctx, AVFrame *frame, AVFrameSideData *sd)
Definition: vf_showinfo.c:40
int64_t pkt_pos
reordered pos from the last AVPacket that has been input into the decoder
Definition: frame.h:490
misc image utilities
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:182
Main libavfilter public API header.
const char * desc
Definition: nvenc.c:65
Video represents a portion of a sphere mapped on a flat surface using equirectangular projection...
Definition: spherical.h:72
int num
Numerator.
Definition: rational.h:59
const char * b
Definition: vf_curves.c:113
Video represents a sphere mapped on a flat surface using equirectangular projection.
Definition: spherical.h:56
#define src
Definition: vp8dsp.c:254
static const AVFilterPad avfilter_vf_showinfo_inputs[]
Definition: vf_showinfo.c:219
static int filter_frame(AVFilterLink *inlink, AVFrame *frame)
Definition: vf_showinfo.c:107
const char * name
Pad name.
Definition: internal.h:60
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1080
uint8_t
timestamp utils, mostly useful for debugging/logging purposes
Stereo 3D type: this structure describes how two videos are packed within a single video surface...
Definition: stereo3d.h:176
static int config_props_in(AVFilterLink *link)
Definition: vf_showinfo.c:207
unsigned long av_adler32_update(unsigned long adler, const uint8_t *buf, unsigned int len)
Calculate the Adler32 checksum of a buffer.
Definition: adler32.c:44
void av_spherical_tile_bounds(const AVSphericalMapping *map, size_t width, size_t height, size_t *left, size_t *top, size_t *right, size_t *bottom)
Convert the bounding fields from an AVSphericalVideo from 0.32 fixed point to pixels.
Definition: spherical.c:36
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
Definition: frame.h:311
The data is the AVPanScan struct defined in libavcodec.
Definition: frame.h:52
static AVFrame * frame
const char data[16]
Definition: mxf.c:90
Structure to hold side data for an AVFrame.
Definition: frame.h:180
const char * av_stereo3d_type_name(unsigned int type)
Provide a human-readable name of a given stereo3d type.
Definition: stereo3d.c:57
char av_get_picture_type_char(enum AVPictureType pict_type)
Return a single letter to describe the given picture type pict_type.
Definition: utils.c:88
int interlaced_frame
The content of the picture is interlaced.
Definition: frame.h:365
The data represents the AVSphericalMapping structure defined in libavutil/spherical.h.
Definition: frame.h:130
Active Format Description data consisting of a single byte as specified in ETSI TS 101 154 using AVAc...
Definition: frame.h:89
int nb_side_data
Definition: frame.h:431
AVFrameSideData ** side_data
Definition: frame.h:430
#define av_log(a,...)
const char * name
Definition: pixdesc.h:82
A filter pad used for either input or output.
Definition: internal.h:54
int width
Definition: frame.h:276
int flags
Additional information about the frame packing.
Definition: stereo3d.h:185
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
Definition: pixdesc.h:101
#define av_ts2timestr(ts, tb)
Convenience macro, the return value should be used only directly in function arguments but never stan...
Definition: timestamp.h:76
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:186
Display matrix.
const char * r
Definition: vf_curves.c:111
ATSC A53 Part 4 Closed Captions.
Definition: frame.h:58
static void update_sample_stats(const uint8_t *src, int len, int64_t *sum, int64_t *sum2)
Definition: vf_showinfo.c:97
common internal API header
Video frame is split into 6 faces of a cube, and arranged on a 3x2 layout.
Definition: spherical.h:65
enum AVPictureType pict_type
Picture type of the frame.
Definition: frame.h:301
static int config_props(AVFilterContext *ctx, AVFilterLink *link, int is_out)
Definition: vf_showinfo.c:196
Spherical video.
static void dump_stereo3d(AVFilterContext *ctx, AVFrameSideData *sd)
Definition: vf_showinfo.c:79
int32_t
AVFormatContext * ctx
Definition: movenc.c:48
int32_t yaw
Rotation around the up vector [-180, 180].
Definition: spherical.h:126
static volatile int checksum
Definition: adler32.c:30
uint32_t padding
Number of pixels to pad from the edge of each cube face.
Definition: spherical.h:182
Public header for Adler-32 hash function implementation.
int format
format of the frame, -1 if unknown or unset Values correspond to enum AVPixelFormat for video frames...
Definition: frame.h:291
enum AVStereo3DType type
How views are packed within the video.
Definition: stereo3d.h:180
#define AV_LOG_INFO
Standard information.
Definition: log.h:187
This side data contains a 3x3 transformation matrix describing an affine transformation that needs to...
Definition: frame.h:84
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Definition: frame.h:249
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:81
AVRational sample_aspect_ratio
Sample aspect ratio for the video frame, 0/1 if unknown/unspecified.
Definition: frame.h:306
uint8_t * data
Definition: frame.h:182
static const AVFilterPad avfilter_vf_showinfo_outputs[]
Definition: vf_showinfo.c:229
Filter definition.
Definition: avfilter.h:144
int32_t roll
Rotation around the forward vector [-180, 180].
Definition: spherical.h:128
const char * name
Filter name.
Definition: avfilter.h:148
This structure describes how to handle spherical videos, outlining information about projection...
Definition: spherical.h:82
AVFilterLink ** outputs
array of pointers to output links
Definition: avfilter.h:350
enum AVFrameSideDataType type
Definition: frame.h:181
#define SIZE_SPECIFIER
Definition: internal.h:262
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:232
enum AVSphericalProjection projection
Projection type.
Definition: spherical.h:86
Stereoscopic video.
int den
Denominator.
Definition: rational.h:60
int top_field_first
If the content is interlaced, is top field displayed first.
Definition: frame.h:370
#define av_ts2str(ts)
Convenience macro, the return value should be used only directly in function arguments but never stan...
Definition: timestamp.h:54
int len
int key_frame
1 -> keyframe, 0-> not
Definition: frame.h:296
An instance of a filter.
Definition: avfilter.h:338
double av_display_rotation_get(const int32_t matrix[9])
Extract the rotation component of the transformation matrix.
Definition: display.c:34
int height
Definition: frame.h:276
internal API functions
Stereoscopic 3d metadata.
Definition: frame.h:63
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:58
AVFilter ff_vf_showinfo
Definition: vf_showinfo.c:238