{ "S12M_TIMECOD", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_S12M_TIMECODE }, 0, 0, FLAGS, "type" }, \
{ "DYNAMIC_HDR_PLUS", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_DYNAMIC_HDR_PLUS }, 0, 0, FLAGS, "type" }, \
{ "REGIONS_OF_INTEREST", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_REGIONS_OF_INTEREST }, 0, 0, FLAGS, "type" }, \
+ { "DETECTION_BOUNDING_BOXES", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_DETECTION_BBOXES }, 0, 0, FLAGS, "type" }, \
{ "SEI_UNREGISTERED", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_SEI_UNREGISTERED }, 0, 0, FLAGS, "type" }, \
{ NULL } \
}
{ "S12M_TIMECOD", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_S12M_TIMECODE }, 0, 0, FLAGS, "type" }, \
{ "DYNAMIC_HDR_PLUS", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_DYNAMIC_HDR_PLUS }, 0, 0, FLAGS, "type" }, \
{ "REGIONS_OF_INTEREST", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_REGIONS_OF_INTEREST }, 0, 0, FLAGS, "type" }, \
+ { "DETECTION_BOUNDING_BOXES", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_DETECTION_BBOXES }, 0, 0, FLAGS, "type" }, \
{ "SEI_UNREGISTERED", "", 0, AV_OPT_TYPE_CONST, {.i64 = AV_FRAME_DATA_SEI_UNREGISTERED }, 0, 0, FLAGS, "type" }, \
{ NULL } \
}
#include "libavutil/timecode.h"
#include "libavutil/mastering_display_metadata.h"
#include "libavutil/video_enc_params.h"
+#include "libavutil/detection_bbox.h"
#include "avfilter.h"
#include "internal.h"
}
}
+static void dump_detection_bbox(AVFilterContext *ctx, const AVFrameSideData *sd)
+{
+ int nb_bboxes;
+ const AVDetectionBBoxHeader *header;
+ const AVDetectionBBox *bbox;
+
+ header = (const AVDetectionBBoxHeader *)sd->data;
+ nb_bboxes = header->nb_bboxes;
+ av_log(ctx, AV_LOG_INFO, "detection bounding boxes:\n");
+ av_log(ctx, AV_LOG_INFO, "source: %s\n", header->source);
+
+ for (int i = 0; i < nb_bboxes; i++) {
+ bbox = av_get_detection_bbox(header, i);
+ av_log(ctx, AV_LOG_INFO, "index: %d,\tregion: (%d, %d) -> (%d, %d), label: %s, confidence: %d/%d.\n",
+ i, bbox->x, bbox->y, bbox->x + bbox->w, bbox->y + bbox->h,
+ bbox->detect_label, bbox->detect_confidence.num, bbox->detect_confidence.den);
+ if (bbox->classify_count > 0) {
+ for (int j = 0; j < bbox->classify_count; j++) {
+ av_log(ctx, AV_LOG_INFO, "\t\tclassify: label: %s, confidence: %d/%d.\n",
+ bbox->classify_labels[j], bbox->classify_confidences[j].num, bbox->classify_confidences[j].den);
+ }
+ }
+ }
+}
+
static void dump_mastering_display(AVFilterContext *ctx, const AVFrameSideData *sd)
{
const AVMasteringDisplayMetadata *mastering_display;
case AV_FRAME_DATA_REGIONS_OF_INTEREST:
dump_roi(ctx, sd);
break;
+ case AV_FRAME_DATA_DETECTION_BBOXES:
+ dump_detection_bbox(ctx, sd);
+ break;
case AV_FRAME_DATA_MASTERING_DISPLAY_METADATA:
dump_mastering_display(ctx, sd);
break;