enum MatrixMode {
MATRIX_SQUARE,
MATRIX_ROW,
+ MATRIX_COLUMN,
MATRIX_NBMODES,
};
void (*setup[4])(int radius, const uint8_t *c[], const uint8_t *src, int stride,
int x, int width, int y, int height, int bpc);
- void (*filter[4])(uint8_t *dst, const uint8_t *src, int width,
+ void (*filter[4])(uint8_t *dst, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius);
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride);
} ConvolutionContext;
#define OFFSET(x) offsetof(ConvolutionContext, x)
{ "3mode", "set matrix mode for 4th plane", OFFSET(mode[3]), AV_OPT_TYPE_INT, {.i64=MATRIX_SQUARE}, 0, MATRIX_NBMODES-1, FLAGS, "mode" },
{ "square", "square matrix", 0, AV_OPT_TYPE_CONST, {.i64=MATRIX_SQUARE}, 0, 0, FLAGS, "mode" },
{ "row", "single row matrix", 0, AV_OPT_TYPE_CONST, {.i64=MATRIX_ROW} , 0, 0, FLAGS, "mode" },
+ { "column", "single column matrix", 0, AV_OPT_TYPE_CONST, {.i64=MATRIX_COLUMN}, 0, 0, FLAGS, "mode" },
{ NULL }
};
AVFrame *in, *out;
} ThreadData;
-static void filter16_prewitt(uint8_t *dstp, const uint8_t *src, int width,
+static void filter16_prewitt(uint8_t *dstp, int width,
float scale, float delta, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
uint16_t *dst = (uint16_t *)dstp;
int x;
}
}
-static void filter16_roberts(uint8_t *dstp, const uint8_t *src, int width,
+static void filter16_roberts(uint8_t *dstp, int width,
float scale, float delta, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
uint16_t *dst = (uint16_t *)dstp;
int x;
}
}
-static void filter16_sobel(uint8_t *dstp, const uint8_t *src, int width,
+static void filter16_sobel(uint8_t *dstp, int width,
float scale, float delta, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
uint16_t *dst = (uint16_t *)dstp;
int x;
}
}
-static void filter_prewitt(uint8_t *dst, const uint8_t *src, int width,
+static void filter_prewitt(uint8_t *dst, int width,
float scale, float delta, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
const uint8_t *c0 = c[0], *c1 = c[1], *c2 = c[2];
const uint8_t *c3 = c[3], *c5 = c[5];
}
}
-static void filter_roberts(uint8_t *dst, const uint8_t *src, int width,
+static void filter_roberts(uint8_t *dst, int width,
float scale, float delta, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
int x;
}
}
-static void filter_sobel(uint8_t *dst, const uint8_t *src, int width,
+static void filter_sobel(uint8_t *dst, int width,
float scale, float delta, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
const uint8_t *c0 = c[0], *c1 = c[1], *c2 = c[2];
const uint8_t *c3 = c[3], *c5 = c[5];
}
}
-static void filter16_3x3(uint8_t *dstp, const uint8_t *src, int width,
+static void filter16_3x3(uint8_t *dstp, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
uint16_t *dst = (uint16_t *)dstp;
int x;
}
}
-static void filter16_5x5(uint8_t *dstp, const uint8_t *src, int width,
+static void filter16_5x5(uint8_t *dstp, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
uint16_t *dst = (uint16_t *)dstp;
int x;
}
}
-static void filter16_7x7(uint8_t *dstp, const uint8_t *src, int width,
+static void filter16_7x7(uint8_t *dstp, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
uint16_t *dst = (uint16_t *)dstp;
int x;
}
}
-static void filter16_row(uint8_t *dstp, const uint8_t *src, int width,
+static void filter16_row(uint8_t *dstp, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
uint16_t *dst = (uint16_t *)dstp;
int x;
}
}
-static void filter_7x7(uint8_t *dst, const uint8_t *src, int width,
+static void filter16_column(uint8_t *dstp, int height,
+ float rdiv, float bias, const int *const matrix,
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
+{
+ uint16_t *dst = (uint16_t *)dstp;
+ int y;
+
+ for (y = 0; y < height; y++) {
+ int i, sum = 0;
+
+ for (i = 0; i < 2 * radius + 1; i++)
+ sum += AV_RN16A(&c[i][0 + y * stride]) * matrix[i];
+
+ sum = (int)(sum * rdiv + bias + 0.5f);
+ dst[0] = av_clip(sum, 0, peak);
+ dst += dstride / 2;
+ }
+}
+
+static void filter_7x7(uint8_t *dst, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
int x;
}
}
-static void filter_5x5(uint8_t *dst, const uint8_t *src, int width,
+static void filter_5x5(uint8_t *dst, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
int x;
}
}
-static void filter_3x3(uint8_t *dst, const uint8_t *src, int width,
+static void filter_3x3(uint8_t *dst, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
const uint8_t *c0 = c[0], *c1 = c[1], *c2 = c[2];
const uint8_t *c3 = c[3], *c4 = c[4], *c5 = c[5];
}
}
-static void filter_row(uint8_t *dst, const uint8_t *src, int width,
+static void filter_row(uint8_t *dst, int width,
float rdiv, float bias, const int *const matrix,
- const uint8_t *c[], int peak, int radius)
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
{
int x;
}
}
+static void filter_column(uint8_t *dst, int height,
+ float rdiv, float bias, const int *const matrix,
+ const uint8_t *c[], int peak, int radius,
+ int dstride, int stride)
+{
+ int y;
+
+ for (y = 0; y < height; y++) {
+ int i, sum = 0;
+
+ for (i = 0; i < 2 * radius + 1; i++)
+ sum += c[i][0 + y * stride] * matrix[i];
+
+ sum = (int)(sum * rdiv + bias + 0.5f);
+ dst[0] = av_clip_uint8(sum);
+ dst += dstride;
+ }
+}
+
static void setup_3x3(int radius, const uint8_t *c[], const uint8_t *src, int stride,
int x, int w, int y, int h, int bpc)
{
}
}
+static void setup_column(int radius, const uint8_t *c[], const uint8_t *src, int stride,
+ int x, int w, int y, int h, int bpc)
+{
+ int i;
+
+ for (i = 0; i < radius * 2 + 1; i++) {
+ int xoff = FFABS(x + i - radius);
+
+ xoff = xoff >= h ? 2 * h - 1 - xoff : xoff;
+
+ c[i] = src + y * bpc + xoff * stride;
+ }
+}
+
static int filter_slice(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
{
ConvolutionContext *s = ctx->priv;
int plane;
for (plane = 0; plane < s->nb_planes; plane++) {
+ const int mode = s->mode[plane];
+ const int bpc = s->bpc;
const int radius = s->size[plane] / 2;
const int height = s->planeheight[plane];
const int width = s->planewidth[plane];
const int stride = in->linesize[plane];
const int dstride = out->linesize[plane];
- const int slice_start = (height * jobnr) / nb_jobs;
- const int slice_end = (height * (jobnr+1)) / nb_jobs;
+ const int sizeh = mode == MATRIX_COLUMN ? width : height;
+ const int sizew = mode == MATRIX_COLUMN ? height : width;
+ const int slice_start = (sizeh * jobnr) / nb_jobs;
+ const int slice_end = (sizeh * (jobnr+1)) / nb_jobs;
const float rdiv = s->rdiv[plane];
const float bias = s->bias[plane];
const uint8_t *src = in->data[plane];
- uint8_t *dst = out->data[plane] + slice_start * out->linesize[plane];
+ const int dst_pos = slice_start * (mode == MATRIX_COLUMN ? bpc : out->linesize[plane]);
+ uint8_t *dst = out->data[plane] + dst_pos;
const int *matrix = s->matrix[plane];
- const int bpc = s->bpc;
const uint8_t *c[49];
int y, x;
if (s->copy[plane]) {
- av_image_copy_plane(dst, dstride, src + slice_start * stride, stride,
- width * bpc, slice_end - slice_start);
+ if (mode == MATRIX_COLUMN)
+ av_image_copy_plane(dst, dstride, src + slice_start * bpc, stride,
+ (slice_end - slice_start) * bpc, height);
+ else
+ av_image_copy_plane(dst, dstride, src + slice_start * stride, stride,
+ width * bpc, slice_end - slice_start);
continue;
}
for (y = slice_start; y < slice_end; y++) {
+ const int xoff = mode == MATRIX_COLUMN ? (y - slice_start) * bpc : radius * bpc;
+ const int yoff = mode == MATRIX_COLUMN ? radius * stride : 0;
+
for (x = 0; x < radius; x++) {
+ const int xoff = mode == MATRIX_COLUMN ? (y - slice_start) * bpc : x * bpc;
+ const int yoff = mode == MATRIX_COLUMN ? x * stride : 0;
+
s->setup[plane](radius, c, src, stride, x, width, y, height, bpc);
- s->filter[plane](dst + x * bpc, src, 1, rdiv,
- bias, matrix, c, s->max, radius);
+ s->filter[plane](dst + yoff + xoff, 1, rdiv,
+ bias, matrix, c, s->max, radius,
+ dstride, stride);
}
s->setup[plane](radius, c, src, stride, radius, width, y, height, bpc);
- s->filter[plane](dst + radius * bpc, src, width - 2 * radius,
- rdiv, bias, matrix, c, s->max, radius);
- for (x = width - radius; x < width; x++) {
+ s->filter[plane](dst + yoff + xoff, sizew - 2 * radius,
+ rdiv, bias, matrix, c, s->max, radius,
+ dstride, stride);
+ for (x = sizew - radius; x < sizew; x++) {
+ const int xoff = mode == MATRIX_COLUMN ? (y - slice_start) * bpc : x * bpc;
+ const int yoff = mode == MATRIX_COLUMN ? x * stride : 0;
+
s->setup[plane](radius, c, src, stride, x, width, y, height, bpc);
- s->filter[plane](dst + x * bpc, src, 1, rdiv,
- bias, matrix, c, s->max, radius);
+ s->filter[plane](dst + yoff + xoff, 1, rdiv,
+ bias, matrix, c, s->max, radius,
+ dstride, stride);
}
- dst += dstride;
+ if (mode != MATRIX_COLUMN)
+ dst += dstride;
}
}
for (p = 0; p < s->nb_planes; p++) {
if (s->mode[p] == MATRIX_ROW)
s->filter[p] = filter16_row;
+ else if (s->mode[p] == MATRIX_COLUMN)
+ s->filter[p] = filter16_column;
else if (s->size[p] == 3)
s->filter[p] = filter16_3x3;
else if (s->size[p] == 5)
td.in = in;
td.out = out;
- ctx->internal->execute(ctx, filter_slice, &td, NULL, FFMIN(s->planeheight[1], s->nb_threads));
+ ctx->internal->execute(ctx, filter_slice, &td, NULL, FFMIN3(s->planeheight[1], s->planewidth[1], s->nb_threads));
av_frame_free(&in);
return ff_filter_frame(outlink, out);
s->filter[i] = filter_row;
s->setup[i] = setup_row;
s->size[i] = s->matrix_length[i];
+ } else if (s->mode[i] == MATRIX_COLUMN) {
+ s->filter[i] = filter_column;
+ s->setup[i] = setup_column;
+ s->size[i] = s->matrix_length[i];
} else if (s->matrix_length[i] == 9) {
s->size[i] = 3;
if (!memcmp(matrix, same3x3, sizeof(same3x3)))