+/**
+ * Mix one horizontal slice of an 8-bit planar frame through the per-channel
+ * lookup tables stored in the filter context.
+ *
+ * Planes are addressed as data[0] = G, data[1] = B, data[2] = R and
+ * data[3] = A. Every output sample is the sum of the LUT contributions of
+ * the input samples of the same pixel, clipped with av_clip_uint8().
+ *
+ * @param ctx        filter context; ctx->priv is the ColorChannelMixerContext
+ * @param arg        ThreadData carrying the input and output frames
+ * @param jobnr      index of this slice job
+ * @param nb_jobs    total number of slice jobs
+ * @param have_alpha 1 to read, mix and write the alpha plane; with any other
+ *                   value plane 3 of both frames is never offset or accessed
+ * @return 0
+ */
+static av_always_inline int filter_slice_rgba_planar(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs,
+                                                     int have_alpha)
+{
+    ColorChannelMixerContext *s = ctx->priv;
+    ThreadData *td = arg;
+    AVFrame *in = td->in;
+    AVFrame *out = td->out;
+    const int slice_start = (out->height * jobnr) / nb_jobs;
+    const int slice_end = (out->height * (jobnr+1)) / nb_jobs;
+    const uint8_t *srcg = in->data[0] + slice_start * in->linesize[0];
+    const uint8_t *srcb = in->data[1] + slice_start * in->linesize[1];
+    const uint8_t *srcr = in->data[2] + slice_start * in->linesize[2];
+    const uint8_t *srca = in->data[3];
+    uint8_t *dstg = out->data[0] + slice_start * out->linesize[0];
+    uint8_t *dstb = out->data[1] + slice_start * out->linesize[1];
+    uint8_t *dstr = out->data[2] + slice_start * out->linesize[2];
+    uint8_t *dsta = out->data[3];
+    int i, j;
+
+    /* Without an alpha plane data[3] may be NULL, so the alpha pointers are
+     * only offset (and later dereferenced) when alpha is really in use. */
+    if (have_alpha == 1) {
+        srca += slice_start * in->linesize[3];
+        dsta += slice_start * out->linesize[3];
+    }
+
+    for (i = slice_start; i < slice_end; i++) {
+        for (j = 0; j < out->width; j++) {
+            const uint8_t rin = srcr[j];
+            const uint8_t gin = srcg[j];
+            const uint8_t bin = srcb[j];
+            /* Never touch the alpha plane unless it is being mixed. */
+            const uint8_t ain = have_alpha == 1 ? srca[j] : 0;
+
+            dstr[j] = av_clip_uint8(s->lut[R][R][rin] +
+                                    s->lut[R][G][gin] +
+                                    s->lut[R][B][bin] +
+                                    (have_alpha == 1 ? s->lut[R][A][ain] : 0));
+            dstg[j] = av_clip_uint8(s->lut[G][R][rin] +
+                                    s->lut[G][G][gin] +
+                                    s->lut[G][B][bin] +
+                                    (have_alpha == 1 ? s->lut[G][A][ain] : 0));
+            dstb[j] = av_clip_uint8(s->lut[B][R][rin] +
+                                    s->lut[B][G][gin] +
+                                    s->lut[B][B][bin] +
+                                    (have_alpha == 1 ? s->lut[B][A][ain] : 0));
+            if (have_alpha == 1) {
+                dsta[j] = av_clip_uint8(s->lut[A][R][rin] +
+                                        s->lut[A][G][gin] +
+                                        s->lut[A][B][bin] +
+                                        s->lut[A][A][ain]);
+            }
+        }
+
+        /* Step every plane to its next row. */
+        srcg += in->linesize[0];
+        srcb += in->linesize[1];
+        srcr += in->linesize[2];
+        dstg += out->linesize[0];
+        dstb += out->linesize[1];
+        dstr += out->linesize[2];
+        if (have_alpha == 1) {
+            srca += in->linesize[3];
+            dsta += out->linesize[3];
+        }
+    }
+
+    return 0;
+}
+
+/**
+ * Mix one horizontal slice of a planar frame with 16-bit sample storage
+ * through the per-channel lookup tables stored in the filter context.
+ *
+ * Planes are addressed as data[0] = G, data[1] = B, data[2] = R and
+ * data[3] = A. Every output sample is the sum of the LUT contributions of
+ * the input samples of the same pixel, clipped with
+ * av_clip_uintp2(value, depth).
+ *
+ * @param ctx        filter context; ctx->priv is the ColorChannelMixerContext
+ * @param arg        ThreadData carrying the input and output frames
+ * @param jobnr      index of this slice job
+ * @param nb_jobs    total number of slice jobs
+ * @param have_alpha 1 to read, mix and write the alpha plane; with any other
+ *                   value plane 3 of both frames is never offset or accessed
+ * @param depth      bit count handed to av_clip_uintp2() for every output
+ * @return 0
+ */
+static av_always_inline int filter_slice_rgba16_planar(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs,
+                                                       int have_alpha, int depth)
+{
+    ColorChannelMixerContext *s = ctx->priv;
+    ThreadData *td = arg;
+    AVFrame *in = td->in;
+    AVFrame *out = td->out;
+    const int slice_start = (out->height * jobnr) / nb_jobs;
+    const int slice_end = (out->height * (jobnr+1)) / nb_jobs;
+    const uint16_t *srcg = (const uint16_t *)(in->data[0] + slice_start * in->linesize[0]);
+    const uint16_t *srcb = (const uint16_t *)(in->data[1] + slice_start * in->linesize[1]);
+    const uint16_t *srcr = (const uint16_t *)(in->data[2] + slice_start * in->linesize[2]);
+    const uint16_t *srca = (const uint16_t *)in->data[3];
+    uint16_t *dstg = (uint16_t *)(out->data[0] + slice_start * out->linesize[0]);
+    uint16_t *dstb = (uint16_t *)(out->data[1] + slice_start * out->linesize[1]);
+    uint16_t *dstr = (uint16_t *)(out->data[2] + slice_start * out->linesize[2]);
+    uint16_t *dsta = (uint16_t *)out->data[3];
+    int i, j;
+
+    /* Without an alpha plane data[3] may be NULL, so the alpha pointers are
+     * only offset (and later dereferenced) when alpha is really in use. */
+    if (have_alpha == 1) {
+        srca = (const uint16_t *)(in->data[3] + slice_start * in->linesize[3]);
+        dsta = (uint16_t *)(out->data[3] + slice_start * out->linesize[3]);
+    }
+
+    for (i = slice_start; i < slice_end; i++) {
+        for (j = 0; j < out->width; j++) {
+            const uint16_t rin = srcr[j];
+            const uint16_t gin = srcg[j];
+            const uint16_t bin = srcb[j];
+            /* Never touch the alpha plane unless it is being mixed. */
+            const uint16_t ain = have_alpha == 1 ? srca[j] : 0;
+
+            dstr[j] = av_clip_uintp2(s->lut[R][R][rin] +
+                                     s->lut[R][G][gin] +
+                                     s->lut[R][B][bin] +
+                                     (have_alpha == 1 ? s->lut[R][A][ain] : 0), depth);
+            dstg[j] = av_clip_uintp2(s->lut[G][R][rin] +
+                                     s->lut[G][G][gin] +
+                                     s->lut[G][B][bin] +
+                                     (have_alpha == 1 ? s->lut[G][A][ain] : 0), depth);
+            dstb[j] = av_clip_uintp2(s->lut[B][R][rin] +
+                                     s->lut[B][G][gin] +
+                                     s->lut[B][B][bin] +
+                                     (have_alpha == 1 ? s->lut[B][A][ain] : 0), depth);
+            if (have_alpha == 1) {
+                dsta[j] = av_clip_uintp2(s->lut[A][R][rin] +
+                                         s->lut[A][G][gin] +
+                                         s->lut[A][B][bin] +
+                                         s->lut[A][A][ain], depth);
+            }
+        }
+
+        /* linesize is in bytes; the pointers step in 16-bit samples. */
+        srcg += in->linesize[0] / 2;
+        srcb += in->linesize[1] / 2;
+        srcr += in->linesize[2] / 2;
+        dstg += out->linesize[0] / 2;
+        dstb += out->linesize[1] / 2;
+        dstr += out->linesize[2] / 2;
+        if (have_alpha == 1) {
+            srca += in->linesize[3] / 2;
+            dsta += out->linesize[3] / 2;
+        }
+    }
+
+    return 0;
+}
+
+/* Slice job: 8-bit planar mixing with the alpha plane disabled. */
+static int filter_slice_gbrp(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+
+    return filter_slice_rgba_planar(ctx, arg, jobnr, nb_jobs, have_alpha);
+}
+
+/* Slice job: 8-bit planar mixing with the alpha plane enabled. */
+static int filter_slice_gbrap(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 1;
+
+    return filter_slice_rgba_planar(ctx, arg, jobnr, nb_jobs, have_alpha);
+}
+
+/* Slice job: 16-bit-storage planar mixing, no alpha, outputs clipped to 9 bits. */
+static int filter_slice_gbrp9(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+    const int depth = 9;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/* Slice job: 16-bit-storage planar mixing, no alpha, outputs clipped to 10 bits. */
+static int filter_slice_gbrp10(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+    const int depth = 10;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/* Slice job: 16-bit-storage planar mixing, with alpha, outputs clipped to 10 bits. */
+static int filter_slice_gbrap10(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 1;
+    const int depth = 10;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/* Slice job: 16-bit-storage planar mixing, no alpha, outputs clipped to 12 bits. */
+static int filter_slice_gbrp12(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+    const int depth = 12;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/* Slice job: 16-bit-storage planar mixing, with alpha, outputs clipped to 12 bits. */
+static int filter_slice_gbrap12(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 1;
+    const int depth = 12;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/* Slice job: 16-bit-storage planar mixing, no alpha, outputs clipped to 14 bits. */
+static int filter_slice_gbrp14(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+    const int depth = 14;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/* Slice job: 16-bit-storage planar mixing, no alpha, outputs clipped to 16 bits. */
+static int filter_slice_gbrp16(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+    const int depth = 16;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/* Slice job: 16-bit-storage planar mixing, with alpha, outputs clipped to 16 bits. */
+static int filter_slice_gbrap16(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 1;
+    const int depth = 16;
+
+    return filter_slice_rgba16_planar(ctx, arg, jobnr, nb_jobs, have_alpha, depth);
+}
+
+/**
+ * Mix one horizontal slice of an 8-bit packed frame through the per-channel
+ * lookup tables stored in the filter context.
+ *
+ * Component positions inside a pixel come from s->rgba_map; pixels are
+ * `step` bytes apart in plane 0. Every output component is the sum of the
+ * LUT contributions of the input components of the same pixel, clipped with
+ * av_clip_uint8().
+ *
+ * @param ctx        filter context; ctx->priv is the ColorChannelMixerContext
+ * @param arg        ThreadData carrying the input and output frames
+ * @param jobnr      index of this slice job
+ * @param nb_jobs    total number of slice jobs
+ * @param have_alpha  1: alpha is read, mixed into every output and written;
+ *                    0: the alpha position is neither read nor written;
+ *                   -1: alpha is not read; its byte is set to 0 in the output
+ *                       when the output frame is not the input frame
+ * @param step       distance between consecutive pixels, in bytes
+ * @return 0
+ */
+static av_always_inline int filter_slice_rgba_packed(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs,
+                                                     int have_alpha, int step)
+{
+    ColorChannelMixerContext *s = ctx->priv;
+    ThreadData *td = arg;
+    AVFrame *in = td->in;
+    AVFrame *out = td->out;
+    const int slice_start = (out->height * jobnr) / nb_jobs;
+    const int slice_end = (out->height * (jobnr+1)) / nb_jobs;
+    const uint8_t roffset = s->rgba_map[R];
+    const uint8_t goffset = s->rgba_map[G];
+    const uint8_t boffset = s->rgba_map[B];
+    const uint8_t aoffset = s->rgba_map[A];
+    const uint8_t *srcrow = in->data[0] + slice_start * in->linesize[0];
+    uint8_t *dstrow = out->data[0] + slice_start * out->linesize[0];
+    int i, j;
+
+    for (i = slice_start; i < slice_end; i++) {
+        const uint8_t *src = srcrow;
+        uint8_t *dst = dstrow;
+
+        for (j = 0; j < out->width * step; j += step) {
+            const uint8_t rin = src[j + roffset];
+            const uint8_t gin = src[j + goffset];
+            const uint8_t bin = src[j + boffset];
+            /* Only fetch alpha when it is mixed: for pixels without an alpha
+             * component the alpha offset does not address a component of this
+             * pixel and may lie past the end of the row for the last pixel. */
+            const uint8_t ain = have_alpha == 1 ? src[j + aoffset] : 0;
+
+            dst[j + roffset] = av_clip_uint8(s->lut[R][R][rin] +
+                                             s->lut[R][G][gin] +
+                                             s->lut[R][B][bin] +
+                                             (have_alpha == 1 ? s->lut[R][A][ain] : 0));
+            dst[j + goffset] = av_clip_uint8(s->lut[G][R][rin] +
+                                             s->lut[G][G][gin] +
+                                             s->lut[G][B][bin] +
+                                             (have_alpha == 1 ? s->lut[G][A][ain] : 0));
+            dst[j + boffset] = av_clip_uint8(s->lut[B][R][rin] +
+                                             s->lut[B][G][gin] +
+                                             s->lut[B][B][bin] +
+                                             (have_alpha == 1 ? s->lut[B][A][ain] : 0));
+            if (have_alpha == 1) {
+                dst[j + aoffset] = av_clip_uint8(s->lut[A][R][rin] +
+                                                 s->lut[A][G][gin] +
+                                                 s->lut[A][B][bin] +
+                                                 s->lut[A][A][ain]);
+            } else if (have_alpha == -1 && in != out) {
+                /* Fresh output buffer: give the unused fourth byte a
+                 * defined value. */
+                dst[j + aoffset] = 0;
+            }
+        }
+
+        srcrow += in->linesize[0];
+        dstrow += out->linesize[0];
+    }
+
+    return 0;
+}
+
+/**
+ * Mix one horizontal slice of a packed frame with 16-bit components through
+ * the per-channel lookup tables stored in the filter context.
+ *
+ * Component positions inside a pixel come from s->rgba_map; pixels are
+ * `step` 16-bit components apart in plane 0. Every output component is the
+ * sum of the LUT contributions of the input components of the same pixel,
+ * clipped with av_clip_uint16().
+ *
+ * @param ctx        filter context; ctx->priv is the ColorChannelMixerContext
+ * @param arg        ThreadData carrying the input and output frames
+ * @param jobnr      index of this slice job
+ * @param nb_jobs    total number of slice jobs
+ * @param have_alpha 1 to read, mix and write alpha; with any other value the
+ *                   alpha position is neither read nor written
+ * @param step       distance between consecutive pixels, in 16-bit components
+ * @return 0
+ */
+static av_always_inline int filter_slice_rgba16_packed(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs,
+                                                       int have_alpha, int step)
+{
+    ColorChannelMixerContext *s = ctx->priv;
+    ThreadData *td = arg;
+    AVFrame *in = td->in;
+    AVFrame *out = td->out;
+    const int slice_start = (out->height * jobnr) / nb_jobs;
+    const int slice_end = (out->height * (jobnr+1)) / nb_jobs;
+    const uint8_t roffset = s->rgba_map[R];
+    const uint8_t goffset = s->rgba_map[G];
+    const uint8_t boffset = s->rgba_map[B];
+    const uint8_t aoffset = s->rgba_map[A];
+    const uint8_t *srcrow = in->data[0] + slice_start * in->linesize[0];
+    uint8_t *dstrow = out->data[0] + slice_start * out->linesize[0];
+    int i, j;
+
+    for (i = slice_start; i < slice_end; i++) {
+        /* Rows are stepped in bytes, samples are accessed as 16-bit words. */
+        const uint16_t *src = (const uint16_t *)srcrow;
+        uint16_t *dst = (uint16_t *)dstrow;
+
+        for (j = 0; j < out->width * step; j += step) {
+            const uint16_t rin = src[j + roffset];
+            const uint16_t gin = src[j + goffset];
+            const uint16_t bin = src[j + boffset];
+            /* Only fetch alpha when it is mixed: for pixels without an alpha
+             * component the alpha offset does not address a component of this
+             * pixel and may lie past the end of the row for the last pixel. */
+            const uint16_t ain = have_alpha == 1 ? src[j + aoffset] : 0;
+
+            dst[j + roffset] = av_clip_uint16(s->lut[R][R][rin] +
+                                              s->lut[R][G][gin] +
+                                              s->lut[R][B][bin] +
+                                              (have_alpha == 1 ? s->lut[R][A][ain] : 0));
+            dst[j + goffset] = av_clip_uint16(s->lut[G][R][rin] +
+                                              s->lut[G][G][gin] +
+                                              s->lut[G][B][bin] +
+                                              (have_alpha == 1 ? s->lut[G][A][ain] : 0));
+            dst[j + boffset] = av_clip_uint16(s->lut[B][R][rin] +
+                                              s->lut[B][G][gin] +
+                                              s->lut[B][B][bin] +
+                                              (have_alpha == 1 ? s->lut[B][A][ain] : 0));
+            if (have_alpha == 1) {
+                dst[j + aoffset] = av_clip_uint16(s->lut[A][R][rin] +
+                                                  s->lut[A][G][gin] +
+                                                  s->lut[A][B][bin] +
+                                                  s->lut[A][A][ain]);
+            }
+        }
+
+        srcrow += in->linesize[0];
+        dstrow += out->linesize[0];
+    }
+
+    return 0;
+}
+
+/* Slice job: 16-bit packed mixing, alpha enabled, 4 components per pixel. */
+static int filter_slice_rgba64(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 1;
+    const int step = 4;
+
+    return filter_slice_rgba16_packed(ctx, arg, jobnr, nb_jobs, have_alpha, step);
+}
+
+/* Slice job: 16-bit packed mixing, alpha disabled, 3 components per pixel. */
+static int filter_slice_rgb48(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+    const int step = 3;
+
+    return filter_slice_rgba16_packed(ctx, arg, jobnr, nb_jobs, have_alpha, step);
+}
+
+/* Slice job: 8-bit packed mixing, alpha enabled, 4 bytes per pixel. */
+static int filter_slice_rgba(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 1;
+    const int step = 4;
+
+    return filter_slice_rgba_packed(ctx, arg, jobnr, nb_jobs, have_alpha, step);
+}
+
+/* Slice job: 8-bit packed mixing, alpha disabled, 3 bytes per pixel. */
+static int filter_slice_rgb24(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = 0;
+    const int step = 3;
+
+    return filter_slice_rgba_packed(ctx, arg, jobnr, nb_jobs, have_alpha, step);
+}
+
+/*
+ * Slice job: 8-bit packed mixing, 4 bytes per pixel, with have_alpha = -1:
+ * the packed worker does not mix alpha and zeroes the alpha byte of the
+ * output when the output frame differs from the input frame.
+ */
+static int filter_slice_rgb0(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
+{
+    const int have_alpha = -1;
+    const int step = 4;
+
+    return filter_slice_rgba_packed(ctx, arg, jobnr, nb_jobs, have_alpha, step);
+}
+