- const uint16_t *bsrc = (const uint16_t *)bbsrc;
- const uint16_t *darksrc = (const uint16_t *)oosrc;
- const uint16_t *brightsrc = (const uint16_t *)mmsrc;
- uint16_t *dst = (uint16_t *)ddst;
- int x, y;
-
- dlinesize /= 2;
- blinesize /= 2;
- darklinesize /= 2;
- brightlinesize /= 2;
-
- for (y = 0; y < h; y++) {
- for (x = 0; x < w; x++) {
- if (bsrc[x] < darksrc[x] - undershoot)
- dst[x] = darksrc[x] - undershoot;
- else if (bsrc[x] > brightsrc[x] + overshoot)
- dst[x] = brightsrc[x] + overshoot;
- else
- dst[x] = bsrc[x];
+ MaskedClampContext *s = ctx->priv;
+ ThreadData *td = arg;
+ int p;
+
+ for (p = 0; p < s->nb_planes; p++) {
+ const ptrdiff_t blinesize = td->b->linesize[p] / 2;
+ const ptrdiff_t brightlinesize = td->m->linesize[p] / 2;
+ const ptrdiff_t darklinesize = td->o->linesize[p] / 2;
+ const ptrdiff_t dlinesize = td->d->linesize[p] / 2;
+ const int w = s->width[p];
+ const int h = s->height[p];
+ const int slice_start = (h * jobnr) / nb_jobs;
+ const int slice_end = (h * (jobnr+1)) / nb_jobs;
+ const uint16_t *bsrc = (const uint16_t *)td->b->data[p] + slice_start * blinesize;
+ const uint16_t *darksrc = (const uint16_t *)td->o->data[p] + slice_start * darklinesize;
+ const uint16_t *brightsrc = (const uint16_t *)td->m->data[p] + slice_start * brightlinesize;
+ uint16_t *dst = (uint16_t *)td->d->data[p] + slice_start * dlinesize;
+ const int undershoot = s->undershoot;
+ const int overshoot = s->overshoot;
+ int x, y;
+
+ if (!((1 << p) & s->planes)) {
+ av_image_copy_plane((uint8_t *)dst, dlinesize, (const uint8_t *)bsrc, blinesize,
+ s->linesize[p], slice_end - slice_start);
+ continue;