2 * Discrete wavelet transform
3 * Copyright (c) 2007 Kamil Nowosad
4 * Copyright (c) 2013 Nicolas Bertrand <nicoinattendu@gmail.com>
6 * This file is part of FFmpeg.
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
25 * Discrete wavelet transform
28 #include "libavutil/avassert.h"
29 #include "libavutil/common.h"
30 #include "libavutil/mem.h"
31 #include "jpeg2000dwt.h"
34 /* Defines for 9/7 DWT lifting parameters.
35 * Parameters are in float. */
/* ALPHA, BETA, GAMMA and DELTA are the coefficients of the four lifting
 * steps. K and X are scale factors applied to the two interleaved sample
 * phases when lines are copied in and out of the line buffer. */
36 #define F_LFTG_ALPHA 1.586134342059924f
37 #define F_LFTG_BETA 0.052980118572961f
38 #define F_LFTG_GAMMA 0.882911075530934f
39 #define F_LFTG_DELTA 0.443506852043971f
40 #define F_LFTG_K 1.230174104914001f
41 #define F_LFTG_X 1.625732422f
42 /* FIXME: Why use 1.625732422 instead of 1/F_LFTG_K?
43 * Incorrect value in JPEG2000 norm.
44 * See ISO/IEC 15444-1 (version 2002), F.3.8.2. */
46 /* Lifting parameters in integer format.
47 * Computed as param = (float param) * (1 << 16) */
/* The values below are the float parameters above in fixed point with 16
 * fractional bits, rounded to the nearest integer. They are applied as
 * (x * PARAM + (1 << 15)) >> 16, i.e. a rounded fixed-point multiply. */
48 #define I_LFTG_ALPHA 103949
49 #define I_LFTG_BETA 3472
50 #define I_LFTG_GAMMA 57862
51 #define I_LFTG_DELTA 29066
52 #define I_LFTG_K 80621
53 #define I_LFTG_X 106544
/* Symmetric boundary extension for the 5/3 filter.
 * The signal occupies p[i0] .. p[i1 - 1]; samples just outside that range
 * are filled by mirroring the samples inside it (about p[i0] on the left
 * and about p[i1 - 1] on the right).
 * NOTE(review): only the writes to p[i0 - 1], p[i0 - 2] and p[i1 + 1] are
 * visible here -- confirm that p[i1] is filled as well. */
55 static inline void extend53(int *p, int i0, int i1)
57 p[i0 - 1] = p[i0 + 1];
59 p[i0 - 2] = p[i0 + 2];
60 p[i1 + 1] = p[i1 - 3];
/* Symmetric boundary extension for the float 9/7 filter.
 * Writes four mirrored samples on each side of the signal:
 * p[i0 - 4 .. i0 - 1] are reflected about p[i0] and
 * p[i1 .. i1 + 3] are reflected about p[i1 - 1].
 * The caller must provide room for four samples beyond each end. */
63 static inline void extend97_float(float *p, int i0, int i1)
67 for (i = 1; i <= 4; i++) {
68 p[i0 - i] = p[i0 + i];
69 p[i1 + i - 1] = p[i1 - i - 1];
/* Symmetric boundary extension for the integer 9/7 filter.
 * Same mirroring as the float variant: p[i0 - 4 .. i0 - 1] are reflected
 * about p[i0] and p[i1 .. i1 + 3] are reflected about p[i1 - 1].
 * The caller must provide room for four samples beyond each end. */
73 static inline void extend97_int(int32_t *p, int i0, int i1)
77 for (i = 1; i <= 4; i++) {
78 p[i0 - i] = p[i0 + i];
79 p[i1 + i - 1] = p[i1 - i - 1];
/* Forward 1D 5/3 lifting, in place, on the samples of p from i0 up to
 * (but not including) i1.
 * NOTE(review): any short-range special case and the boundary extension
 * that precede the two loops are not visible here. */
83 static void sd_1d53(int *p, int i0, int i1)
/* Predict step: subtract the floored mean of the two even neighbours from
 * each odd-indexed sample. */
95 for (i = (i0+1)/2 - 1; i < (i1+1)/2; i++)
96 p[2*i+1] -= (p[2*i] + p[2*i+2]) >> 1;
/* Update step: add a rounded quarter of the two (already predicted) odd
 * neighbours to each even-indexed sample. */
97 for (i = (i0+1)/2; i < (i1+1)/2; i++)
98 p[2*i] += (p[2*i-1] + p[2*i+1] + 2) >> 2;
/* Forward 2D 5/3 transform of the integer samples in t.
 * Decomposition levels are processed from s->ndeclevels - 1 down to 0.
 * At each level sd_1d53() is run first on lh lines of length lv, then on
 * lv lines of length lh (columns, then rows, going by the lv/lh naming).
 * Each line is staged in s->i_linebuf and written back deinterleaved.
 * mv and mh are the start offsets passed to sd_1d53(); presumably the
 * parities stored in s->mod -- their initialisation is not visible here. */
101 static void dwt_encode53(DWTContext *s, int *t)
104 w = s->linelen[s->ndeclevels-1][0];
105 int *line = s->i_linebuf;
108 for (lev = s->ndeclevels-1; lev >= 0; lev--){
109 int lh = s->linelen[lev][0],
110 lv = s->linelen[lev][1],
/* First pass: one length-lv line per lp. */
118 for (lp = 0; lp < lh; lp++) {
121 for (i = 0; i < lv; i++)
124 sd_1d53(line, mv, mv + lv);
126 // copy back and deinterleave
127 for (i = mv; i < lv; i+=2, j++)
129 for (i = 1-mv; i < lv; i+=2, j++)
/* Second pass: one length-lh line per lp. */
135 for (lp = 0; lp < lv; lp++){
138 for (i = 0; i < lh; i++)
141 sd_1d53(line, mh, mh + lh);
143 // copy back and deinterleave
144 for (i = mh; i < lh; i+=2, j++)
146 for (i = 1-mh; i < lh; i+=2, j++)
/* Forward 1D 9/7 lifting in floating point, in place, on the samples of p
 * from i0 up to (but not including) i1.
 * After the symmetric extension, four lifting steps alternately update the
 * odd- and even-indexed samples. The loop ranges shrink from step to step:
 * the earlier steps also cover extended samples that later steps read.
 * NOTE(review): the coefficients are written as truncated double literals
 * rather than the F_LFTG_ALPHA/BETA/GAMMA/DELTA macros that
 * sr_1d97_float() uses -- confirm this is intentional. */
151 static void sd_1d97_float(float *p, int i0, int i1)
163 extend97_float(p, i0, i1);
/* Step 1 (alpha): odd samples. */
166 for (i = i0/2 - 2; i < i1/2 + 1; i++)
167 p[2*i+1] -= 1.586134 * (p[2*i] + p[2*i+2]);
/* Step 2 (beta): even samples. */
168 for (i = i0/2 - 1; i < i1/2 + 1; i++)
169 p[2*i] -= 0.052980 * (p[2*i-1] + p[2*i+1]);
/* Step 3 (gamma): odd samples. */
170 for (i = i0/2 - 1; i < i1/2; i++)
171 p[2*i+1] += 0.882911 * (p[2*i] + p[2*i+2]);
/* Step 4 (delta): even samples. */
172 for (i = i0/2; i < i1/2; i++)
173 p[2*i] += 0.443506 * (p[2*i-1] + p[2*i+1]);
/* Forward 2D 9/7 transform of the float samples in t, in place.
 * w, the dimension-0 length of level s->ndeclevels - 1, is the row stride
 * used to index t. Levels are processed from s->ndeclevels - 1 down to 0;
 * at each level rows are filtered first, then columns.
 * Each line is staged in s->f_linebuf, filtered by sd_1d97_float() and
 * written back deinterleaved. On write-back one sample phase is scaled by
 * F_LFTG_X / 2 and the other by F_LFTG_K / 2.
 * NOTE(review): l is presumably an offset view into line; its definition
 * is not visible here. */
176 static void dwt_encode97_float(DWTContext *s, float *t)
179 w = s->linelen[s->ndeclevels-1][0];
180 float *line = s->f_linebuf;
183 for (lev = s->ndeclevels-1; lev >= 0; lev--){
184 int lh = s->linelen[lev][0],
185 lv = s->linelen[lev][1],
/* This path requires both start parities to be zero. */
191 av_assert1(!mh && !mv);
/* Horizontal pass: row lp of t, lh samples. */
194 for (lp = 0; lp < lv; lp++){
197 for (i = 0; i < lh; i++)
200 sd_1d97_float(line, mh, mh + lh);
202 // copy back and deinterleave
203 for (i = mh; i < lh; i+=2, j++)
204 t[w*lp + j] = F_LFTG_X * l[i] / 2;
205 for (i = 1-mh; i < lh; i+=2, j++)
206 t[w*lp + j] = F_LFTG_K * l[i] / 2;
/* Vertical pass: column lp of t, lv samples. */
211 for (lp = 0; lp < lh; lp++) {
214 for (i = 0; i < lv; i++)
217 sd_1d97_float(line, mv, mv + lv);
219 // copy back and deinterleave
220 for (i = mv; i < lv; i+=2, j++)
221 t[w*j + lp] = F_LFTG_X * l[i] / 2;
222 for (i = 1-mv; i < lv; i+=2, j++)
223 t[w*j + lp] = F_LFTG_K * l[i] / 2;
/* Forward 1D 9/7 lifting in 16.16 fixed point, in place, on the samples
 * of p from i0 up to (but not including) i1.
 * Every multiply has the form (x * I_LFTG_c + (1 << 15)) >> 16, i.e. a
 * rounded multiplication by the corresponding float parameter.
 * NOTE(review): the two scalings of p[1] and p[0] below presumably belong
 * to a short-range special case; their guarding conditions are not
 * visible here. */
228 static void sd_1d97_int(int *p, int i0, int i1)
234 p[1] = (p[1] * I_LFTG_X + (1<<15)) >> 16;
236 p[0] = (p[0] * I_LFTG_K + (1<<15)) >> 16;
240 extend97_int(p, i0, i1);
/* Four lifting steps, alternating odd and even samples
 * (alpha, beta, gamma, delta). */
243 for (i = i0/2 - 2; i < i1/2 + 1; i++)
244 p[2 * i + 1] -= (I_LFTG_ALPHA * (p[2 * i] + p[2 * i + 2]) + (1 << 15)) >> 16;
245 for (i = i0/2 - 1; i < i1/2 + 1; i++)
246 p[2 * i] -= (I_LFTG_BETA * (p[2 * i - 1] + p[2 * i + 1]) + (1 << 15)) >> 16;
247 for (i = i0/2 - 1; i < i1/2; i++)
248 p[2 * i + 1] += (I_LFTG_GAMMA * (p[2 * i] + p[2 * i + 2]) + (1 << 15)) >> 16;
249 for (i = i0/2; i < i1/2; i++)
250 p[2 * i] += (I_LFTG_DELTA * (p[2 * i - 1] + p[2 * i + 1]) + (1 << 15)) >> 16;
/* Forward 2D 9/7 transform of the integer samples in t, in place, using
 * fixed-point arithmetic.
 * w, the dimension-0 length of level s->ndeclevels - 1, is the row stride
 * used to index t. Levels are processed from s->ndeclevels - 1 down to 0;
 * at each level columns are filtered first, then rows.
 * Each line is staged in s->i_linebuf, filtered by sd_1d97_int() and
 * written back deinterleaved. On write-back ((x * c) + (1 << 16)) >> 17
 * scales by c / 2 with rounding: one sample phase uses I_LFTG_X, the
 * other I_LFTG_K.
 * NOTE(review): l is presumably an offset view into line; its definition
 * is not visible here. */
253 static void dwt_encode97_int(DWTContext *s, int *t)
256 w = s->linelen[s->ndeclevels-1][0];
257 int *line = s->i_linebuf;
260 for (lev = s->ndeclevels-1; lev >= 0; lev--){
261 int lh = s->linelen[lev][0],
262 lv = s->linelen[lev][1],
/* Vertical pass: column lp of t, lv samples. */
270 for (lp = 0; lp < lh; lp++) {
273 for (i = 0; i < lv; i++)
276 sd_1d97_int(line, mv, mv + lv);
278 // copy back and deinterleave
279 for (i = mv; i < lv; i+=2, j++)
280 t[w*j + lp] = ((l[i] * I_LFTG_X) + (1 << 16)) >> 17;
281 for (i = 1-mv; i < lv; i+=2, j++)
282 t[w*j + lp] = ((l[i] * I_LFTG_K) + (1 << 16)) >> 17;
/* Horizontal pass: row lp of t, lh samples. */
287 for (lp = 0; lp < lv; lp++){
290 for (i = 0; i < lh; i++)
293 sd_1d97_int(line, mh, mh + lh);
295 // copy back and deinterleave
296 for (i = mh; i < lh; i+=2, j++)
297 t[w*lp + j] = ((l[i] * I_LFTG_X) + (1 << 16)) >> 17;
298 for (i = 1-mh; i < lh; i+=2, j++)
299 t[w*lp + j] = ((l[i] * I_LFTG_K) + (1 << 16)) >> 17;
/* Inverse 1D 5/3 lifting, in place, on the samples of p from i0 up to
 * (but not including) i1. It applies the same two expressions as
 * sd_1d53() with opposite signs and in the opposite order.
 * NOTE(review): any short-range special case and the boundary extension
 * that precede the two loops are not visible here. */
305 static void sr_1d53(int *p, int i0, int i1)
/* Undo the update step on the even-indexed samples. */
317 for (i = i0 / 2; i < i1 / 2 + 1; i++)
318 p[2 * i] -= (p[2 * i - 1] + p[2 * i + 1] + 2) >> 2;
/* Undo the predict step on the odd-indexed samples. */
319 for (i = i0 / 2; i < i1 / 2; i++)
320 p[2 * i + 1] += (p[2 * i] + p[2 * i + 2]) >> 1;
/* Inverse 2D 5/3 transform of the integer coefficients in t, in place.
 * w, the dimension-0 length of level s->ndeclevels - 1, is the row stride
 * used to index t. Levels are processed from 0 up to s->ndeclevels - 1;
 * at each level rows are reconstructed first, then columns.
 * For each line the two deinterleaved halves stored in t are interleaved
 * into the line buffer, sr_1d53() is applied, and the result is copied
 * back.
 * NOTE(review): l is presumably an offset view into line, and mh/mv the
 * parities from s->mod; their definitions are not visible here. */
323 static void dwt_decode53(DWTContext *s, int *t)
326 int w = s->linelen[s->ndeclevels - 1][0];
327 int32_t *line = s->i_linebuf;
330 for (lev = 0; lev < s->ndeclevels; lev++) {
331 int lh = s->linelen[lev][0],
332 lv = s->linelen[lev][1],
/* Horizontal pass: row lp of t, lh samples. */
340 for (lp = 0; lp < lv; lp++) {
342 // copy with interleaving
343 for (i = mh; i < lh; i += 2, j++)
344 l[i] = t[w * lp + j];
345 for (i = 1 - mh; i < lh; i += 2, j++)
346 l[i] = t[w * lp + j];
348 sr_1d53(line, mh, mh + lh);
350 for (i = 0; i < lh; i++)
351 t[w * lp + i] = l[i];
/* Vertical pass: column lp of t, lv samples. */
356 for (lp = 0; lp < lh; lp++) {
358 // copy with interleaving
359 for (i = mv; i < lv; i += 2, j++)
360 l[i] = t[w * j + lp];
361 for (i = 1 - mv; i < lv; i += 2, j++)
362 l[i] = t[w * j + lp];
364 sr_1d53(line, mv, mv + lv);
366 for (i = 0; i < lv; i++)
367 t[w * i + lp] = l[i];
/* Inverse 1D 9/7 lifting in floating point, in place, on the samples of p
 * from i0 up to (but not including) i1.
 * After the symmetric extension, the four lifting steps of the forward
 * transform are undone in reverse order (delta, gamma, beta, alpha) with
 * opposite signs. The loop ranges shrink from step to step: the earlier
 * steps also cover extended samples that later steps read.
 * NOTE(review): any short-range special case before the extension is not
 * visible here. */
372 static void sr_1d97_float(float *p, int i0, int i1)
384 extend97_float(p, i0, i1);
/* Undo delta: even samples. */
386 for (i = i0 / 2 - 1; i < i1 / 2 + 2; i++)
387 p[2 * i] -= F_LFTG_DELTA * (p[2 * i - 1] + p[2 * i + 1]);
/* Undo gamma: odd samples. */
389 for (i = i0 / 2 - 1; i < i1 / 2 + 1; i++)
390 p[2 * i + 1] -= F_LFTG_GAMMA * (p[2 * i] + p[2 * i + 2]);
/* Undo beta: even samples. */
392 for (i = i0 / 2; i < i1 / 2 + 1; i++)
393 p[2 * i] += F_LFTG_BETA * (p[2 * i - 1] + p[2 * i + 1]);
/* Undo alpha: odd samples. */
395 for (i = i0 / 2; i < i1 / 2; i++)
396 p[2 * i + 1] += F_LFTG_ALPHA * (p[2 * i] + p[2 * i + 2]);
/* Inverse 2D 9/7 transform of float coefficients, using s->f_linebuf as
 * the line buffer.
 * w, the dimension-0 length of level s->ndeclevels - 1, is the row stride
 * used to index the coefficient array. Levels are processed from 0 up to
 * s->ndeclevels - 1; at each level rows are reconstructed first, then
 * columns.
 * While interleaving a line into the buffer, one sample phase is scaled
 * by F_LFTG_K and the other by F_LFTG_X; sr_1d97_float() is then applied
 * and the line is copied back unscaled.
 * NOTE(review): data is presumably an alias of t, and l an offset view
 * into line; their definitions are not visible here. */
399 static void dwt_decode97_float(DWTContext *s, float *t)
402 int w = s->linelen[s->ndeclevels - 1][0];
403 float *line = s->f_linebuf;
405 /* position at index 0 of line range [0-5,w+5] cf. extend function */
408 for (lev = 0; lev < s->ndeclevels; lev++) {
409 int lh = s->linelen[lev][0],
410 lv = s->linelen[lev][1],
/* Horizontal pass: row lp, lh samples. */
417 for (lp = 0; lp < lv; lp++) {
419 // copy with interleaving
420 for (i = mh; i < lh; i += 2, j++)
421 l[i] = data[w * lp + j] * F_LFTG_K;
422 for (i = 1 - mh; i < lh; i += 2, j++)
423 l[i] = data[w * lp + j] * F_LFTG_X;
425 sr_1d97_float(line, mh, mh + lh);
427 for (i = 0; i < lh; i++)
428 data[w * lp + i] = l[i];
/* Vertical pass: column lp, lv samples. */
433 for (lp = 0; lp < lh; lp++) {
435 // copy with interleaving
436 for (i = mv; i < lv; i += 2, j++)
437 l[i] = data[w * j + lp] * F_LFTG_K;
438 for (i = 1 - mv; i < lv; i += 2, j++)
439 l[i] = data[w * j + lp] * F_LFTG_X;
441 sr_1d97_float(line, mv, mv + lv);
443 for (i = 0; i < lv; i++)
444 data[w * i + lp] = l[i];
/* Inverse 1D 9/7 lifting in 16.16 fixed point, in place, on the samples
 * of p from i0 up to (but not including) i1.
 * After the symmetric extension, the four lifting steps of the forward
 * transform are undone in reverse order (delta, gamma, beta, alpha) with
 * opposite signs. Each multiply is (x * I_LFTG_c + (1 << 15)) >> 16, a
 * rounded fixed-point multiplication.
 * NOTE(review): the two scalings of p[1] and p[0] below (a rounded
 * multiply by c / 2) presumably belong to a short-range special case;
 * their guarding conditions are not visible here. */
449 static void sr_1d97_int(int32_t *p, int i0, int i1)
455 p[1] = (p[1] * I_LFTG_K + (1<<16)) >> 17;
457 p[0] = (p[0] * I_LFTG_X + (1<<16)) >> 17;
461 extend97_int(p, i0, i1);
/* Undo delta: even samples. */
463 for (i = i0 / 2 - 1; i < i1 / 2 + 2; i++)
464 p[2 * i] -= (I_LFTG_DELTA * (p[2 * i - 1] + p[2 * i + 1]) + (1 << 15)) >> 16;
/* Undo gamma: odd samples. */
466 for (i = i0 / 2 - 1; i < i1 / 2 + 1; i++)
467 p[2 * i + 1] -= (I_LFTG_GAMMA * (p[2 * i] + p[2 * i + 2]) + (1 << 15)) >> 16;
/* Undo beta: even samples. */
469 for (i = i0 / 2; i < i1 / 2 + 1; i++)
470 p[2 * i] += (I_LFTG_BETA * (p[2 * i - 1] + p[2 * i + 1]) + (1 << 15)) >> 16;
/* Undo alpha: odd samples. */
472 for (i = i0 / 2; i < i1 / 2; i++)
473 p[2 * i + 1] += (I_LFTG_ALPHA * (p[2 * i] + p[2 * i + 2]) + (1 << 15)) >> 16;
/* Inverse 2D 9/7 transform of integer coefficients in fixed-point
 * arithmetic, using s->i_linebuf as the line buffer.
 * w, the dimension-0 length of level s->ndeclevels - 1, is the row stride
 * used to index the coefficient array. Levels are processed from 0 up to
 * s->ndeclevels - 1; at each level rows are reconstructed first, then
 * columns.
 * While interleaving a line into the buffer, one sample phase is scaled
 * by I_LFTG_K and the other by I_LFTG_X, each as a rounded 16.16
 * multiply; sr_1d97_int() is then applied and the line is copied back
 * unscaled.
 * NOTE(review): data is presumably an alias of t, and l an offset view
 * into line; their definitions are not visible here. */
476 static void dwt_decode97_int(DWTContext *s, int32_t *t)
479 int w = s->linelen[s->ndeclevels - 1][0];
480 int32_t *line = s->i_linebuf;
482 /* position at index 0 of line range [0-5,w+5] cf. extend function */
485 for (lev = 0; lev < s->ndeclevels; lev++) {
486 int lh = s->linelen[lev][0],
487 lv = s->linelen[lev][1],
/* Horizontal pass: row lp, lh samples. */
494 for (lp = 0; lp < lv; lp++) {
496 // rescale with interleaving
497 for (i = mh; i < lh; i += 2, j++)
498 l[i] = ((data[w * lp + j] * I_LFTG_K) + (1 << 15)) >> 16;
499 for (i = 1 - mh; i < lh; i += 2, j++)
500 l[i] = ((data[w * lp + j] * I_LFTG_X) + (1 << 15)) >> 16;
502 sr_1d97_int(line, mh, mh + lh);
504 for (i = 0; i < lh; i++)
505 data[w * lp + i] = l[i];
/* Vertical pass: column lp, lv samples. */
510 for (lp = 0; lp < lh; lp++) {
512 // rescale with interleaving
513 for (i = mv; i < lv; i += 2, j++)
514 l[i] = ((data[w * j + lp] * I_LFTG_K) + (1 << 15)) >> 16;
515 for (i = 1 - mv; i < lv; i += 2, j++)
516 l[i] = ((data[w * j + lp] * I_LFTG_X) + (1 << 15)) >> 16;
518 sr_1d97_int(line, mv, mv + lv);
520 for (i = 0; i < lv; i++)
521 data[w * i + lp] = l[i];
/* Initialise a DWT context.
 *
 * s             context to fill in
 * border        border[d][0] / border[d][1] are the start / end coordinates
 *               along dimension d; the line length is end - start
 * decomp_levels number of decomposition levels, stored in s->ndeclevels
 * type          transform variant; presumably selects which line buffer
 *               is allocated below (the selecting code is not visible here)
 *
 * For each level the line length and the parity of the start coordinate
 * are recorded per dimension in s->linelen and s->mod, after which the
 * borders are halved, rounding up, for the next coarser level.
 *
 * Returns AVERROR(ENOMEM) when a line buffer cannot be allocated.
 * NOTE(review): the success return value and the handling of an unknown
 * type are not visible here. */
526 int ff_jpeg2000_dwt_init(DWTContext *s, uint16_t border[2][2],
527 int decomp_levels, int type)
529 int i, j, lev = decomp_levels, maxlen,
532 s->ndeclevels = decomp_levels;
/* Work on a local copy so the caller's border array is left untouched. */
535 for (i = 0; i < 2; i++)
536 for (j = 0; j < 2; j++)
537 b[i][j] = border[i][j];
/* maxlen sizes the line buffers. */
539 maxlen = FFMAX(b[0][1] - b[0][0],
542 for (i = 0; i < 2; i++) {
543 s->linelen[lev][i] = b[i][1] - b[i][0];
544 s->mod[lev][i] = b[i][0] & 1;
545 for (j = 0; j < 2; j++)
546 b[i][j] = (b[i][j] + 1) >> 1;
/* The line buffers carry extra samples beyond maxlen for the boundary
 * extension: 12 for the two 9/7 allocations, 6 for the last one
 * (presumably the 5/3 case). */
550 s->f_linebuf = av_malloc_array((maxlen + 12), sizeof(*s->f_linebuf));
552 return AVERROR(ENOMEM);
555 s->i_linebuf = av_malloc_array((maxlen + 12), sizeof(*s->i_linebuf));
557 return AVERROR(ENOMEM);
560 s->i_linebuf = av_malloc_array((maxlen + 6), sizeof(*s->i_linebuf));
562 return AVERROR(ENOMEM);
/* Run the forward transform on t using the context s.
 * Dispatches to the float 9/7, integer 9/7 or 5/3 encoder; t is passed on
 * unchanged, so it must point to samples of the element type the selected
 * encoder expects (float for dwt_encode97_float, int otherwise).
 * NOTE(review): the selector (presumably the transform type stored in s)
 * and the return values are not visible here. */
570 int ff_dwt_encode(DWTContext *s, void *t)
574 dwt_encode97_float(s, t); break;
576 dwt_encode97_int(s, t); break;
578 dwt_encode53(s, t); break;
/* Run the inverse transform on t using the context s.
 * Dispatches to the decoder matching the transform variant; t is passed
 * on unchanged, so it must point to coefficients of the element type the
 * selected decoder expects (float for dwt_decode97_float, int32_t for
 * dwt_decode97_int).
 * NOTE(review): the selector, the 5/3 branch and the return values are
 * not visible here. */
585 int ff_dwt_decode(DWTContext *s, void *t)
589 dwt_decode97_float(s, t);
592 dwt_decode97_int(s, t);
/* Release the line buffers owned by the context.
 * av_freep() frees the buffer and resets the pointer to NULL, so calling
 * this again on the same context is harmless. */
603 void ff_dwt_destroy(DWTContext *s)
605 av_freep(&s->f_linebuf);
606 av_freep(&s->i_linebuf);
611 #include "libavutil/lfg.h"
/* Round-trip self test: initialise a context for the given border,
 * decomp_levels and type, encode array in place, decode it again, and
 * compare every one of the MAX_W * MAX_W entries against ref.
 * An entry whose absolute difference from ref exceeds max_diff is
 * reported on stderr.
 * NOTE(review): the return values and the cleanup of the context are not
 * visible here. */
615 static int test_dwt(int *array, int *ref, uint16_t border[2][2], int decomp_levels, int type, int max_diff) {
617 DWTContext s1={{{0}}}, *s= &s1;
619 ret = ff_jpeg2000_dwt_init(s, border, decomp_levels, type);
621 fprintf(stderr, "ff_jpeg2000_dwt_init failed\n");
624 ret = ff_dwt_encode(s, array);
626 fprintf(stderr, "ff_dwt_encode failed\n");
629 ret = ff_dwt_decode(s, array);
/* NOTE(review): the message below names ff_dwt_encode although the call
 * that failed is ff_dwt_decode -- looks like a copy-paste slip. */
631 fprintf(stderr, "ff_dwt_encode failed\n");
634 for (j = 0; j<MAX_W * MAX_W; j++) {
635 if (FFABS(array[j] - ref[j]) > max_diff) {
/* NOTE(review): "missmatch" in the message is a typo for "mismatch". */
636 fprintf(stderr, "missmatch at %d (%d != %d) decomp:%d border %d %d %d %d\n",
637 j, array[j], ref[j],decomp_levels, border[0][0], border[0][1], border[1][0], border[1][1]);
648 int array[MAX_W * MAX_W];
649 int ref [MAX_W * MAX_W];
652 uint16_t border[2][2];
653 int ret, decomp_levels;
655 av_lfg_init(&prng, 1);
657 for (i = 0; i<MAX_W * MAX_W; i++)
658 array[i] = ref[i] = av_lfg_get(&prng) % 2048;
660 for (i = 0; i < 40; i++) {
662 border[j>>1][j&1] = av_lfg_get(&prng) % MAX_W;
663 if (border[0][0] >= border[0][1] || border[1][0] >= border[1][1])
665 decomp_levels = av_lfg_get(&prng) % FF_DWT_MAX_DECLVLS;
667 ret = test_dwt(array, ref, border, decomp_levels, FF_DWT53, 0);
670 ret = test_dwt(array, ref, border, decomp_levels, FF_DWT97_INT, FFMIN(7+5*decomp_levels, 15+3*decomp_levels));