2 * Copyright (c) 2015 James Almer
4 * This file is part of FFmpeg.
6 * FFmpeg is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
11 * FFmpeg is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
16 * You should have received a copy of the GNU General Public License along
17 * with FFmpeg; if not, write to the Free Software Foundation, Inc.,
18 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
22 #include "libavutil/common.h"
23 #include "libavutil/fixed_dsp.h"
24 #include "libavutil/internal.h"
25 #include "libavutil/mem.h"
/*
 * randomize_buffers(): fills the arrays named src0, src1 and src2 at the
 * expansion site. Each of the BUF_SIZE elements of every array is assigned
 * sign_extend(rnd(), 24).
 *
 * The macro takes no arguments; it relies on src0, src1, src2 and the loop
 * index i being in scope where it is expanded.
 *
 * NOTE(review): sign_extend() and rnd() are defined outside this section;
 * presumably the result is a random signed 24-bit value - confirm.
 * NOTE(review): the declaration of i and the terminator of the for-body are
 * not present in the lines below - confirm against the complete macro.
 */
29 #define randomize_buffers() \
32 for (i = 0; i < BUF_SIZE; i++) { \
33 src0[i] = sign_extend(rnd(), 24); \
34 src1[i] = sign_extend(rnd(), 24); \
35 src2[i] = sign_extend(rnd(), 24); \
/*
 * Checks a function with the prototype
 *     void f(int *dst, const int *src0, const int *src1, int len)
 * by running it through call_ref and call_new on the same inputs and
 * comparing the two output buffers.
 *
 * src0, src1: input arrays; BUF_SIZE is passed as len in every call.
 *
 * checkasm_check_fixed_dsp() uses this helper for both vector_fmul and
 * vector_fmul_reverse.
 *
 * NOTE(review): call_ref / call_new / bench_new are macros defined outside
 * this section; by their names they run the reference implementation, the
 * implementation under test, and a benchmark of the latter - confirm.
 */
39 static void check_vector_fmul(const int *src0, const int *src1)
/* Separate output buffers so the two results can be compared afterwards. */
41 LOCAL_ALIGNED_32(int, ref, [BUF_SIZE]);
42 LOCAL_ALIGNED_32(int, new, [BUF_SIZE]);
/* Return type and parameter list of the function being checked. */
44 declare_func(void, int *dst, const int *src0, const int *src1, int len);
/* Same sources and length for both calls; only the destination differs. */
46 call_ref(ref, src0, src1, BUF_SIZE);
47 call_new(new, src0, src1, BUF_SIZE);
/*
 * memcmp() is non-zero when the buffers differ in any byte.
 * NOTE(review): no statement guarded by this condition is present between
 * this line and bench_new() - confirm a failure report belongs here.
 */
48 if (memcmp(ref, new, BUF_SIZE * sizeof(int)))
/* Benchmark call uses exactly the arguments given to call_new above. */
50 bench_new(new, src0, src1, BUF_SIZE);
/*
 * Checks a function with the prototype
 *     void f(int *dst, const int *src0, const int *src1,
 *            const int *src2, int len)
 * by running it through call_ref and call_new on the same inputs and
 * comparing the two output buffers.
 *
 * src0, src1, src2: input arrays; BUF_SIZE is passed as len in every call.
 *
 * NOTE(review): call_ref / call_new / bench_new are macros defined outside
 * this section; by their names they run the reference implementation, the
 * implementation under test, and a benchmark of the latter - confirm.
 */
53 static void check_vector_fmul_add(const int *src0, const int *src1, const int *src2)
/* One output buffer per variant. */
55 LOCAL_ALIGNED_32(int, ref, [BUF_SIZE]);
56 LOCAL_ALIGNED_32(int, new, [BUF_SIZE]);
/* Return type and parameter list of the function being checked. */
58 declare_func(void, int *dst, const int *src0, const int *src1, const int *src2, int len);
/* All three sources are forwarded unchanged to both variants. */
60 call_ref(ref, src0, src1, src2, BUF_SIZE);
61 call_new(new, src0, src1, src2, BUF_SIZE);
/*
 * Byte-wise comparison of the complete output buffers.
 * NOTE(review): no statement guarded by this condition is present between
 * this line and bench_new() - confirm a failure report belongs here.
 */
62 if (memcmp(ref, new, BUF_SIZE * sizeof(int)))
/* Benchmark call uses exactly the arguments given to call_new above. */
64 bench_new(new, src0, src1, src2, BUF_SIZE);
/*
 * Checks a function with the prototype
 *     void f(int32_t *dst, const int32_t *src0, const int32_t *src1,
 *            const int32_t *win, int len)
 * by running it through call_ref and call_new on the same inputs and
 * comparing the two output buffers.
 *
 * src0, src1: input arrays.
 * win:        array passed as the win argument of the checked function.
 *
 * The length argument is BUF_SIZE / 2, while the comparison covers all
 * BUF_SIZE output elements.
 * NOTE(review): this suggests the function writes 2 * len outputs - confirm
 * against the vector_fmul_window contract.
 */
67 static void check_vector_fmul_window(const int32_t *src0, const int32_t *src1, const int32_t *win)
/* One output buffer per variant, BUF_SIZE int32_t elements each. */
69 LOCAL_ALIGNED_32(int32_t, ref, [BUF_SIZE]);
70 LOCAL_ALIGNED_32(int32_t, new, [BUF_SIZE]);
/* Return type and parameter list of the function being checked. */
72 declare_func(void, int32_t *dst, const int32_t *src0, const int32_t *src1, const int32_t *win, int len);
/* Note the halved length: len = BUF_SIZE / 2. */
74 call_ref(ref, src0, src1, win, BUF_SIZE / 2);
75 call_new(new, src0, src1, win, BUF_SIZE / 2);
/*
 * Compares the full BUF_SIZE elements, not just len of them.
 * NOTE(review): no statement guarded by this condition is present between
 * this line and bench_new() - confirm a failure report belongs here.
 */
76 if (memcmp(ref, new, BUF_SIZE * sizeof(int32_t)))
/* Benchmark call uses exactly the arguments given to call_new above. */
78 bench_new(new, src0, src1, win, BUF_SIZE / 2);
/*
 * Checks a function with the prototype
 *     void f(int16_t *dst, const int32_t *src0, const int32_t *src1,
 *            const int32_t *win, int len, uint8_t bits)
 * by running it through call_ref and call_new on the same inputs and
 * comparing the two output buffers.
 *
 * src0, src1: 32-bit input arrays.
 * win:        array passed as the win argument of the checked function.
 *
 * Unlike the other helpers in this file the output element type is int16_t.
 * The calls pass len = BUF_SIZE / 2 and bits = 2, and the comparison covers
 * all BUF_SIZE output elements.
 * NOTE(review): the meaning of bits is not shown here; presumably a scaling
 * shift - confirm against the vector_fmul_window_scaled contract.
 */
81 static void check_vector_fmul_window_scaled(const int32_t *src0, const int32_t *src1, const int32_t *win)
/* 16-bit output buffers, declared through LOCAL_ALIGNED_16. */
83 LOCAL_ALIGNED_16(int16_t, ref, [BUF_SIZE]);
84 LOCAL_ALIGNED_16(int16_t, new, [BUF_SIZE]);
/* Return type and parameter list of the function being checked. */
86 declare_func(void, int16_t *dst, const int32_t *src0, const int32_t *src1, const int32_t *win, int len, uint8_t bits);
/* Final argument (2) is the bits parameter; identical for both variants. */
88 call_ref(ref, src0, src1, win, BUF_SIZE / 2, 2);
89 call_new(new, src0, src1, win, BUF_SIZE / 2, 2);
/*
 * Compares BUF_SIZE int16_t elements.
 * NOTE(review): no statement guarded by this condition is present between
 * this line and bench_new() - confirm a failure report belongs here.
 */
90 if (memcmp(ref, new, BUF_SIZE * sizeof(int16_t)))
/* Benchmark call uses exactly the arguments given to call_new above. */
92 bench_new(new, src0, src1, win, BUF_SIZE / 2, 2);
/*
 * Checks a function with the prototype
 *     void f(int *av_restrict src0, int *av_restrict src1, int len)
 *
 * Both pointer parameters of the checked function are non-const, so the
 * helper never hands it the caller's arrays: it works on private copies
 * (ref0/ref1 for call_ref, new0/new1 for call_new) and compares both pairs
 * afterwards.
 *
 * src0, src1: input arrays; only read here (copied with memcpy).
 */
95 static void check_butterflies(const int *src0, const int *src1)
/* Two working buffers per variant, one for each pointer argument. */
97 LOCAL_ALIGNED_16(int, ref0, [BUF_SIZE]);
98 LOCAL_ALIGNED_16(int, ref1, [BUF_SIZE]);
99 LOCAL_ALIGNED_16(int, new0, [BUF_SIZE]);
100 LOCAL_ALIGNED_16(int, new1, [BUF_SIZE]);
/* Return type and parameter list of the function being checked. */
102 declare_func(void, int *av_restrict src0, int *av_restrict src1, int len);
/* Give both variants identical starting contents. */
104 memcpy(ref0, src0, BUF_SIZE * sizeof(*src0));
105 memcpy(ref1, src1, BUF_SIZE * sizeof(*src1));
106 memcpy(new0, src0, BUF_SIZE * sizeof(*src0));
107 memcpy(new1, src1, BUF_SIZE * sizeof(*src1));
/* Each variant operates on its own pair of buffers. */
109 call_ref(ref0, ref1, BUF_SIZE);
110 call_new(new0, new1, BUF_SIZE);
/*
 * Either buffer differing makes the condition true.
 * NOTE(review): no statement guarded by this condition is present between
 * this line and the memcpy() calls below - confirm a failure report
 * belongs here.
 */
111 if (memcmp(ref0, new0, BUF_SIZE * sizeof(*ref0)) ||
112 memcmp(ref1, new1, BUF_SIZE * sizeof(*ref1)))
/*
 * Reload new0/new1 from the sources before benchmarking, so bench_new()
 * starts from the original inputs rather than from call_new()'s results.
 */
114 memcpy(new0, src0, BUF_SIZE * sizeof(*src0));
115 memcpy(new1, src1, BUF_SIZE * sizeof(*src1));
116 bench_new(new0, new1, BUF_SIZE);
/*
 * Checks a function with the prototype
 *     int f(const int *src0, const int *src1, int len)
 * The value returned through call_ref is stored in ref and the value
 * returned through call_new in new; no output buffer is involved.
 *
 * src0, src1: input arrays; BUF_SIZE is passed as len in every call.
 *
 * NOTE(review): neither the declaration of ref/new nor a comparison of the
 * two values is present in the lines below - confirm both exist.
 */
119 static void check_scalarproduct_fixed(const int *src0, const int *src1)
/* Return type and parameter list of the function being checked. */
123 declare_func(int, const int *src0, const int *src1, int len);
/* Capture the scalar result of each variant. */
125 ref = call_ref(src0, src1, BUF_SIZE);
126 new = call_new(src0, src1, BUF_SIZE);
/* Benchmark call; its return value is not used. */
129 bench_new(src0, src1, BUF_SIZE);
/*
 * Entry point of the fixed-point DSP checks.
 *
 * Obtains an AVFixedDSPContext and, for each function pointer in it, runs
 * the matching check_* helper when check_func() returns non-zero for that
 * pointer. Results are reported in three groups through report():
 * "vector_fmul", "butterflies_fixed" and "scalarproduct_fixed".
 */
132 void checkasm_check_fixed_dsp(void)
/*
 * Shared input arrays handed to every helper.
 * NOTE(review): no statement that fills these arrays is present between
 * their declaration and first use - confirm randomize_buffers() is invoked.
 */
134 LOCAL_ALIGNED_32(int32_t, src0, [BUF_SIZE]);
135 LOCAL_ALIGNED_32(int32_t, src1, [BUF_SIZE]);
136 LOCAL_ALIGNED_32(int32_t, src2, [BUF_SIZE]);
/*
 * NOTE(review): the argument 1 is presumably a "bit exact" flag - confirm
 * against libavutil/fixed_dsp.h.
 * NOTE(review): fdsp is dereferenced below without a visible NULL check,
 * and no release of fdsp is visible in this range - confirm both.
 */
137 AVFixedDSPContext *fdsp = avpriv_alloc_fixed_dsp(1);
/* Group 1: the vector_fmul family, reported together further down. */
140 if (check_func(fdsp->vector_fmul, "vector_fmul_fixed"))
141 check_vector_fmul(src0, src1);
142 if (check_func(fdsp->vector_fmul_add, "vector_fmul_add_fixed"))
143 check_vector_fmul_add(src0, src1, src2);
/* vector_fmul_reverse is exercised with the same helper as vector_fmul. */
144 if (check_func(fdsp->vector_fmul_reverse, "vector_fmul_reverse_fixed"))
145 check_vector_fmul(src0, src1);
/* src2 is passed as the win argument of the two window helpers. */
146 if (check_func(fdsp->vector_fmul_window, "vector_fmul_window_fixed"))
147 check_vector_fmul_window(src0, src1, src2);
148 if (check_func(fdsp->vector_fmul_window_scaled, "vector_fmul_window_scaled_fixed"))
149 check_vector_fmul_window_scaled(src0, src1, src2);
150 report("vector_fmul");
/* Group 2: butterflies. */
151 if (check_func(fdsp->butterflies_fixed, "butterflies_fixed"))
152 check_butterflies(src0, src1);
153 report("butterflies_fixed");
/* Group 3: scalar product. */
154 if (check_func(fdsp->scalarproduct_fixed, "scalarproduct_fixed"))
155 check_scalarproduct_fixed(src0, src1);
156 report("scalarproduct_fixed");