/*
 * Copyright (c) 2015 Shivraj Patil (Shivraj.Patil@imgtec.com)
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
#ifndef AVCODEC_MIPS_VP9DSP_MIPS_H
#define AVCODEC_MIPS_VP9DSP_MIPS_H
/*
 * Declare the six MSA 8-tap filter prototypes for one (SIZE, type) pair:
 * ff_{put,avg}_8tap_<type>_<SIZE>{h,v,hv}_msa.
 *
 * SIZE     - token pasted into the function name after the filter type
 * type     - filter-type token pasted into the function name
 * type_idx - not referenced by the expansion; retained so that existing
 *            three-argument invocations keep compiling
 *
 * Every prototype takes the same (dst, dststride, src, srcstride, h, mx, my)
 * parameter list as the bilinear and copy/avg prototypes in this header.
 * The expansion has no trailing ';' -- the invocation supplies it, which
 * avoids an empty declaration at file scope.
 */
#define VP9_8TAP_MIPS_MSA_FUNC(SIZE, type, type_idx)                    \
    void ff_put_8tap_##type##_##SIZE##h_msa(                            \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_put_8tap_##type##_##SIZE##v_msa(                            \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_put_8tap_##type##_##SIZE##hv_msa(                           \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_avg_8tap_##type##_##SIZE##h_msa(                            \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_avg_8tap_##type##_##SIZE##v_msa(                            \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_avg_8tap_##type##_##SIZE##hv_msa(                           \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my)
/*
 * Declare the six MSA bilinear filter prototypes for one SIZE:
 * ff_{put,avg}_bilin_<SIZE>{h,v,hv}_msa.
 *
 * SIZE - token pasted into the function name
 *
 * All six share the (dst, dststride, src, srcstride, h, mx, my) parameter
 * list. The expansion has no trailing ';' -- the invocation supplies it,
 * which avoids an empty declaration at file scope.
 */
#define VP9_BILINEAR_MIPS_MSA_FUNC(SIZE)                                \
    void ff_put_bilin_##SIZE##h_msa(                                    \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_put_bilin_##SIZE##v_msa(                                    \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_put_bilin_##SIZE##hv_msa(                                   \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_avg_bilin_##SIZE##h_msa(                                    \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_avg_bilin_##SIZE##v_msa(                                    \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_avg_bilin_##SIZE##hv_msa(                                   \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my)
/*
 * Declare the MSA ff_copy<SIZE>_msa and ff_avg<SIZE>_msa prototypes.
 *
 * SIZE - token pasted into the function name
 *
 * Both use the same (dst, dststride, src, srcstride, h, mx, my) parameter
 * list as the filter prototypes in this header. The expansion has no
 * trailing ';' -- the invocation supplies it, which avoids an empty
 * declaration at file scope.
 */
#define VP9_COPY_AVG_MIPS_MSA_FUNC(SIZE)                                \
    void ff_copy##SIZE##_msa(                                           \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my);                                         \
    void ff_avg##SIZE##_msa(                                            \
        uint8_t *dst, ptrdiff_t dststride,                              \
        const uint8_t *src, ptrdiff_t srcstride,                        \
        int h, int mx, int my)
89 VP9_8TAP_MIPS_MSA_FUNC(64, regular, FILTER_8TAP_REGULAR);
90 VP9_8TAP_MIPS_MSA_FUNC(32, regular, FILTER_8TAP_REGULAR);
91 VP9_8TAP_MIPS_MSA_FUNC(16, regular, FILTER_8TAP_REGULAR);
92 VP9_8TAP_MIPS_MSA_FUNC(8, regular, FILTER_8TAP_REGULAR);
93 VP9_8TAP_MIPS_MSA_FUNC(4, regular, FILTER_8TAP_REGULAR);
95 VP9_8TAP_MIPS_MSA_FUNC(64, sharp, FILTER_8TAP_SHARP);
96 VP9_8TAP_MIPS_MSA_FUNC(32, sharp, FILTER_8TAP_SHARP);
97 VP9_8TAP_MIPS_MSA_FUNC(16, sharp, FILTER_8TAP_SHARP);
98 VP9_8TAP_MIPS_MSA_FUNC(8, sharp, FILTER_8TAP_SHARP);
99 VP9_8TAP_MIPS_MSA_FUNC(4, sharp, FILTER_8TAP_SHARP);
101 VP9_8TAP_MIPS_MSA_FUNC(64, smooth, FILTER_8TAP_SMOOTH);
102 VP9_8TAP_MIPS_MSA_FUNC(32, smooth, FILTER_8TAP_SMOOTH);
103 VP9_8TAP_MIPS_MSA_FUNC(16, smooth, FILTER_8TAP_SMOOTH);
104 VP9_8TAP_MIPS_MSA_FUNC(8, smooth, FILTER_8TAP_SMOOTH);
105 VP9_8TAP_MIPS_MSA_FUNC(4, smooth, FILTER_8TAP_SMOOTH);
107 VP9_BILINEAR_MIPS_MSA_FUNC(64);
108 VP9_BILINEAR_MIPS_MSA_FUNC(32);
109 VP9_BILINEAR_MIPS_MSA_FUNC(16);
110 VP9_BILINEAR_MIPS_MSA_FUNC(8);
111 VP9_BILINEAR_MIPS_MSA_FUNC(4);
113 VP9_COPY_AVG_MIPS_MSA_FUNC(64);
114 VP9_COPY_AVG_MIPS_MSA_FUNC(32);
115 VP9_COPY_AVG_MIPS_MSA_FUNC(16);
116 VP9_COPY_AVG_MIPS_MSA_FUNC(8);
117 VP9_COPY_AVG_MIPS_MSA_FUNC(4);
119 #undef VP9_8TAP_MIPS_MSA_FUNC
120 #undef VP9_BILINEAR_MIPS_MSA_FUNC
121 #undef VP9_COPY_AVG_MIPS_MSA_FUNC
/*
 * MSA loop-filter prototypes.
 *
 * All sixteen functions share one signature: a destination pixel pointer, its
 * stride, and three int32_t parameters e, i and h.
 * NOTE(review): e/i/h are presumably the edge, interior and high-variance
 * thresholds of the VP9 loop filter -- confirm against the implementation.
 * The h/v infix and the numeric suffixes are part of the exported symbol
 * names and must match the definitions.
 */
void ff_loop_filter_h_4_8_msa(uint8_t *dst, ptrdiff_t stride,
                              int32_t e, int32_t i, int32_t h);
void ff_loop_filter_h_8_8_msa(uint8_t *dst, ptrdiff_t stride,
                              int32_t e, int32_t i, int32_t h);
void ff_loop_filter_h_16_8_msa(uint8_t *dst, ptrdiff_t stride,
                               int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_4_8_msa(uint8_t *dst, ptrdiff_t stride,
                              int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_8_8_msa(uint8_t *dst, ptrdiff_t stride,
                              int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_16_8_msa(uint8_t *dst, ptrdiff_t stride,
                               int32_t e, int32_t i, int32_t h);

void ff_loop_filter_h_44_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_h_88_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_h_16_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_44_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_88_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_16_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);

void ff_loop_filter_h_48_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_h_84_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_48_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
void ff_loop_filter_v_84_16_msa(uint8_t *dst, ptrdiff_t stride,
                                int32_t e, int32_t i, int32_t h);
/*
 * MSA inverse-transform prototypes.
 *
 * Every function takes a destination pixel pointer, its stride, a pointer to
 * an int16_t coefficient block and an int eob.
 * NOTE(review): the "_add" suffix suggests the result is added into dst, and
 * eob is presumably the end-of-block coefficient index -- confirm against
 * the implementation.
 * The destination parameter is named dst throughout for consistency.
 */
void ff_idct_idct_4x4_add_msa(uint8_t *dst, ptrdiff_t stride,
                              int16_t *block, int eob);
void ff_idct_idct_8x8_add_msa(uint8_t *dst, ptrdiff_t stride,
                              int16_t *block, int eob);
void ff_idct_idct_16x16_add_msa(uint8_t *dst, ptrdiff_t stride,
                                int16_t *block, int eob);
void ff_idct_idct_32x32_add_msa(uint8_t *dst, ptrdiff_t stride,
                                int16_t *block, int eob);

void ff_iadst_iadst_4x4_add_msa(uint8_t *dst, ptrdiff_t stride,
                                int16_t *block, int eob);
void ff_iadst_iadst_8x8_add_msa(uint8_t *dst, ptrdiff_t stride,
                                int16_t *block, int eob);
void ff_iadst_iadst_16x16_add_msa(uint8_t *dst, ptrdiff_t stride,
                                  int16_t *block, int eob);

void ff_iadst_idct_4x4_add_msa(uint8_t *dst, ptrdiff_t stride,
                               int16_t *block, int eob);
void ff_iadst_idct_8x8_add_msa(uint8_t *dst, ptrdiff_t stride,
                               int16_t *block, int eob);
void ff_iadst_idct_16x16_add_msa(uint8_t *dst, ptrdiff_t stride,
                                 int16_t *block, int eob);

void ff_idct_iadst_4x4_add_msa(uint8_t *dst, ptrdiff_t stride,
                               int16_t *block, int eob);
void ff_idct_iadst_8x8_add_msa(uint8_t *dst, ptrdiff_t stride,
                               int16_t *block, int eob);
void ff_idct_iadst_16x16_add_msa(uint8_t *dst, ptrdiff_t stride,
                                 int16_t *block, int eob);

void ff_iwht_iwht_4x4_add_msa(uint8_t *dst, ptrdiff_t stride,
                              int16_t *block, int eob);
/*
 * MSA intra-prediction prototypes.
 *
 * Every function uses the same four-parameter signature:
 * (uint8_t *dst, ptrdiff_t stride, const uint8_t *left, const uint8_t *top).
 * NOTE(review): left/top are presumably the neighbouring edge pixels used as
 * predictors -- confirm against the implementation.
 */
void ff_vert_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                       const uint8_t *left, const uint8_t *top);
void ff_vert_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                       const uint8_t *left, const uint8_t *top);
void ff_hor_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                      const uint8_t *left, const uint8_t *top);
void ff_hor_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                      const uint8_t *left, const uint8_t *top);

void ff_dc_4x4_msa(uint8_t *dst, ptrdiff_t stride,
                   const uint8_t *left, const uint8_t *top);
void ff_dc_8x8_msa(uint8_t *dst, ptrdiff_t stride,
                   const uint8_t *left, const uint8_t *top);
void ff_dc_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                     const uint8_t *left, const uint8_t *top);
void ff_dc_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                     const uint8_t *left, const uint8_t *top);

void ff_dc_left_4x4_msa(uint8_t *dst, ptrdiff_t stride,
                        const uint8_t *left, const uint8_t *top);
void ff_dc_left_8x8_msa(uint8_t *dst, ptrdiff_t stride,
                        const uint8_t *left, const uint8_t *top);
void ff_dc_left_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                          const uint8_t *left, const uint8_t *top);
void ff_dc_left_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                          const uint8_t *left, const uint8_t *top);

void ff_dc_top_4x4_msa(uint8_t *dst, ptrdiff_t stride,
                       const uint8_t *left, const uint8_t *top);
void ff_dc_top_8x8_msa(uint8_t *dst, ptrdiff_t stride,
                       const uint8_t *left, const uint8_t *top);
void ff_dc_top_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);
void ff_dc_top_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);

void ff_dc_128_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);
void ff_dc_128_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);
void ff_dc_127_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);
void ff_dc_127_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);
void ff_dc_129_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);
void ff_dc_129_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                         const uint8_t *left, const uint8_t *top);

void ff_tm_4x4_msa(uint8_t *dst, ptrdiff_t stride,
                   const uint8_t *left, const uint8_t *top);
void ff_tm_8x8_msa(uint8_t *dst, ptrdiff_t stride,
                   const uint8_t *left, const uint8_t *top);
void ff_tm_16x16_msa(uint8_t *dst, ptrdiff_t stride,
                     const uint8_t *left, const uint8_t *top);
void ff_tm_32x32_msa(uint8_t *dst, ptrdiff_t stride,
                     const uint8_t *left, const uint8_t *top);
#endif // #ifndef AVCODEC_MIPS_VP9DSP_MIPS_H