FFmpeg  4.4.4
h264_intrapred_init.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2010 Fiona Glaser <fiona@x264.com>
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include "libavutil/attributes.h"
22 #include "libavutil/cpu.h"
23 #include "libavutil/x86/cpu.h"
24 #include "libavcodec/avcodec.h"
25 #include "libavcodec/h264pred.h"
26 
/*
 * Emits the prototype of one 4x4 intra predictor. The function name is
 * token-pasted as ff_pred4x4_<TYPE>_<DEPTH>_<OPT>, and every variant shares
 * the argument list (uint8_t *src, const uint8_t *topright, ptrdiff_t stride).
 * The expansion already ends in ';', so invocations are written without one.
 * No function bodies appear in this file -- presumably they come from
 * separately built x86 assembly (TODO confirm).
 */
27 #define PRED4x4(TYPE, DEPTH, OPT) \
28 void ff_pred4x4_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
29  const uint8_t *topright, \
30  ptrdiff_t stride);
31 
/*
 * Prototypes of the 10-bit 4x4 predictors (DEPTH == 10). The last argument
 * names the CPU extension variant; the init function below installs each
 * one into h->pred4x4[] under the matching EXTERNAL_*(cpu_flags) check in
 * its bit_depth == 10 branch.
 */
32 PRED4x4(dc, 10, mmxext)
33 PRED4x4(down_left, 10, sse2)
34 PRED4x4(down_left, 10, avx)
35 PRED4x4(down_right, 10, sse2)
36 PRED4x4(down_right, 10, ssse3)
37 PRED4x4(down_right, 10, avx)
38 PRED4x4(vertical_left, 10, sse2)
39 PRED4x4(vertical_left, 10, avx)
40 PRED4x4(vertical_right, 10, sse2)
41 PRED4x4(vertical_right, 10, ssse3)
42 PRED4x4(vertical_right, 10, avx)
43 PRED4x4(horizontal_up, 10, mmxext)
44 PRED4x4(horizontal_down, 10, sse2)
45 PRED4x4(horizontal_down, 10, ssse3)
46 PRED4x4(horizontal_down, 10, avx)
47 
/*
 * Emits the prototype of one 8x8 predictor named
 * ff_pred8x8_<TYPE>_<DEPTH>_<OPT>, taking (uint8_t *src, ptrdiff_t stride).
 * The expansion already ends in ';', so invocations are written without one.
 * In the init function below the visible 8/10-bit vertical, horizontal,
 * plane, dc and top_dc pred8x8[] entries are installed only when
 * chroma_format_idc <= 1.
 */
48 #define PRED8x8(TYPE, DEPTH, OPT) \
49 void ff_pred8x8_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
50  ptrdiff_t stride);
51 
/*
 * Prototypes of the 10-bit 8x8 predictors (DEPTH == 10); the last argument
 * names the CPU extension variant (mmxext or sse2 here).
 */
52 PRED8x8(dc, 10, mmxext)
53 PRED8x8(dc, 10, sse2)
54 PRED8x8(top_dc, 10, sse2)
55 PRED8x8(plane, 10, sse2)
56 PRED8x8(vertical, 10, sse2)
57 PRED8x8(horizontal, 10, sse2)
58 
/*
 * Emits the prototype of one 8x8l predictor named
 * ff_pred8x8l_<TYPE>_<DEPTH>_<OPT>. Unlike the other predictor macros the
 * argument list carries two extra ints, has_topleft and has_topright,
 * ahead of the stride (presumably neighbour-availability flags -- TODO
 * confirm against the predictor implementations).
 * The expansion already ends in ';', so invocations are written without one.
 */
59 #define PRED8x8L(TYPE, DEPTH, OPT)\
60 void ff_pred8x8l_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
61  int has_topleft, \
62  int has_topright, \
63  ptrdiff_t stride);
64 
/*
 * Prototypes of the 10-bit 8x8l predictors (DEPTH == 10). The init function
 * below assigns them to h->pred8x8l[] in the order mmxext, sse2, ssse3, avx,
 * so a later matching CPU check overwrites the entry set by an earlier one.
 */
65 PRED8x8L(dc, 10, sse2)
66 PRED8x8L(dc, 10, avx)
67 PRED8x8L(128_dc, 10, mmxext)
68 PRED8x8L(128_dc, 10, sse2)
69 PRED8x8L(top_dc, 10, sse2)
70 PRED8x8L(top_dc, 10, avx)
71 PRED8x8L(vertical, 10, sse2)
72 PRED8x8L(vertical, 10, avx)
73 PRED8x8L(horizontal, 10, sse2)
74 PRED8x8L(horizontal, 10, ssse3)
75 PRED8x8L(horizontal, 10, avx)
76 PRED8x8L(down_left, 10, sse2)
77 PRED8x8L(down_left, 10, ssse3)
78 PRED8x8L(down_left, 10, avx)
79 PRED8x8L(down_right, 10, sse2)
80 PRED8x8L(down_right, 10, ssse3)
81 PRED8x8L(down_right, 10, avx)
82 PRED8x8L(vertical_right, 10, sse2)
83 PRED8x8L(vertical_right, 10, ssse3)
84 PRED8x8L(vertical_right, 10, avx)
85 PRED8x8L(horizontal_up, 10, sse2)
86 PRED8x8L(horizontal_up, 10, ssse3)
87 PRED8x8L(horizontal_up, 10, avx)
88 
/*
 * Emits the prototype of one 16x16 predictor named
 * ff_pred16x16_<TYPE>_<DEPTH>_<OPT>, taking (uint8_t *src, ptrdiff_t stride).
 * The expansion already ends in ';', so invocations are written without one.
 */
89 #define PRED16x16(TYPE, DEPTH, OPT)\
90 void ff_pred16x16_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
91  ptrdiff_t stride);
92 
/*
 * Prototypes of the 10-bit 16x16 predictors (DEPTH == 10). Each TYPE is
 * declared in an mmxext and an sse2 variant; the init function below
 * installs the mmxext one first and replaces it when the sse2 check passes.
 */
93 PRED16x16(dc, 10, mmxext)
94 PRED16x16(dc, 10, sse2)
95 PRED16x16(top_dc, 10, mmxext)
96 PRED16x16(top_dc, 10, sse2)
97 PRED16x16(128_dc, 10, mmxext)
98 PRED16x16(128_dc, 10, sse2)
99 PRED16x16(left_dc, 10, mmxext)
100 PRED16x16(left_dc, 10, sse2)
101 PRED16x16(vertical, 10, mmxext)
102 PRED16x16(vertical, 10, sse2)
103 PRED16x16(horizontal, 10, mmxext)
104 PRED16x16(horizontal, 10, sse2)
105 
106 /* 8-bit versions */
/*
 * Prototypes of the 8-bit 16x16 predictors (DEPTH == 8). The plane predictor
 * is declared in three flavours (plane_h264, plane_rv40, plane_svq3); the
 * init function below picks between them by comparing codec_id against
 * AV_CODEC_ID_SVQ3 and AV_CODEC_ID_RV40. tm_vp8 is also stored in the
 * PLANE_PRED8x8 slot there.
 */
107 PRED16x16(vertical, 8, mmx)
108 PRED16x16(vertical, 8, sse)
109 PRED16x16(horizontal, 8, mmx)
110 PRED16x16(horizontal, 8, mmxext)
111 PRED16x16(horizontal, 8, ssse3)
112 PRED16x16(dc, 8, mmxext)
113 PRED16x16(dc, 8, sse2)
114 PRED16x16(dc, 8, ssse3)
115 PRED16x16(plane_h264, 8, mmx)
116 PRED16x16(plane_h264, 8, mmxext)
117 PRED16x16(plane_h264, 8, sse2)
118 PRED16x16(plane_h264, 8, ssse3)
119 PRED16x16(plane_rv40, 8, mmx)
120 PRED16x16(plane_rv40, 8, mmxext)
121 PRED16x16(plane_rv40, 8, sse2)
122 PRED16x16(plane_rv40, 8, ssse3)
123 PRED16x16(plane_svq3, 8, mmx)
124 PRED16x16(plane_svq3, 8, mmxext)
125 PRED16x16(plane_svq3, 8, sse2)
126 PRED16x16(plane_svq3, 8, ssse3)
127 PRED16x16(tm_vp8, 8, mmx)
128 PRED16x16(tm_vp8, 8, mmxext)
129 PRED16x16(tm_vp8, 8, sse2)
130 PRED16x16(tm_vp8, 8, avx2)
131 
/*
 * Prototypes of the 8-bit 8x8 predictors (DEPTH == 8). dc_rv40 is a separate
 * DC variant that the init function below stores in the same DC_PRED8x8
 * slot as the plain dc version; tm_vp8 is stored in the PLANE_PRED8x8 slot.
 */
132 PRED8x8(top_dc, 8, mmxext)
133 PRED8x8(dc_rv40, 8, mmxext)
134 PRED8x8(dc, 8, mmxext)
135 PRED8x8(vertical, 8, mmx)
136 PRED8x8(horizontal, 8, mmx)
137 PRED8x8(horizontal, 8, mmxext)
138 PRED8x8(horizontal, 8, ssse3)
139 PRED8x8(plane, 8, mmx)
140 PRED8x8(plane, 8, mmxext)
141 PRED8x8(plane, 8, sse2)
142 PRED8x8(plane, 8, ssse3)
143 PRED8x8(tm_vp8, 8, mmx)
144 PRED8x8(tm_vp8, 8, mmxext)
145 PRED8x8(tm_vp8, 8, sse2)
146 PRED8x8(tm_vp8, 8, ssse3)
147 
/*
 * Prototypes of the 8-bit 8x8l predictors (DEPTH == 8), declared in mmxext,
 * sse2 and ssse3 variants. Note that vertical_left has no mmxext variant in
 * this list (only sse2 and ssse3).
 */
148 PRED8x8L(top_dc, 8, mmxext)
149 PRED8x8L(top_dc, 8, ssse3)
150 PRED8x8L(dc, 8, mmxext)
151 PRED8x8L(dc, 8, ssse3)
152 PRED8x8L(horizontal, 8, mmxext)
153 PRED8x8L(horizontal, 8, ssse3)
154 PRED8x8L(vertical, 8, mmxext)
155 PRED8x8L(vertical, 8, ssse3)
156 PRED8x8L(down_left, 8, mmxext)
157 PRED8x8L(down_left, 8, sse2)
158 PRED8x8L(down_left, 8, ssse3)
159 PRED8x8L(down_right, 8, mmxext)
160 PRED8x8L(down_right, 8, sse2)
161 PRED8x8L(down_right, 8, ssse3)
162 PRED8x8L(vertical_right, 8, mmxext)
163 PRED8x8L(vertical_right, 8, sse2)
164 PRED8x8L(vertical_right, 8, ssse3)
165 PRED8x8L(vertical_left, 8, sse2)
166 PRED8x8L(vertical_left, 8, ssse3)
167 PRED8x8L(horizontal_up, 8, mmxext)
168 PRED8x8L(horizontal_up, 8, ssse3)
169 PRED8x8L(horizontal_down, 8, mmxext)
170 PRED8x8L(horizontal_down, 8, sse2)
171 PRED8x8L(horizontal_down, 8, ssse3)
172 
/*
 * Prototypes of the 8-bit 4x4 predictors (DEPTH == 8). Besides the
 * directional and dc modes this list declares two VP8-named entries:
 * tm_vp8 (installed into the TM_VP8_PRED slot by the init function below)
 * and vertical_vp8 (installed into the VERT_PRED slot).
 */
173 PRED4x4(dc, 8, mmxext)
174 PRED4x4(down_left, 8, mmxext)
175 PRED4x4(down_right, 8, mmxext)
176 PRED4x4(vertical_left, 8, mmxext)
177 PRED4x4(vertical_right, 8, mmxext)
178 PRED4x4(horizontal_up, 8, mmxext)
179 PRED4x4(horizontal_down, 8, mmxext)
180 PRED4x4(tm_vp8, 8, mmx)
181 PRED4x4(tm_vp8, 8, mmxext)
182 PRED4x4(tm_vp8, 8, ssse3)
183 PRED4x4(vertical_vp8, 8, mmxext)
184 
186  const int bit_depth,
187  const int chroma_format_idc)
188 {
189  int cpu_flags = av_get_cpu_flags();
190 
191  if (bit_depth == 8) {
192  if (EXTERNAL_MMX(cpu_flags)) {
193  h->pred16x16[VERT_PRED8x8 ] = ff_pred16x16_vertical_8_mmx;
194  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_8_mmx;
195  if (chroma_format_idc <= 1) {
196  h->pred8x8 [VERT_PRED8x8 ] = ff_pred8x8_vertical_8_mmx;
197  h->pred8x8 [HOR_PRED8x8 ] = ff_pred8x8_horizontal_8_mmx;
198  }
200  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_mmx;
201  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_mmx;
202  h->pred4x4 [TM_VP8_PRED ] = ff_pred4x4_tm_vp8_8_mmx;
203  } else {
204  if (chroma_format_idc <= 1)
205  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_mmx;
206  if (codec_id == AV_CODEC_ID_SVQ3) {
208  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_svq3_8_mmx;
209  } else if (codec_id == AV_CODEC_ID_RV40) {
210  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_rv40_8_mmx;
211  } else {
212  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_h264_8_mmx;
213  }
214  }
215  }
216 
217  if (EXTERNAL_MMXEXT(cpu_flags)) {
218  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_8_mmxext;
219  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_8_mmxext;
220  if (chroma_format_idc <= 1)
221  h->pred8x8[HOR_PRED8x8 ] = ff_pred8x8_horizontal_8_mmxext;
222  h->pred8x8l [TOP_DC_PRED ] = ff_pred8x8l_top_dc_8_mmxext;
223  h->pred8x8l [DC_PRED ] = ff_pred8x8l_dc_8_mmxext;
224  h->pred8x8l [HOR_PRED ] = ff_pred8x8l_horizontal_8_mmxext;
225  h->pred8x8l [VERT_PRED ] = ff_pred8x8l_vertical_8_mmxext;
226  h->pred8x8l [DIAG_DOWN_RIGHT_PRED ] = ff_pred8x8l_down_right_8_mmxext;
227  h->pred8x8l [VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_8_mmxext;
228  h->pred8x8l [HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_8_mmxext;
229  h->pred8x8l [DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_8_mmxext;
230  h->pred8x8l [HOR_DOWN_PRED ] = ff_pred8x8l_horizontal_down_8_mmxext;
231  h->pred4x4 [DIAG_DOWN_RIGHT_PRED ] = ff_pred4x4_down_right_8_mmxext;
232  h->pred4x4 [VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_8_mmxext;
233  h->pred4x4 [HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_8_mmxext;
234  h->pred4x4 [DC_PRED ] = ff_pred4x4_dc_8_mmxext;
237  h->pred4x4 [DIAG_DOWN_LEFT_PRED] = ff_pred4x4_down_left_8_mmxext;
238  }
240  h->pred4x4 [VERT_LEFT_PRED ] = ff_pred4x4_vertical_left_8_mmxext;
241  }
242  if (codec_id != AV_CODEC_ID_RV40) {
243  h->pred4x4 [HOR_UP_PRED ] = ff_pred4x4_horizontal_up_8_mmxext;
244  }
246  if (chroma_format_idc <= 1) {
247  h->pred8x8[TOP_DC_PRED8x8 ] = ff_pred8x8_top_dc_8_mmxext;
248  h->pred8x8[DC_PRED8x8 ] = ff_pred8x8_dc_8_mmxext;
249  }
250  }
252  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_mmxext;
253  h->pred8x8 [DC_PRED8x8 ] = ff_pred8x8_dc_rv40_8_mmxext;
254  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_mmxext;
255  h->pred4x4 [TM_VP8_PRED ] = ff_pred4x4_tm_vp8_8_mmxext;
256  h->pred4x4 [VERT_PRED ] = ff_pred4x4_vertical_vp8_8_mmxext;
257  } else {
258  if (chroma_format_idc <= 1)
259  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_mmxext;
260  if (codec_id == AV_CODEC_ID_SVQ3) {
261  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_plane_svq3_8_mmxext;
262  } else if (codec_id == AV_CODEC_ID_RV40) {
263  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_plane_rv40_8_mmxext;
264  } else {
265  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_plane_h264_8_mmxext;
266  }
267  }
268  }
269 
270  if (EXTERNAL_SSE(cpu_flags)) {
271  h->pred16x16[VERT_PRED8x8] = ff_pred16x16_vertical_8_sse;
272  }
273 
274  if (EXTERNAL_SSE2(cpu_flags)) {
275  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_8_sse2;
276  h->pred8x8l [DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_8_sse2;
277  h->pred8x8l [DIAG_DOWN_RIGHT_PRED ] = ff_pred8x8l_down_right_8_sse2;
278  h->pred8x8l [VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_8_sse2;
279  h->pred8x8l [VERT_LEFT_PRED ] = ff_pred8x8l_vertical_left_8_sse2;
280  h->pred8x8l [HOR_DOWN_PRED ] = ff_pred8x8l_horizontal_down_8_sse2;
282  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_sse2;
283  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_sse2;
284  } else {
285  if (chroma_format_idc <= 1)
286  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_sse2;
287  if (codec_id == AV_CODEC_ID_SVQ3) {
288  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_svq3_8_sse2;
289  } else if (codec_id == AV_CODEC_ID_RV40) {
290  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_rv40_8_sse2;
291  } else {
292  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_h264_8_sse2;
293  }
294  }
295  }
296 
297  if (EXTERNAL_SSSE3(cpu_flags)) {
298  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_8_ssse3;
299  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_8_ssse3;
300  if (chroma_format_idc <= 1)
301  h->pred8x8 [HOR_PRED8x8 ] = ff_pred8x8_horizontal_8_ssse3;
302  h->pred8x8l [TOP_DC_PRED ] = ff_pred8x8l_top_dc_8_ssse3;
303  h->pred8x8l [DC_PRED ] = ff_pred8x8l_dc_8_ssse3;
304  h->pred8x8l [HOR_PRED ] = ff_pred8x8l_horizontal_8_ssse3;
305  h->pred8x8l [VERT_PRED ] = ff_pred8x8l_vertical_8_ssse3;
306  h->pred8x8l [DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_8_ssse3;
307  h->pred8x8l [DIAG_DOWN_RIGHT_PRED ] = ff_pred8x8l_down_right_8_ssse3;
308  h->pred8x8l [VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_8_ssse3;
309  h->pred8x8l [VERT_LEFT_PRED ] = ff_pred8x8l_vertical_left_8_ssse3;
310  h->pred8x8l [HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_8_ssse3;
311  h->pred8x8l [HOR_DOWN_PRED ] = ff_pred8x8l_horizontal_down_8_ssse3;
313  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_ssse3;
314  h->pred4x4 [TM_VP8_PRED ] = ff_pred4x4_tm_vp8_8_ssse3;
315  } else {
316  if (chroma_format_idc <= 1)
317  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_ssse3;
318  if (codec_id == AV_CODEC_ID_SVQ3) {
319  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_svq3_8_ssse3;
320  } else if (codec_id == AV_CODEC_ID_RV40) {
321  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_rv40_8_ssse3;
322  } else {
323  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_h264_8_ssse3;
324  }
325  }
326  }
327 
329  if (codec_id == AV_CODEC_ID_VP8) {
330  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_avx2;
331  }
332  }
333  } else if (bit_depth == 10) {
334  if (EXTERNAL_MMXEXT(cpu_flags)) {
335  h->pred4x4[DC_PRED ] = ff_pred4x4_dc_10_mmxext;
336  h->pred4x4[HOR_UP_PRED ] = ff_pred4x4_horizontal_up_10_mmxext;
337 
338  if (chroma_format_idc <= 1)
339  h->pred8x8[DC_PRED8x8 ] = ff_pred8x8_dc_10_mmxext;
340 
341  h->pred8x8l[DC_128_PRED ] = ff_pred8x8l_128_dc_10_mmxext;
342 
343  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_10_mmxext;
344  h->pred16x16[TOP_DC_PRED8x8 ] = ff_pred16x16_top_dc_10_mmxext;
345  h->pred16x16[DC_128_PRED8x8 ] = ff_pred16x16_128_dc_10_mmxext;
346  h->pred16x16[LEFT_DC_PRED8x8 ] = ff_pred16x16_left_dc_10_mmxext;
347  h->pred16x16[VERT_PRED8x8 ] = ff_pred16x16_vertical_10_mmxext;
348  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_10_mmxext;
349  }
350  if (EXTERNAL_SSE2(cpu_flags)) {
351  h->pred4x4[DIAG_DOWN_LEFT_PRED ] = ff_pred4x4_down_left_10_sse2;
352  h->pred4x4[DIAG_DOWN_RIGHT_PRED] = ff_pred4x4_down_right_10_sse2;
353  h->pred4x4[VERT_LEFT_PRED ] = ff_pred4x4_vertical_left_10_sse2;
354  h->pred4x4[VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_10_sse2;
355  h->pred4x4[HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_10_sse2;
356 
357  if (chroma_format_idc <= 1) {
358  h->pred8x8[DC_PRED8x8 ] = ff_pred8x8_dc_10_sse2;
359  h->pred8x8[TOP_DC_PRED8x8 ] = ff_pred8x8_top_dc_10_sse2;
360  h->pred8x8[PLANE_PRED8x8 ] = ff_pred8x8_plane_10_sse2;
361  h->pred8x8[VERT_PRED8x8 ] = ff_pred8x8_vertical_10_sse2;
362  h->pred8x8[HOR_PRED8x8 ] = ff_pred8x8_horizontal_10_sse2;
363  }
364 
365  h->pred8x8l[VERT_PRED ] = ff_pred8x8l_vertical_10_sse2;
366  h->pred8x8l[HOR_PRED ] = ff_pred8x8l_horizontal_10_sse2;
367  h->pred8x8l[DC_PRED ] = ff_pred8x8l_dc_10_sse2;
368  h->pred8x8l[DC_128_PRED ] = ff_pred8x8l_128_dc_10_sse2;
369  h->pred8x8l[TOP_DC_PRED ] = ff_pred8x8l_top_dc_10_sse2;
370  h->pred8x8l[DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_10_sse2;
371  h->pred8x8l[DIAG_DOWN_RIGHT_PRED] = ff_pred8x8l_down_right_10_sse2;
372  h->pred8x8l[VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_10_sse2;
373  h->pred8x8l[HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_10_sse2;
374 
375  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_10_sse2;
376  h->pred16x16[TOP_DC_PRED8x8 ] = ff_pred16x16_top_dc_10_sse2;
377  h->pred16x16[DC_128_PRED8x8 ] = ff_pred16x16_128_dc_10_sse2;
378  h->pred16x16[LEFT_DC_PRED8x8 ] = ff_pred16x16_left_dc_10_sse2;
379  h->pred16x16[VERT_PRED8x8 ] = ff_pred16x16_vertical_10_sse2;
380  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_10_sse2;
381  }
382  if (EXTERNAL_SSSE3(cpu_flags)) {
383  h->pred4x4[DIAG_DOWN_RIGHT_PRED] = ff_pred4x4_down_right_10_ssse3;
384  h->pred4x4[VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_10_ssse3;
385  h->pred4x4[HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_10_ssse3;
386 
387  h->pred8x8l[HOR_PRED ] = ff_pred8x8l_horizontal_10_ssse3;
388  h->pred8x8l[DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_10_ssse3;
389  h->pred8x8l[DIAG_DOWN_RIGHT_PRED] = ff_pred8x8l_down_right_10_ssse3;
390  h->pred8x8l[VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_10_ssse3;
391  h->pred8x8l[HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_10_ssse3;
392  }
393  if (EXTERNAL_AVX(cpu_flags)) {
394  h->pred4x4[DIAG_DOWN_LEFT_PRED ] = ff_pred4x4_down_left_10_avx;
395  h->pred4x4[DIAG_DOWN_RIGHT_PRED] = ff_pred4x4_down_right_10_avx;
396  h->pred4x4[VERT_LEFT_PRED ] = ff_pred4x4_vertical_left_10_avx;
397  h->pred4x4[VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_10_avx;
398  h->pred4x4[HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_10_avx;
399 
400  h->pred8x8l[VERT_PRED ] = ff_pred8x8l_vertical_10_avx;
401  h->pred8x8l[HOR_PRED ] = ff_pred8x8l_horizontal_10_avx;
402  h->pred8x8l[DC_PRED ] = ff_pred8x8l_dc_10_avx;
403  h->pred8x8l[TOP_DC_PRED ] = ff_pred8x8l_top_dc_10_avx;
404  h->pred8x8l[DIAG_DOWN_RIGHT_PRED] = ff_pred8x8l_down_right_10_avx;
405  h->pred8x8l[DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_10_avx;
406  h->pred8x8l[VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_10_avx;
407  h->pred8x8l[HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_10_avx;
408  }
409  }
410 }
static void bit_depth(AudioStatsContext *s, uint64_t mask, uint64_t imask, AVRational *depth)
Definition: af_astats.c:254
Macro definitions for various function/variable attributes.
#define av_cold
Definition: attributes.h:88
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! 
*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> dc
Libavcodec external API header.
static atomic_int cpu_flags
Definition: cpu.c:50
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:95
#define AV_CPU_FLAG_CMOV
supports cmov instruction
Definition: cpu.h:53
@ AV_CODEC_ID_SVQ3
Definition: codec_id.h:72
@ AV_CODEC_ID_H264
Definition: codec_id.h:76
@ AV_CODEC_ID_VP7
Definition: codec_id.h:230
@ AV_CODEC_ID_VP8
Definition: codec_id.h:189
@ AV_CODEC_ID_RV40
Definition: codec_id.h:118
#define PRED8x8L(TYPE, DEPTH, OPT)
#define PRED8x8(TYPE, DEPTH, OPT)
#define PRED16x16(TYPE, DEPTH, OPT)
#define PRED4x4(TYPE, DEPTH, OPT)
H.264 / AVC / MPEG-4 prediction functions.
#define TOP_DC_PRED8x8
Definition: h264pred.h:75
void ff_h264_pred_init_x86(H264PredContext *h, int codec_id, const int bit_depth, const int chroma_format_idc)
#define HOR_PRED8x8
Definition: h264pred.h:69
#define VERT_PRED8x8
Definition: h264pred.h:70
#define DC_PRED8x8
Definition: h264pred.h:68
#define LEFT_DC_PRED8x8
Definition: h264pred.h:74
#define PLANE_PRED8x8
Definition: h264pred.h:71
#define DC_128_PRED8x8
Definition: h264pred.h:76
static int sse(MpegEncContext *s, uint8_t *src1, uint8_t *src2, int w, int h, int stride)
Context for storing H.264 prediction functions.
Definition: h264pred.h:92
enum AVCodecID codec_id
Definition: vaapi_decode.c:369
@ VERT_RIGHT_PRED
Definition: vp9.h:51
@ TOP_DC_PRED
Definition: vp9.h:57
@ VERT_LEFT_PRED
Definition: vp9.h:53
@ HOR_UP_PRED
Definition: vp9.h:54
@ TM_VP8_PRED
Definition: vp9.h:55
@ DIAG_DOWN_LEFT_PRED
Definition: vp9.h:49
@ DIAG_DOWN_RIGHT_PRED
Definition: vp9.h:50
@ DC_128_PRED
Definition: vp9.h:58
@ VERT_PRED
Definition: vp9.h:46
@ HOR_DOWN_PRED
Definition: vp9.h:52
@ HOR_PRED
Definition: vp9.h:47
@ DC_PRED
Definition: vp9.h:48
#define EXTERNAL_SSE(flags)
Definition: cpu.h:58
#define EXTERNAL_AVX(flags)
Definition: cpu.h:70
#define EXTERNAL_MMXEXT(flags)
Definition: cpu.h:57
#define EXTERNAL_SSSE3(flags)
Definition: cpu.h:65
#define EXTERNAL_MMX(flags)
Definition: cpu.h:56
#define EXTERNAL_AVX2(flags)
Definition: cpu.h:78
#define EXTERNAL_SSE2(flags)
Definition: cpu.h:59