FFmpeg  4.0
h264_intrapred_init.c
Go to the documentation of this file.
/*
 * Copyright (c) 2010 Fiona Glaser <fiona@x264.com>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
20 
21 #include "libavutil/attributes.h"
22 #include "libavutil/cpu.h"
23 #include "libavutil/x86/cpu.h"
24 #include "libavcodec/avcodec.h"
25 #include "libavcodec/h264pred.h"
26 
/*
 * Declare the prototype of one 4x4 intra predictor.
 *
 * Expands to a declaration of ff_pred4x4_<TYPE>_<DEPTH>_<OPT>, taking the
 * destination block pointer, a pointer to the top-right samples and the
 * line stride. The trailing ';' is part of the macro, so invocations are
 * written without one. Only prototypes are produced here; the definitions
 * live outside this file.
 */
#define PRED4x4(TYPE, DEPTH, OPT) \
void ff_pred4x4_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
                                                    const uint8_t *topright, \
                                                    ptrdiff_t stride);

/* 10-bit 4x4 predictors */
PRED4x4(dc,              10, mmxext)
PRED4x4(down_left,       10, sse2)
PRED4x4(down_left,       10, avx)
PRED4x4(down_right,      10, sse2)
PRED4x4(down_right,      10, ssse3)
PRED4x4(down_right,      10, avx)
PRED4x4(vertical_left,   10, sse2)
PRED4x4(vertical_left,   10, avx)
PRED4x4(vertical_right,  10, sse2)
PRED4x4(vertical_right,  10, ssse3)
PRED4x4(vertical_right,  10, avx)
PRED4x4(horizontal_up,   10, mmxext)
PRED4x4(horizontal_down, 10, sse2)
PRED4x4(horizontal_down, 10, ssse3)
PRED4x4(horizontal_down, 10, avx)
47 
/*
 * Declare the prototype of one 8x8 intra predictor.
 *
 * Expands to a declaration of ff_pred8x8_<TYPE>_<DEPTH>_<OPT>, taking the
 * destination block pointer and the line stride. The trailing ';' is part
 * of the macro, so invocations are written without one. Only prototypes are
 * produced here; the definitions live outside this file.
 */
#define PRED8x8(TYPE, DEPTH, OPT) \
void ff_pred8x8_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
                                                    ptrdiff_t stride);

/* 10-bit 8x8 predictors */
PRED8x8(dc,         10, mmxext)
PRED8x8(dc,         10, sse2)
PRED8x8(top_dc,     10, sse2)
PRED8x8(plane,      10, sse2)
PRED8x8(vertical,   10, sse2)
PRED8x8(horizontal, 10, sse2)
58 
/*
 * Declare the prototype of one 8x8l intra predictor.
 *
 * Expands to a declaration of ff_pred8x8l_<TYPE>_<DEPTH>_<OPT>, taking the
 * destination block pointer, the has_topleft / has_topright flags and the
 * line stride. The trailing ';' is part of the macro, so invocations are
 * written without one. Only prototypes are produced here; the definitions
 * live outside this file.
 */
#define PRED8x8L(TYPE, DEPTH, OPT) \
void ff_pred8x8l_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
                                                     int has_topleft, \
                                                     int has_topright, \
                                                     ptrdiff_t stride);

/* 10-bit 8x8l predictors */
PRED8x8L(dc,             10, sse2)
PRED8x8L(dc,             10, avx)
PRED8x8L(128_dc,         10, mmxext)
PRED8x8L(128_dc,         10, sse2)
PRED8x8L(top_dc,         10, sse2)
PRED8x8L(top_dc,         10, avx)
PRED8x8L(vertical,       10, sse2)
PRED8x8L(vertical,       10, avx)
PRED8x8L(horizontal,     10, sse2)
PRED8x8L(horizontal,     10, ssse3)
PRED8x8L(horizontal,     10, avx)
PRED8x8L(down_left,      10, sse2)
PRED8x8L(down_left,      10, ssse3)
PRED8x8L(down_left,      10, avx)
PRED8x8L(down_right,     10, sse2)
PRED8x8L(down_right,     10, ssse3)
PRED8x8L(down_right,     10, avx)
PRED8x8L(vertical_right, 10, sse2)
PRED8x8L(vertical_right, 10, ssse3)
PRED8x8L(vertical_right, 10, avx)
PRED8x8L(horizontal_up,  10, sse2)
PRED8x8L(horizontal_up,  10, ssse3)
PRED8x8L(horizontal_up,  10, avx)
88 
/*
 * Declare the prototype of one 16x16 intra predictor.
 *
 * Expands to a declaration of ff_pred16x16_<TYPE>_<DEPTH>_<OPT>, taking the
 * destination block pointer and the line stride. The trailing ';' is part
 * of the macro, so invocations are written without one. Only prototypes are
 * produced here; the definitions live outside this file.
 */
#define PRED16x16(TYPE, DEPTH, OPT) \
void ff_pred16x16_ ## TYPE ## _ ## DEPTH ## _ ## OPT (uint8_t *src, \
                                                      ptrdiff_t stride);

/* 10-bit 16x16 predictors */
PRED16x16(dc,         10, mmxext)
PRED16x16(dc,         10, sse2)
PRED16x16(top_dc,     10, mmxext)
PRED16x16(top_dc,     10, sse2)
PRED16x16(128_dc,     10, mmxext)
PRED16x16(128_dc,     10, sse2)
PRED16x16(left_dc,    10, mmxext)
PRED16x16(left_dc,    10, sse2)
PRED16x16(vertical,   10, mmxext)
PRED16x16(vertical,   10, sse2)
PRED16x16(horizontal, 10, mmxext)
PRED16x16(horizontal, 10, sse2)
105 
106 /* 8-bit versions */
107 PRED16x16(vertical, 8, mmx)
108 PRED16x16(vertical, 8, sse)
109 PRED16x16(horizontal, 8, mmx)
110 PRED16x16(horizontal, 8, mmxext)
111 PRED16x16(horizontal, 8, ssse3)
112 PRED16x16(dc, 8, mmxext)
113 PRED16x16(dc, 8, sse2)
114 PRED16x16(dc, 8, ssse3)
115 PRED16x16(plane_h264, 8, mmx)
116 PRED16x16(plane_h264, 8, mmxext)
117 PRED16x16(plane_h264, 8, sse2)
118 PRED16x16(plane_h264, 8, ssse3)
119 PRED16x16(plane_rv40, 8, mmx)
120 PRED16x16(plane_rv40, 8, mmxext)
121 PRED16x16(plane_rv40, 8, sse2)
122 PRED16x16(plane_rv40, 8, ssse3)
123 PRED16x16(plane_svq3, 8, mmx)
124 PRED16x16(plane_svq3, 8, mmxext)
125 PRED16x16(plane_svq3, 8, sse2)
126 PRED16x16(plane_svq3, 8, ssse3)
127 PRED16x16(tm_vp8, 8, mmx)
128 PRED16x16(tm_vp8, 8, mmxext)
129 PRED16x16(tm_vp8, 8, sse2)
130 PRED16x16(tm_vp8, 8, avx2)
131 
132 PRED8x8(top_dc, 8, mmxext)
133 PRED8x8(dc_rv40, 8, mmxext)
134 PRED8x8(dc, 8, mmxext)
135 PRED8x8(vertical, 8, mmx)
136 PRED8x8(horizontal, 8, mmx)
137 PRED8x8(horizontal, 8, mmxext)
138 PRED8x8(horizontal, 8, ssse3)
139 PRED8x8(plane, 8, mmx)
140 PRED8x8(plane, 8, mmxext)
141 PRED8x8(plane, 8, sse2)
142 PRED8x8(plane, 8, ssse3)
143 PRED8x8(tm_vp8, 8, mmx)
144 PRED8x8(tm_vp8, 8, mmxext)
145 PRED8x8(tm_vp8, 8, sse2)
146 PRED8x8(tm_vp8, 8, ssse3)
147 
148 PRED8x8L(top_dc, 8, mmxext)
149 PRED8x8L(top_dc, 8, ssse3)
150 PRED8x8L(dc, 8, mmxext)
151 PRED8x8L(dc, 8, ssse3)
152 PRED8x8L(horizontal, 8, mmxext)
153 PRED8x8L(horizontal, 8, ssse3)
154 PRED8x8L(vertical, 8, mmxext)
155 PRED8x8L(vertical, 8, ssse3)
156 PRED8x8L(down_left, 8, mmxext)
157 PRED8x8L(down_left, 8, sse2)
158 PRED8x8L(down_left, 8, ssse3)
159 PRED8x8L(down_right, 8, mmxext)
160 PRED8x8L(down_right, 8, sse2)
161 PRED8x8L(down_right, 8, ssse3)
162 PRED8x8L(vertical_right, 8, mmxext)
163 PRED8x8L(vertical_right, 8, sse2)
164 PRED8x8L(vertical_right, 8, ssse3)
165 PRED8x8L(vertical_left, 8, sse2)
166 PRED8x8L(vertical_left, 8, ssse3)
167 PRED8x8L(horizontal_up, 8, mmxext)
168 PRED8x8L(horizontal_up, 8, ssse3)
169 PRED8x8L(horizontal_down, 8, mmxext)
170 PRED8x8L(horizontal_down, 8, sse2)
171 PRED8x8L(horizontal_down, 8, ssse3)
172 
173 PRED4x4(dc, 8, mmxext)
174 PRED4x4(down_left, 8, mmxext)
175 PRED4x4(down_right, 8, mmxext)
176 PRED4x4(vertical_left, 8, mmxext)
177 PRED4x4(vertical_right, 8, mmxext)
178 PRED4x4(horizontal_up, 8, mmxext)
179 PRED4x4(horizontal_down, 8, mmxext)
180 PRED4x4(tm_vp8, 8, mmx)
181 PRED4x4(tm_vp8, 8, mmxext)
182 PRED4x4(tm_vp8, 8, ssse3)
183 PRED4x4(vertical_vp8, 8, mmxext)
184 
186  const int bit_depth,
187  const int chroma_format_idc)
188 {
189  int cpu_flags = av_get_cpu_flags();
190 
191  if (bit_depth == 8) {
192  if (EXTERNAL_MMX(cpu_flags)) {
193  h->pred16x16[VERT_PRED8x8 ] = ff_pred16x16_vertical_8_mmx;
194  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_8_mmx;
195  if (chroma_format_idc <= 1) {
196  h->pred8x8 [VERT_PRED8x8 ] = ff_pred8x8_vertical_8_mmx;
197  h->pred8x8 [HOR_PRED8x8 ] = ff_pred8x8_horizontal_8_mmx;
198  }
199  if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8) {
200  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_mmx;
201  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_mmx;
202  h->pred4x4 [TM_VP8_PRED ] = ff_pred4x4_tm_vp8_8_mmx;
203  } else {
204  if (chroma_format_idc <= 1)
205  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_mmx;
206  if (codec_id == AV_CODEC_ID_SVQ3) {
207  if (cpu_flags & AV_CPU_FLAG_CMOV)
208  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_svq3_8_mmx;
209  } else if (codec_id == AV_CODEC_ID_RV40) {
210  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_rv40_8_mmx;
211  } else {
212  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_h264_8_mmx;
213  }
214  }
215  }
216 
217  if (EXTERNAL_MMXEXT(cpu_flags)) {
218  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_8_mmxext;
219  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_8_mmxext;
220  if (chroma_format_idc <= 1)
221  h->pred8x8[HOR_PRED8x8 ] = ff_pred8x8_horizontal_8_mmxext;
222  h->pred8x8l [TOP_DC_PRED ] = ff_pred8x8l_top_dc_8_mmxext;
223  h->pred8x8l [DC_PRED ] = ff_pred8x8l_dc_8_mmxext;
224  h->pred8x8l [HOR_PRED ] = ff_pred8x8l_horizontal_8_mmxext;
225  h->pred8x8l [VERT_PRED ] = ff_pred8x8l_vertical_8_mmxext;
226  h->pred8x8l [DIAG_DOWN_RIGHT_PRED ] = ff_pred8x8l_down_right_8_mmxext;
227  h->pred8x8l [VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_8_mmxext;
228  h->pred8x8l [HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_8_mmxext;
229  h->pred8x8l [DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_8_mmxext;
230  h->pred8x8l [HOR_DOWN_PRED ] = ff_pred8x8l_horizontal_down_8_mmxext;
231  h->pred4x4 [DIAG_DOWN_RIGHT_PRED ] = ff_pred4x4_down_right_8_mmxext;
232  h->pred4x4 [VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_8_mmxext;
233  h->pred4x4 [HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_8_mmxext;
234  h->pred4x4 [DC_PRED ] = ff_pred4x4_dc_8_mmxext;
235  if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8 ||
236  codec_id == AV_CODEC_ID_H264) {
237  h->pred4x4 [DIAG_DOWN_LEFT_PRED] = ff_pred4x4_down_left_8_mmxext;
238  }
239  if (codec_id == AV_CODEC_ID_SVQ3 || codec_id == AV_CODEC_ID_H264) {
240  h->pred4x4 [VERT_LEFT_PRED ] = ff_pred4x4_vertical_left_8_mmxext;
241  }
242  if (codec_id != AV_CODEC_ID_RV40) {
243  h->pred4x4 [HOR_UP_PRED ] = ff_pred4x4_horizontal_up_8_mmxext;
244  }
245  if (codec_id == AV_CODEC_ID_SVQ3 || codec_id == AV_CODEC_ID_H264) {
246  if (chroma_format_idc <= 1) {
247  h->pred8x8[TOP_DC_PRED8x8 ] = ff_pred8x8_top_dc_8_mmxext;
248  h->pred8x8[DC_PRED8x8 ] = ff_pred8x8_dc_8_mmxext;
249  }
250  }
251  if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8) {
252  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_mmxext;
253  h->pred8x8 [DC_PRED8x8 ] = ff_pred8x8_dc_rv40_8_mmxext;
254  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_mmxext;
255  h->pred4x4 [TM_VP8_PRED ] = ff_pred4x4_tm_vp8_8_mmxext;
256  h->pred4x4 [VERT_PRED ] = ff_pred4x4_vertical_vp8_8_mmxext;
257  } else {
258  if (chroma_format_idc <= 1)
259  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_mmxext;
260  if (codec_id == AV_CODEC_ID_SVQ3) {
261  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_plane_svq3_8_mmxext;
262  } else if (codec_id == AV_CODEC_ID_RV40) {
263  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_plane_rv40_8_mmxext;
264  } else {
265  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_plane_h264_8_mmxext;
266  }
267  }
268  }
269 
270  if (EXTERNAL_SSE(cpu_flags)) {
271  h->pred16x16[VERT_PRED8x8] = ff_pred16x16_vertical_8_sse;
272  }
273 
274  if (EXTERNAL_SSE2(cpu_flags)) {
275  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_8_sse2;
276  h->pred8x8l [DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_8_sse2;
277  h->pred8x8l [DIAG_DOWN_RIGHT_PRED ] = ff_pred8x8l_down_right_8_sse2;
278  h->pred8x8l [VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_8_sse2;
279  h->pred8x8l [VERT_LEFT_PRED ] = ff_pred8x8l_vertical_left_8_sse2;
280  h->pred8x8l [HOR_DOWN_PRED ] = ff_pred8x8l_horizontal_down_8_sse2;
281  if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8) {
282  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_sse2;
283  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_sse2;
284  } else {
285  if (chroma_format_idc <= 1)
286  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_sse2;
287  if (codec_id == AV_CODEC_ID_SVQ3) {
288  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_svq3_8_sse2;
289  } else if (codec_id == AV_CODEC_ID_RV40) {
290  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_rv40_8_sse2;
291  } else {
292  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_h264_8_sse2;
293  }
294  }
295  }
296 
297  if (EXTERNAL_SSSE3(cpu_flags)) {
298  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_8_ssse3;
299  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_8_ssse3;
300  if (chroma_format_idc <= 1)
301  h->pred8x8 [HOR_PRED8x8 ] = ff_pred8x8_horizontal_8_ssse3;
302  h->pred8x8l [TOP_DC_PRED ] = ff_pred8x8l_top_dc_8_ssse3;
303  h->pred8x8l [DC_PRED ] = ff_pred8x8l_dc_8_ssse3;
304  h->pred8x8l [HOR_PRED ] = ff_pred8x8l_horizontal_8_ssse3;
305  h->pred8x8l [VERT_PRED ] = ff_pred8x8l_vertical_8_ssse3;
306  h->pred8x8l [DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_8_ssse3;
307  h->pred8x8l [DIAG_DOWN_RIGHT_PRED ] = ff_pred8x8l_down_right_8_ssse3;
308  h->pred8x8l [VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_8_ssse3;
309  h->pred8x8l [VERT_LEFT_PRED ] = ff_pred8x8l_vertical_left_8_ssse3;
310  h->pred8x8l [HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_8_ssse3;
311  h->pred8x8l [HOR_DOWN_PRED ] = ff_pred8x8l_horizontal_down_8_ssse3;
312  if (codec_id == AV_CODEC_ID_VP7 || codec_id == AV_CODEC_ID_VP8) {
313  h->pred8x8 [PLANE_PRED8x8 ] = ff_pred8x8_tm_vp8_8_ssse3;
314  h->pred4x4 [TM_VP8_PRED ] = ff_pred4x4_tm_vp8_8_ssse3;
315  } else {
316  if (chroma_format_idc <= 1)
317  h->pred8x8 [PLANE_PRED8x8] = ff_pred8x8_plane_8_ssse3;
318  if (codec_id == AV_CODEC_ID_SVQ3) {
319  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_svq3_8_ssse3;
320  } else if (codec_id == AV_CODEC_ID_RV40) {
321  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_rv40_8_ssse3;
322  } else {
323  h->pred16x16[PLANE_PRED8x8] = ff_pred16x16_plane_h264_8_ssse3;
324  }
325  }
326  }
327 
328  if(EXTERNAL_AVX2(cpu_flags)){
329  if (codec_id == AV_CODEC_ID_VP8) {
330  h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_tm_vp8_8_avx2;
331  }
332  }
333  } else if (bit_depth == 10) {
334  if (EXTERNAL_MMXEXT(cpu_flags)) {
335  h->pred4x4[DC_PRED ] = ff_pred4x4_dc_10_mmxext;
336  h->pred4x4[HOR_UP_PRED ] = ff_pred4x4_horizontal_up_10_mmxext;
337 
338  if (chroma_format_idc <= 1)
339  h->pred8x8[DC_PRED8x8 ] = ff_pred8x8_dc_10_mmxext;
340 
341  h->pred8x8l[DC_128_PRED ] = ff_pred8x8l_128_dc_10_mmxext;
342 
343  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_10_mmxext;
344  h->pred16x16[TOP_DC_PRED8x8 ] = ff_pred16x16_top_dc_10_mmxext;
345  h->pred16x16[DC_128_PRED8x8 ] = ff_pred16x16_128_dc_10_mmxext;
346  h->pred16x16[LEFT_DC_PRED8x8 ] = ff_pred16x16_left_dc_10_mmxext;
347  h->pred16x16[VERT_PRED8x8 ] = ff_pred16x16_vertical_10_mmxext;
348  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_10_mmxext;
349  }
350  if (EXTERNAL_SSE2(cpu_flags)) {
351  h->pred4x4[DIAG_DOWN_LEFT_PRED ] = ff_pred4x4_down_left_10_sse2;
352  h->pred4x4[DIAG_DOWN_RIGHT_PRED] = ff_pred4x4_down_right_10_sse2;
353  h->pred4x4[VERT_LEFT_PRED ] = ff_pred4x4_vertical_left_10_sse2;
354  h->pred4x4[VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_10_sse2;
355  h->pred4x4[HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_10_sse2;
356 
357  if (chroma_format_idc <= 1) {
358  h->pred8x8[DC_PRED8x8 ] = ff_pred8x8_dc_10_sse2;
359  h->pred8x8[TOP_DC_PRED8x8 ] = ff_pred8x8_top_dc_10_sse2;
360  h->pred8x8[PLANE_PRED8x8 ] = ff_pred8x8_plane_10_sse2;
361  h->pred8x8[VERT_PRED8x8 ] = ff_pred8x8_vertical_10_sse2;
362  h->pred8x8[HOR_PRED8x8 ] = ff_pred8x8_horizontal_10_sse2;
363  }
364 
365  h->pred8x8l[VERT_PRED ] = ff_pred8x8l_vertical_10_sse2;
366  h->pred8x8l[HOR_PRED ] = ff_pred8x8l_horizontal_10_sse2;
367  h->pred8x8l[DC_PRED ] = ff_pred8x8l_dc_10_sse2;
368  h->pred8x8l[DC_128_PRED ] = ff_pred8x8l_128_dc_10_sse2;
369  h->pred8x8l[TOP_DC_PRED ] = ff_pred8x8l_top_dc_10_sse2;
370  h->pred8x8l[DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_10_sse2;
371  h->pred8x8l[DIAG_DOWN_RIGHT_PRED] = ff_pred8x8l_down_right_10_sse2;
372  h->pred8x8l[VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_10_sse2;
373  h->pred8x8l[HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_10_sse2;
374 
375  h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_10_sse2;
376  h->pred16x16[TOP_DC_PRED8x8 ] = ff_pred16x16_top_dc_10_sse2;
377  h->pred16x16[DC_128_PRED8x8 ] = ff_pred16x16_128_dc_10_sse2;
378  h->pred16x16[LEFT_DC_PRED8x8 ] = ff_pred16x16_left_dc_10_sse2;
379  h->pred16x16[VERT_PRED8x8 ] = ff_pred16x16_vertical_10_sse2;
380  h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_horizontal_10_sse2;
381  }
382  if (EXTERNAL_SSSE3(cpu_flags)) {
383  h->pred4x4[DIAG_DOWN_RIGHT_PRED] = ff_pred4x4_down_right_10_ssse3;
384  h->pred4x4[VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_10_ssse3;
385  h->pred4x4[HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_10_ssse3;
386 
387  h->pred8x8l[HOR_PRED ] = ff_pred8x8l_horizontal_10_ssse3;
388  h->pred8x8l[DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_10_ssse3;
389  h->pred8x8l[DIAG_DOWN_RIGHT_PRED] = ff_pred8x8l_down_right_10_ssse3;
390  h->pred8x8l[VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_10_ssse3;
391  h->pred8x8l[HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_10_ssse3;
392  }
393  if (EXTERNAL_AVX(cpu_flags)) {
394  h->pred4x4[DIAG_DOWN_LEFT_PRED ] = ff_pred4x4_down_left_10_avx;
395  h->pred4x4[DIAG_DOWN_RIGHT_PRED] = ff_pred4x4_down_right_10_avx;
396  h->pred4x4[VERT_LEFT_PRED ] = ff_pred4x4_vertical_left_10_avx;
397  h->pred4x4[VERT_RIGHT_PRED ] = ff_pred4x4_vertical_right_10_avx;
398  h->pred4x4[HOR_DOWN_PRED ] = ff_pred4x4_horizontal_down_10_avx;
399 
400  h->pred8x8l[VERT_PRED ] = ff_pred8x8l_vertical_10_avx;
401  h->pred8x8l[HOR_PRED ] = ff_pred8x8l_horizontal_10_avx;
402  h->pred8x8l[DC_PRED ] = ff_pred8x8l_dc_10_avx;
403  h->pred8x8l[TOP_DC_PRED ] = ff_pred8x8l_top_dc_10_avx;
404  h->pred8x8l[DIAG_DOWN_RIGHT_PRED] = ff_pred8x8l_down_right_10_avx;
405  h->pred8x8l[DIAG_DOWN_LEFT_PRED ] = ff_pred8x8l_down_left_10_avx;
406  h->pred8x8l[VERT_RIGHT_PRED ] = ff_pred8x8l_vertical_right_10_avx;
407  h->pred8x8l[HOR_UP_PRED ] = ff_pred8x8l_horizontal_up_10_avx;
408  }
409  }
410 }
#define EXTERNAL_MMX(flags)
Definition: cpu.h:56
int plane
Definition: avisynth_c.h:422
#define VERT_PRED8x8
Definition: h264pred.h:70
Definition: vp9.h:47
#define DC_128_PRED8x8
Definition: h264pred.h:76
void ff_h264_pred_init_x86(H264PredContext *h, int codec_id, const int bit_depth, const int chroma_format_idc)
#define PRED8x8(TYPE, DEPTH, OPT)
#define AV_CPU_FLAG_CMOV
supports cmov instruction
Definition: cpu.h:53
static int sse(MpegEncContext *s, uint8_t *src1, uint8_t *src2, int w, int h, int stride)
static atomic_int cpu_flags
Definition: cpu.c:50
#define EXTERNAL_SSE(flags)
Definition: cpu.h:58
#define HOR_PRED8x8
Definition: h264pred.h:69
Macro definitions for various function/variable attributes.
#define PRED16x16(TYPE, DEPTH, OPT)
#define PLANE_PRED8x8
Definition: h264pred.h:71
#define av_cold
Definition: attributes.h:82
#define DC_PRED8x8
Definition: h264pred.h:68
Definition: vp9.h:46
#define TOP_DC_PRED8x8
Definition: h264pred.h:75
Context for storing H.264 prediction functions.
Definition: h264pred.h:92
void(* pred8x8[4+3+4])(uint8_t *src, ptrdiff_t stride)
Definition: h264pred.h:97
#define PRED8x8L(TYPE, DEPTH, OPT)
void(* pred4x4[9+3+3])(uint8_t *src, const uint8_t *topright, ptrdiff_t stride)
Definition: h264pred.h:93
#define EXTERNAL_SSE2(flags)
Definition: cpu.h:59
#define PRED4x4(TYPE, DEPTH, OPT)
static void bit_depth(AudioStatsContext *s, uint64_t mask, uint64_t imask, AVRational *depth)
Definition: af_astats.c:152
enum AVCodecID codec_id
Definition: vaapi_decode.c:362
#define LEFT_DC_PRED8x8
Definition: h264pred.h:74
Libavcodec external API header.
void(* pred16x16[4+3+2])(uint8_t *src, ptrdiff_t stride)
Definition: h264pred.h:98
#define EXTERNAL_SSSE3(flags)
Definition: cpu.h:65
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:93
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! 
*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> dc
#define EXTERNAL_AVX2(flags)
Definition: cpu.h:78
H.264 / AVC / MPEG-4 prediction functions.
#define EXTERNAL_MMXEXT(flags)
Definition: cpu.h:57
Definition: vp9.h:48
#define EXTERNAL_AVX(flags)
Definition: cpu.h:70
void(* pred8x8l[9+3])(uint8_t *src, int topleft, int topright, ptrdiff_t stride)
Definition: h264pred.h:95