FFmpeg  4.0
cpu.c
Go to the documentation of this file.
1 /*
2  * This file is part of FFmpeg.
3  *
4  * FFmpeg is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * FFmpeg is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with FFmpeg; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18 
19 #include <stdio.h>
20 
21 #include "config.h"
22 
23 #include "libavutil/cpu.h"
24 #include "libavutil/avstring.h"
25 
26 #if HAVE_UNISTD_H
27 #include <unistd.h>
28 #endif
29 #if !HAVE_GETOPT
30 #include "compat/getopt.c"
31 #endif
32 
/**
 * Flag/name pairs for the CPU capabilities of the architecture selected by
 * the ARCH_* configuration macros.
 *
 * main() checks that av_parse_cpu_caps() accepts every name listed here, and
 * print_cpu_flags() walks the table to print the names of the bits set in a
 * flag mask. The table is terminated by an entry whose flag is 0.
 */
static const struct {
    int flag;           /* AV_CPU_FLAG_* value */
    const char *name;   /* textual name associated with the flag */
} cpu_flag_tab[] = {
#if ARCH_AARCH64
    { .flag = AV_CPU_FLAG_ARMV8,    .name = "armv8"    },
    { .flag = AV_CPU_FLAG_NEON,     .name = "neon"     },
    { .flag = AV_CPU_FLAG_VFP,      .name = "vfp"      },
#elif ARCH_ARM
    { .flag = AV_CPU_FLAG_ARMV5TE,  .name = "armv5te"  },
    { .flag = AV_CPU_FLAG_ARMV6,    .name = "armv6"    },
    { .flag = AV_CPU_FLAG_ARMV6T2,  .name = "armv6t2"  },
    { .flag = AV_CPU_FLAG_VFP,      .name = "vfp"      },
    { .flag = AV_CPU_FLAG_VFP_VM,   .name = "vfp_vm"   },
    { .flag = AV_CPU_FLAG_VFPV3,    .name = "vfpv3"    },
    { .flag = AV_CPU_FLAG_NEON,     .name = "neon"     },
    { .flag = AV_CPU_FLAG_SETEND,   .name = "setend"   },
#elif ARCH_PPC
    { .flag = AV_CPU_FLAG_ALTIVEC,  .name = "altivec"  },
#elif ARCH_X86
    { .flag = AV_CPU_FLAG_MMX,      .name = "mmx"      },
    { .flag = AV_CPU_FLAG_MMXEXT,   .name = "mmxext"   },
    { .flag = AV_CPU_FLAG_SSE,      .name = "sse"      },
    { .flag = AV_CPU_FLAG_SSE2,     .name = "sse2"     },
    { .flag = AV_CPU_FLAG_SSE2SLOW, .name = "sse2slow" },
    { .flag = AV_CPU_FLAG_SSE3,     .name = "sse3"     },
    { .flag = AV_CPU_FLAG_SSE3SLOW, .name = "sse3slow" },
    { .flag = AV_CPU_FLAG_SSSE3,    .name = "ssse3"    },
    { .flag = AV_CPU_FLAG_ATOM,     .name = "atom"     },
    { .flag = AV_CPU_FLAG_SSE4,     .name = "sse4.1"   },
    { .flag = AV_CPU_FLAG_SSE42,    .name = "sse4.2"   },
    { .flag = AV_CPU_FLAG_AVX,      .name = "avx"      },
    { .flag = AV_CPU_FLAG_AVXSLOW,  .name = "avxslow"  },
    { .flag = AV_CPU_FLAG_XOP,      .name = "xop"      },
    { .flag = AV_CPU_FLAG_FMA3,     .name = "fma3"     },
    { .flag = AV_CPU_FLAG_FMA4,     .name = "fma4"     },
    { .flag = AV_CPU_FLAG_3DNOW,    .name = "3dnow"    },
    { .flag = AV_CPU_FLAG_3DNOWEXT, .name = "3dnowext" },
    { .flag = AV_CPU_FLAG_CMOV,     .name = "cmov"     },
    { .flag = AV_CPU_FLAG_AVX2,     .name = "avx2"     },
    { .flag = AV_CPU_FLAG_BMI1,     .name = "bmi1"     },
    { .flag = AV_CPU_FLAG_BMI2,     .name = "bmi2"     },
    { .flag = AV_CPU_FLAG_AESNI,    .name = "aesni"    },
    { .flag = AV_CPU_FLAG_AVX512,   .name = "avx512"   },
#endif
    { 0 }   /* terminator: loops over the table stop at flag == 0 */
};
80 
81 static void print_cpu_flags(int cpu_flags, const char *type)
82 {
83  int i;
84 
85  printf("cpu_flags(%s) = 0x%08X\n", type, cpu_flags);
86  printf("cpu_flags_str(%s) =", type);
87  for (i = 0; cpu_flag_tab[i].flag; i++)
88  if (cpu_flags & cpu_flag_tab[i].flag)
89  printf(" %s", cpu_flag_tab[i].name);
90  printf("\n");
91 }
92 
93 
94 int main(int argc, char **argv)
95 {
96  int cpu_flags_raw = av_get_cpu_flags();
97  int cpu_flags_eff;
98  int cpu_count = av_cpu_count();
99  char threads[5] = "auto";
100  int i;
101 
102  for(i = 0; cpu_flag_tab[i].flag; i++) {
103  unsigned tmp = 0;
104  if (av_parse_cpu_caps(&tmp, cpu_flag_tab[i].name) < 0) {
105  fprintf(stderr, "Table missing %s\n", cpu_flag_tab[i].name);
106  return 4;
107  }
108  }
109 
110  if (cpu_flags_raw < 0)
111  return 1;
112 
113  for (;;) {
114  int c = getopt(argc, argv, "c:t:");
115  if (c == -1)
116  break;
117  switch (c) {
118  case 'c':
119  {
120  unsigned flags = av_get_cpu_flags();
121  if (av_parse_cpu_caps(&flags, optarg) < 0)
122  return 2;
123 
124  av_force_cpu_flags(flags);
125  break;
126  }
127  case 't':
128  {
129  int len = av_strlcpy(threads, optarg, sizeof(threads));
130  if (len >= sizeof(threads)) {
131  fprintf(stderr, "Invalid thread count '%s'\n", optarg);
132  return 2;
133  }
134  }
135  }
136  }
137 
138  cpu_flags_eff = av_get_cpu_flags();
139 
140  if (cpu_flags_eff < 0)
141  return 3;
142 
143  print_cpu_flags(cpu_flags_raw, "raw");
144  print_cpu_flags(cpu_flags_eff, "effective");
145  printf("threads = %s (cpu_count = %d)\n", threads, cpu_count);
146 
147  return 0;
148 }
#define AV_CPU_FLAG_AVX
AVX functions: requires OS support even if YMM registers aren't used.
Definition: cpu.h:49
#define AV_CPU_FLAG_ALTIVEC
standard
Definition: cpu.h:60
int av_cpu_count(void)
Definition: cpu.c:267
#define AV_CPU_FLAG_SSE
SSE functions.
Definition: cpu.h:35
int flag
Definition: cpu.c:34
#define AV_CPU_FLAG_CMOV
supports cmov instruction
Definition: cpu.h:53
#define AV_CPU_FLAG_VFP
Definition: cpu.h:67
static atomic_int cpu_flags
Definition: cpu.c:50
static const struct @265 cpu_flag_tab[]
#define AV_CPU_FLAG_FMA3
Haswell FMA3 functions.
Definition: cpu.h:55
#define AV_CPU_FLAG_NEON
Definition: cpu.h:69
#define AV_CPU_FLAG_MMXEXT
SSE integer functions or AMD MMX ext.
Definition: cpu.h:32
const char * name
Definition: cpu.c:35
#define AV_CPU_FLAG_ATOM
Atom processor, some SSSE3 instructions are slower.
Definition: cpu.h:45
static int flags
Definition: log.c:55
#define AV_CPU_FLAG_AVX2
AVX2 functions: requires OS support even if YMM registers aren't used.
Definition: cpu.h:54
#define AV_CPU_FLAG_SSE2SLOW
SSE2 supported, but usually not faster.
Definition: cpu.h:37
#define AV_CPU_FLAG_XOP
Bulldozer XOP functions.
Definition: cpu.h:51
#define AV_CPU_FLAG_SSE42
Nehalem SSE4.2 functions.
Definition: cpu.h:47
#define AV_CPU_FLAG_SSSE3
Conroe SSSE3 functions.
Definition: cpu.h:43
#define AV_CPU_FLAG_ARMV6T2
Definition: cpu.h:66
#define AV_CPU_FLAG_AVX512
AVX-512 functions: requires OS support even if YMM/ZMM registers aren't used.
Definition: cpu.h:58
#define AV_CPU_FLAG_VFP_VM
VFPv2 vector mode, deprecated in ARMv7-A and unavailable in various CPUs implementations.
Definition: cpu.h:71
size_t av_strlcpy(char *dst, const char *src, size_t size)
Copy the string src to dst, but no more than size - 1 bytes, and null-terminate dst.
Definition: avstring.c:83
int av_parse_cpu_caps(unsigned *flags, const char *s)
Parse CPU caps from a string and update the given AV_CPU_* flags based on that.
Definition: cpu.c:191
#define AV_CPU_FLAG_ARMV5TE
Definition: cpu.h:64
#define AV_CPU_FLAG_SSE3
Prescott SSE3 functions.
Definition: cpu.h:40
#define AV_CPU_FLAG_BMI2
Bit Manipulation Instruction Set 2.
Definition: cpu.h:57
#define AV_CPU_FLAG_VFPV3
Definition: cpu.h:68
#define AV_CPU_FLAG_3DNOW
AMD 3DNOW.
Definition: cpu.h:34
#define AV_CPU_FLAG_ARMV6
Definition: cpu.h:65
#define AV_CPU_FLAG_SSE3SLOW
SSE3 supported, but usually not faster.
Definition: cpu.h:41
#define AV_CPU_FLAG_AVXSLOW
AVX supported, but slow when using YMM registers (e.g. Bulldozer)
Definition: cpu.h:50
#define AV_CPU_FLAG_BMI1
Bit Manipulation Instruction Set 1.
Definition: cpu.h:56
#define AV_CPU_FLAG_MMX
standard MMX
Definition: cpu.h:31
static int getopt(int argc, char *argv[], char *opts)
Definition: getopt.c:41
#define AV_CPU_FLAG_FMA4
Bulldozer FMA4 functions.
Definition: cpu.h:52
#define AV_CPU_FLAG_SSE4
Penryn SSE4.1 functions.
Definition: cpu.h:46
cl_device_type type
#define AV_CPU_FLAG_AESNI
Advanced Encryption Standard functions.
Definition: cpu.h:48
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
Definition: cpu.c:93
#define AV_CPU_FLAG_3DNOWEXT
AMD 3DNowExt.
Definition: cpu.h:39
static double c[64]
#define AV_CPU_FLAG_ARMV8
Definition: cpu.h:70
static char * optarg
Definition: getopt.c:39
int main(int argc, char **argv)
Definition: cpu.c:94
int len
#define AV_CPU_FLAG_SETEND
Definition: cpu.h:72
#define AV_CPU_FLAG_SSE2
PIV SSE2 functions.
Definition: cpu.h:36
void av_force_cpu_flags(int arg)
Disables cpu detection and forces the specified flags.
Definition: cpu.c:65
static void print_cpu_flags(int cpu_flags, const char *type)
Definition: cpu.c:81
static uint8_t tmp[11]
Definition: aes_ctr.c:26