1 /*
2 * This file is part of FFmpeg.
3 *
4 * FFmpeg is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
8 *
9 * FFmpeg is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
13 *
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with FFmpeg; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17 */
18
19 #include <stdint.h>
20
26
27 #if HAVE_SCHED_GETAFFINITY
28 #ifndef _GNU_SOURCE
29 # define _GNU_SOURCE
30 #endif
31 #include <sched.h>
32 #endif
33 #if HAVE_GETPROCESSAFFINITYMASK || HAVE_WINRT
34 #include <windows.h>
35 #endif
36 #if HAVE_SYSCTL
37 #if HAVE_SYS_PARAM_H
38 #include <sys/param.h>
39 #endif
40 #include <sys/types.h>
41 #include <sys/sysctl.h>
42 #endif
43 #if HAVE_UNISTD_H
44 #include <unistd.h>
45 #endif
46
48
70 }
71
74 }
75
77 {
80
81 if (ARCH_AARCH64)
83 if (ARCH_ARM)
85 if (ARCH_PPC)
87 if (ARCH_X86)
89
92 }
93
95 {
99 }
100
102 {
103 #define CPUFLAG_MMXEXT (AV_CPU_FLAG_MMX | AV_CPU_FLAG_MMXEXT | AV_CPU_FLAG_CMOV)
104 #define CPUFLAG_3DNOW (AV_CPU_FLAG_3DNOW | AV_CPU_FLAG_MMX)
105 #define CPUFLAG_3DNOWEXT (AV_CPU_FLAG_3DNOWEXT | CPUFLAG_3DNOW)
106 #define CPUFLAG_SSE (AV_CPU_FLAG_SSE | CPUFLAG_MMXEXT)
107 #define CPUFLAG_SSE2 (AV_CPU_FLAG_SSE2 | CPUFLAG_SSE)
108 #define CPUFLAG_SSE2SLOW (AV_CPU_FLAG_SSE2SLOW | CPUFLAG_SSE2)
109 #define CPUFLAG_SSE3 (AV_CPU_FLAG_SSE3 | CPUFLAG_SSE2)
110 #define CPUFLAG_SSE3SLOW (AV_CPU_FLAG_SSE3SLOW | CPUFLAG_SSE3)
111 #define CPUFLAG_SSSE3 (AV_CPU_FLAG_SSSE3 | CPUFLAG_SSE3)
112 #define CPUFLAG_SSE4 (AV_CPU_FLAG_SSE4 | CPUFLAG_SSSE3)
113 #define CPUFLAG_SSE42 (AV_CPU_FLAG_SSE42 | CPUFLAG_SSE4)
114 #define CPUFLAG_AVX (AV_CPU_FLAG_AVX | CPUFLAG_SSE42)
115 #define CPUFLAG_AVXSLOW (AV_CPU_FLAG_AVXSLOW | CPUFLAG_AVX)
116 #define CPUFLAG_XOP (AV_CPU_FLAG_XOP | CPUFLAG_AVX)
117 #define CPUFLAG_FMA3 (AV_CPU_FLAG_FMA3 | CPUFLAG_AVX)
118 #define CPUFLAG_FMA4 (AV_CPU_FLAG_FMA4 | CPUFLAG_AVX)
119 #define CPUFLAG_AVX2 (AV_CPU_FLAG_AVX2 | CPUFLAG_AVX)
120 #define CPUFLAG_BMI2 (AV_CPU_FLAG_BMI2 | AV_CPU_FLAG_BMI1)
121 #define CPUFLAG_AESNI (AV_CPU_FLAG_AESNI | CPUFLAG_SSE42)
122 static const AVOption cpuflags_opts[] = {
124 #if ARCH_PPC
126 #elif ARCH_X86
150 #elif ARCH_ARM
158 #elif ARCH_AARCH64
162 #endif
164 };
168 .option = cpuflags_opts,
170 };
171
173 const AVClass *pclass = &
class;
174
176 return ret;
177
178 return flags & INT_MAX;
179 }
180
182 {
183 static const AVOption cpuflags_opts[] = {
185 #if ARCH_PPC
187 #elif ARCH_X86
212
213 #define CPU_FLAG_P2 AV_CPU_FLAG_CMOV | AV_CPU_FLAG_MMX
214 #define CPU_FLAG_P3 CPU_FLAG_P2 | AV_CPU_FLAG_MMX2 | AV_CPU_FLAG_SSE
215 #define CPU_FLAG_P4 CPU_FLAG_P3| AV_CPU_FLAG_SSE2
219
220 #define CPU_FLAG_K62 AV_CPU_FLAG_MMX | AV_CPU_FLAG_3DNOW
221 #define CPU_FLAG_ATHLON CPU_FLAG_K62 | AV_CPU_FLAG_CMOV | AV_CPU_FLAG_3DNOWEXT | AV_CPU_FLAG_MMX2
222 #define CPU_FLAG_ATHLONXP CPU_FLAG_ATHLON | AV_CPU_FLAG_SSE
223 #define CPU_FLAG_K8 CPU_FLAG_ATHLONXP | AV_CPU_FLAG_SSE2
229 #elif ARCH_ARM
238 #elif ARCH_AARCH64
242 #endif
244 };
248 .option = cpuflags_opts,
250 };
251 const AVClass *pclass = &
class;
252
254 }
255
257 {
258 static volatile int printed;
259
260 int nb_cpus = 1;
261 #if HAVE_WINRT
262 SYSTEM_INFO sysinfo;
263 #endif
264 #if HAVE_SCHED_GETAFFINITY && defined(CPU_COUNT)
265 cpu_set_t cpuset;
266
267 CPU_ZERO(&cpuset);
268
269 if (!sched_getaffinity(0, sizeof(cpuset), &cpuset))
270 nb_cpus = CPU_COUNT(&cpuset);
271 #elif HAVE_GETPROCESSAFFINITYMASK
273 if (GetProcessAffinityMask(GetCurrentProcess(), &proc_aff, &sys_aff))
274 nb_cpus = av_popcount64(proc_aff);
275 #elif HAVE_SYSCTL && defined(HW_NCPU)
276 int mib[2] = { CTL_HW, HW_NCPU };
277 size_t len =
sizeof(nb_cpus);
278
279 if (sysctl(mib, 2, &nb_cpus, &len,
NULL, 0) == -1)
280 nb_cpus = 0;
281 #elif HAVE_SYSCONF && defined(_SC_NPROC_ONLN)
282 nb_cpus = sysconf(_SC_NPROC_ONLN);
283 #elif HAVE_SYSCONF && defined(_SC_NPROCESSORS_ONLN)
284 nb_cpus = sysconf(_SC_NPROCESSORS_ONLN);
285 #elif HAVE_WINRT
286 GetNativeSystemInfo(&sysinfo);
287 nb_cpus = sysinfo.dwNumberOfProcessors;
288 #endif
289
290 if (!printed) {
292 printed = 1;
293 }
294
295 return nb_cpus;
296 }
297
298 #ifdef TEST
299
300 #include <stdio.h>
302
303 #if !HAVE_GETOPT
305 #endif
306
307 static const struct {
310 } cpu_flag_tab[] = {
311 #if ARCH_AARCH64
315 #elif ARCH_ARM
324 #elif ARCH_PPC
326 #elif ARCH_X86
350 #endif
351 { 0 }
352 };
353
354 static void print_cpu_flags(
int cpu_flags,
const char *
type)
355 {
356 int i;
357
358 printf("cpu_flags(%s) = 0x%08X\n", type, cpu_flags);
359 printf("cpu_flags_str(%s) =", type);
360 for (i = 0; cpu_flag_tab[i].flag; i++)
361 if (cpu_flags & cpu_flag_tab[i].
flag)
362 printf(
" %s", cpu_flag_tab[i].
name);
363 printf("\n");
364 }
365
366
367 int main(
int argc,
char **argv)
368 {
370 int cpu_flags_eff;
372 char threads[5] = "auto";
373 int i;
374
375 for(i = 0; cpu_flag_tab[i].flag; i++) {
376 unsigned tmp = 0;
378 fprintf(stderr, "Table missing %s\n", cpu_flag_tab[i].name);
379 return 4;
380 }
381 }
382
383 if (cpu_flags_raw < 0)
384 return 1;
385
386 for (;;) {
387 int c =
getopt(argc, argv,
"c:t:");
388 if (c == -1)
389 break;
390 switch (c) {
391 case 'c':
392 {
395 return 2;
396
398 break;
399 }
400 case 't':
401 {
403 if (len >= sizeof(threads)) {
404 fprintf(stderr,
"Invalid thread count '%s'\n",
optarg);
405 return 2;
406 }
407 }
408 }
409 }
410
412
413 if (cpu_flags_eff < 0)
414 return 3;
415
416 print_cpu_flags(cpu_flags_raw, "raw");
417 print_cpu_flags(cpu_flags_eff, "effective");
418 printf("threads = %s (cpu_count = %d)\n", threads, cpu_count);
419
420 return 0;
421 }
422
423 #endif
#define AV_CPU_FLAG_AVX
AVX functions: requires OS support even if YMM registers aren't used.
#define AV_CPU_FLAG_ALTIVEC
standard
#define AV_LOG_WARNING
Something somehow does not look correct.
#define LIBAVUTIL_VERSION_INT
#define AV_CPU_FLAG_SSE
SSE functions.
void av_set_cpu_flags_mask(int mask)
Set a mask on flags returned by av_get_cpu_flags().
#define AV_CPU_FLAG_MMX2
SSE integer functions or AMD MMX ext.
#define AV_CPU_FLAG_CMOV
supports cmov instruction
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
#define AV_CPU_FLAG_FMA3
Haswell FMA3 functions.
#define AV_CPU_FLAG_MMXEXT
SSE integer functions or AMD MMX ext.
int ff_get_cpu_flags_ppc(void)
This function MAY rely on signal() or fork() in order to make sure AltiVec is present.
int av_parse_cpu_flags(const char *s)
Parse CPU flags from a string.
#define AV_CPU_FLAG_ATOM
Atom processor, some SSSE3 instructions are slower.
#define AV_CPU_FLAG_AVX2
AVX2 functions: requires OS support even if YMM registers aren't used.
#define AV_CPU_FLAG_SSE2SLOW
SSE2 supported, but usually not faster.
#define AV_CPU_FLAG_XOP
Bulldozer XOP functions.
#define AV_CPU_FLAG_SSE42
Nehalem SSE4.2 functions.
#define AV_CPU_FLAG_SSSE3
Conroe SSSE3 functions.
static const uint16_t mask[17]
int av_opt_eval_flags(void *obj, const AVOption *o, const char *val, int *flags_out)
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
#define AV_CPU_FLAG_ARMV6T2
#define AV_CPU_FLAG_VFP_VM
VFPv2 vector mode, deprecated in ARMv7-A and unavailable in various CPUs implementations.
size_t av_strlcpy(char *dst, const char *src, size_t size)
Copy the string src to dst, but no more than size - 1 bytes, and null-terminate dst.
int av_parse_cpu_caps(unsigned *flags, const char *s)
Parse CPU caps from a string and update the given AV_CPU_* flags based on that.
#define AV_CPU_FLAG_ARMV5TE
#define AV_CPU_FLAG_SSE3
Prescott SSE3 functions.
int ff_get_cpu_flags_x86(void)
#define AV_CPU_FLAG_BMI2
Bit Manipulation Instruction Set 2.
#define AV_CPU_FLAG_VFPV3
#define AV_CPU_FLAG_3DNOW
AMD 3DNOW.
#define AV_CPU_FLAG_ARMV6
int ff_get_cpu_flags_aarch64(void)
#define AV_CPU_FLAG_SSE3SLOW
SSE3 supported, but usually not faster.
#define AV_CPU_FLAG_AVXSLOW
AVX supported, but slow when using YMM registers (e.g. Bulldozer)
#define AV_CPU_FLAG_BMI1
Bit Manipulation Instruction Set 1.
#define AV_CPU_FLAG_MMX
standard MMX
static int getopt(int argc, char *argv[], char *opts)
Describe the class of an AVClass context structure.
#define AV_CPU_FLAG_FMA4
Bulldozer FMA4 functions.
#define AV_CPU_FLAG_SSE4
Penryn SSE4.1 functions.
#define AV_CPU_FLAG_AESNI
Advanced Encryption Standard functions.
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
#define AV_CPU_FLAG_3DNOWEXT
AMD 3DNowExt.
common internal and external API header
#define AV_CPU_FLAG_ARMV8
int ff_get_cpu_flags_arm(void)
#define AV_CPU_FLAG_SETEND
#define AV_CPU_FLAG_SSE2
PIV SSE2 functions.
void av_force_cpu_flags(int arg)
Disables cpu detection and forces the specified flags.
int main(int argc, char **argv)