/
SDL_cpuinfo.c
453 lines (417 loc) · 12.9 KB
1
2
/*
SDL - Simple DirectMedia Layer
3
Copyright (C) 1997-2004 Sam Lantinga
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Library General Public
License as published by the Free Software Foundation; either
version 2 of the License, or (at your option) any later version.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Library General Public License for more details.
You should have received a copy of the GNU Library General Public
License along with this library; if not, write to the Free
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
Sam Lantinga
slouken@libsdl.org
*/
#ifdef SAVE_RCSID
static char rcsid =
"@(#) $Id$";
#endif
/* CPU feature detection for SDL */
30
31
32
33
34
35
#ifdef unix /* FIXME: Better setjmp detection? */
#define USE_SETJMP
#include <signal.h>
#include <setjmp.h>
#endif
36
#include "SDL.h"
37
#include "SDL_cpuinfo.h"
38
39
40
41
42
#ifdef MACOSX
#include <sys/sysctl.h> /* For AltiVec check */
#endif
43
44
#define CPU_HAS_RDTSC 0x00000001
#define CPU_HAS_MMX 0x00000002
45
46
47
48
49
50
#define CPU_HAS_MMXEXT 0x00000004
#define CPU_HAS_3DNOW 0x00000010
#define CPU_HAS_3DNOWEXT 0x00000020
#define CPU_HAS_SSE 0x00000040
#define CPU_HAS_SSE2 0x00000080
#define CPU_HAS_ALTIVEC 0x00000100
51
52
#if defined(USE_SETJMP) && defined(GCC_ALTIVEC)
53
54
55
56
57
58
59
60
61
62
/* This is the brute force way of detecting instruction sets...
the idea is borrowed from the libmpeg2 library - thanks!
*/
static jmp_buf jmpbuf;
static void illegal_instruction(int sig)
{
longjmp(jmpbuf, 1);
}
#endif // USE_SETJMP
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
static __inline__ int CPU_haveCPUID()
{
int has_CPUID = 0;
#if defined(__GNUC__) && defined(i386)
__asm__ (
" pushfl # Get original EFLAGS \n"
" popl %%eax \n"
" movl %%eax,%%ecx \n"
" xorl $0x200000,%%eax # Flip ID bit in EFLAGS \n"
" pushl %%eax # Save new EFLAGS value on stack \n"
" popfl # Replace current EFLAGS value \n"
" pushfl # Get new EFLAGS \n"
" popl %%eax # Store new EFLAGS in EAX \n"
" xorl %%ecx,%%eax # Can not toggle ID bit, \n"
" jz 1f # Processor=80486 \n"
" movl $1,%0 # We have CPUID support \n"
"1: \n"
80
: "=m" (has_CPUID)
81
82
83
:
: "%eax", "%ecx"
);
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
#elif defined(__GNUC__) && defined(__x86_64__)
/* Technically, if this is being compiled under __x86_64__ then it has
CPUid by definition. But it's nice to be able to prove it. :) */
__asm__ (
" pushfq # Get original EFLAGS \n"
" popq %%rax \n"
" movq %%rax,%%rcx \n"
" xorl $0x200000,%%eax # Flip ID bit in EFLAGS \n"
" pushq %%rax # Save new EFLAGS value on stack \n"
" popfq # Replace current EFLAGS value \n"
" pushfq # Get new EFLAGS \n"
" popq %%rax # Store new EFLAGS in EAX \n"
" xorl %%ecx,%%eax # Can not toggle ID bit, \n"
" jz 1f # Processor=80486 \n"
" movl $1,%0 # We have CPUID support \n"
"1: \n"
: "=m" (has_CPUID)
:
: "%rax", "%rcx"
);
104
#elif defined(_MSC_VER) && (defined(_M_IX86) || defined(_X86_))
105
__asm {
106
107
108
109
110
111
112
113
114
115
116
117
118
pushfd ; Get original EFLAGS
pop eax
mov ecx, eax
xor eax, 200000h ; Flip ID bit in EFLAGS
push eax ; Save new EFLAGS value on stack
popfd ; Replace current EFLAGS value
pushfd ; Get new EFLAGS
pop eax ; Store new EFLAGS in EAX
xor eax, ecx ; Can not toggle ID bit,
jz done ; Processor=80486
mov has_CPUID,1 ; We have CPUID support
done:
}
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
#elif defined(__sun) && defined(__x86)
__asm (
" pushfl \n"
" popl %eax \n"
" movl %eax,%ecx \n"
" xorl $0x200000,%eax \n"
" pushl %eax \n"
" popfl \n"
" pushfl \n"
" popl %eax \n"
" xorl %ecx,%eax \n"
" jz 1f \n"
" movl $1,-8(%ebp) \n"
"1: \n"
);
#elif defined(__sun) && defined(__amd64)
__asm (
" pushfq \n"
" popq %rax \n"
" movq %rax,%rcx \n"
" xorl $0x200000,%eax \n"
" pushq %rax \n"
" popfq \n"
" pushfq \n"
" popq %rax \n"
" xorl %ecx,%eax \n"
" jz 1f \n"
" movl $1,-8(%rbp) \n"
"1: \n"
);
149
150
151
152
153
154
155
#endif
return has_CPUID;
}
static __inline__ int CPU_getCPUIDFeatures()
{
int features = 0;
156
#if defined(__GNUC__) && ( defined(i386) || defined(__x86_64__) )
157
__asm__ (
158
" movl %%ebx,%%edi\n"
159
160
161
162
163
164
165
166
167
" xorl %%eax,%%eax # Set up for CPUID instruction \n"
" cpuid # Get and save vendor ID \n"
" cmpl $1,%%eax # Make sure 1 is valid input for CPUID\n"
" jl 1f # We dont have the CPUID instruction\n"
" xorl %%eax,%%eax \n"
" incl %%eax \n"
" cpuid # Get family/model/stepping/features\n"
" movl %%edx,%0 \n"
"1: \n"
168
" movl %%edi,%%ebx\n"
169
: "=m" (features)
170
:
171
: "%eax", "%ecx", "%edx", "%edi"
172
);
173
#elif defined(_MSC_VER) && (defined(_M_IX86) || defined(_X86_))
174
__asm {
175
176
177
178
179
180
181
182
183
184
xor eax, eax ; Set up for CPUID instruction
cpuid ; Get and save vendor ID
cmp eax, 1 ; Make sure 1 is valid input for CPUID
jl done ; We dont have the CPUID instruction
xor eax, eax
inc eax
cpuid ; Get family/model/stepping/features
mov features, edx
done:
}
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
#elif defined(__sun) && (defined(__x86) || defined(__amd64))
__asm(
" movl %ebx,%edi\n"
" xorl %eax,%eax \n"
" cpuid \n"
" cmpl $1,%eax \n"
" jl 1f \n"
" xorl %eax,%eax \n"
" incl %eax \n"
" cpuid \n"
#ifdef __i386
" movl %edx,-8(%ebp) \n"
#else
" movl %edx,-8(%rbp) \n"
#endif
"1: \n"
" movl %edi,%ebx\n" );
202
203
204
205
#endif
return features;
}
206
static __inline__ int CPU_getCPUIDFeaturesExt()
207
{
208
int features = 0;
209
#if defined(__GNUC__) && (defined(i386) || defined (__x86_64__) )
210
__asm__ (
211
" movl %%ebx,%%edi\n"
212
213
214
" movl $0x80000000,%%eax # Query for extended functions \n"
" cpuid # Get extended function limit \n"
" cmpl $0x80000001,%%eax \n"
215
" jl 1f # Nope, we dont have function 800000001h\n"
216
217
" movl $0x80000001,%%eax # Setup extended function 800000001h\n"
" cpuid # and get the information \n"
218
" movl %%edx,%0 \n"
219
"1: \n"
220
221
" movl %%edi,%%ebx\n"
: "=m" (features)
222
:
223
: "%eax", "%ecx", "%edx", "%edi"
224
);
225
#elif defined(_MSC_VER) && (defined(_M_IX86) || defined(_X86_))
226
__asm {
227
228
229
mov eax,80000000h ; Query for extended functions
cpuid ; Get extended function limit
cmp eax,80000001h
230
jl done ; Nope, we dont have function 800000001h
231
232
mov eax,80000001h ; Setup extended function 800000001h
cpuid ; and get the information
233
mov features,edx
234
235
done:
}
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
#elif defined(__sun) && ( defined(__i386) || defined(__amd64) )
__asm (
" movl %ebx,%edi\n"
" movl $0x80000000,%eax \n"
" cpuid \n"
" cmpl $0x80000001,%eax \n"
" jl 1f \n"
" movl $0x80000001,%eax \n"
" cpuid \n"
#ifdef __i386
" movl %edx,-8(%ebp) \n"
#else
" movl %edx,-8(%rbp) \n"
#endif
"1: \n"
" movl %edi,%ebx\n"
);
253
#endif
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
return features;
}
static __inline__ int CPU_haveRDTSC()
{
if ( CPU_haveCPUID() ) {
return (CPU_getCPUIDFeatures() & 0x00000010);
}
return 0;
}
static __inline__ int CPU_haveMMX()
{
if ( CPU_haveCPUID() ) {
return (CPU_getCPUIDFeatures() & 0x00800000);
}
return 0;
}
static __inline__ int CPU_haveMMXExt()
{
if ( CPU_haveCPUID() ) {
return (CPU_getCPUIDFeaturesExt() & 0x00400000);
}
return 0;
}
static __inline__ int CPU_have3DNow()
{
if ( CPU_haveCPUID() ) {
return (CPU_getCPUIDFeaturesExt() & 0x80000000);
}
return 0;
}
static __inline__ int CPU_have3DNowExt()
{
if ( CPU_haveCPUID() ) {
return (CPU_getCPUIDFeaturesExt() & 0x40000000);
}
return 0;
295
296
297
298
299
300
301
302
303
}
static __inline__ int CPU_haveSSE()
{
if ( CPU_haveCPUID() ) {
return (CPU_getCPUIDFeatures() & 0x02000000);
}
return 0;
}
304
305
306
307
308
309
310
311
312
static __inline__ int CPU_haveSSE2()
{
if ( CPU_haveCPUID() ) {
return (CPU_getCPUIDFeatures() & 0x04000000);
}
return 0;
}
313
314
static __inline__ int CPU_haveAltiVec()
{
315
volatile int altivec = 0;
316
317
318
319
320
321
#ifdef MACOSX
int selectors[2] = { CTL_HW, HW_VECTORUNIT };
int hasVectorUnit = 0;
size_t length = sizeof(hasVectorUnit);
int error = sysctl(selectors, 2, &hasVectorUnit, &length, NULL, 0);
if( 0 == error )
322
altivec = (hasVectorUnit != 0);
323
#elif defined(USE_SETJMP) && defined(GCC_ALTIVEC)
324
325
326
327
328
329
330
331
332
333
void (*handler)(int sig);
handler = signal(SIGILL, illegal_instruction);
if ( setjmp(jmpbuf) == 0 ) {
asm volatile ("mtspr 256, %0\n\t"
"vand %%v0, %%v0, %%v0"
:
: "r" (-1));
altivec = 1;
}
signal(SIGILL, handler);
334
#endif
335
return altivec;
336
337
}
338
339
340
341
342
343
static Uint32 SDL_CPUFeatures = 0xFFFFFFFF;
static Uint32 SDL_GetCPUFeatures()
{
if ( SDL_CPUFeatures == 0xFFFFFFFF ) {
SDL_CPUFeatures = 0;
344
345
346
if ( CPU_haveRDTSC() ) {
SDL_CPUFeatures |= CPU_HAS_RDTSC;
}
347
348
349
if ( CPU_haveMMX() ) {
SDL_CPUFeatures |= CPU_HAS_MMX;
}
350
351
352
if ( CPU_haveMMXExt() ) {
SDL_CPUFeatures |= CPU_HAS_MMXEXT;
}
353
354
355
if ( CPU_have3DNow() ) {
SDL_CPUFeatures |= CPU_HAS_3DNOW;
}
356
357
358
if ( CPU_have3DNowExt() ) {
SDL_CPUFeatures |= CPU_HAS_3DNOWEXT;
}
359
360
361
if ( CPU_haveSSE() ) {
SDL_CPUFeatures |= CPU_HAS_SSE;
}
362
363
364
if ( CPU_haveSSE2() ) {
SDL_CPUFeatures |= CPU_HAS_SSE2;
}
365
366
367
if ( CPU_haveAltiVec() ) {
SDL_CPUFeatures |= CPU_HAS_ALTIVEC;
}
368
369
370
371
}
return SDL_CPUFeatures;
}
372
373
374
375
376
377
378
379
SDL_bool SDL_HasRDTSC()
{
if ( SDL_GetCPUFeatures() & CPU_HAS_RDTSC ) {
return SDL_TRUE;
}
return SDL_FALSE;
}
380
381
382
383
384
385
386
387
SDL_bool SDL_HasMMX()
{
if ( SDL_GetCPUFeatures() & CPU_HAS_MMX ) {
return SDL_TRUE;
}
return SDL_FALSE;
}
388
SDL_bool SDL_HasMMXExt()
389
{
390
if ( SDL_GetCPUFeatures() & CPU_HAS_MMXEXT ) {
391
392
393
394
395
return SDL_TRUE;
}
return SDL_FALSE;
}
396
SDL_bool SDL_Has3DNow()
397
{
398
if ( SDL_GetCPUFeatures() & CPU_HAS_3DNOW ) {
399
400
401
402
403
return SDL_TRUE;
}
return SDL_FALSE;
}
404
SDL_bool SDL_Has3DNowExt()
405
{
406
if ( SDL_GetCPUFeatures() & CPU_HAS_3DNOWEXT ) {
407
408
409
410
411
return SDL_TRUE;
}
return SDL_FALSE;
}
412
SDL_bool SDL_HasSSE()
413
{
414
415
416
417
if ( SDL_GetCPUFeatures() & CPU_HAS_SSE ) {
return SDL_TRUE;
}
return SDL_FALSE;
418
419
}
420
SDL_bool SDL_HasSSE2()
421
{
422
423
424
425
if ( SDL_GetCPUFeatures() & CPU_HAS_SSE2 ) {
return SDL_TRUE;
}
return SDL_FALSE;
426
427
}
428
SDL_bool SDL_HasAltiVec()
429
{
430
431
432
433
if ( SDL_GetCPUFeatures() & CPU_HAS_ALTIVEC ) {
return SDL_TRUE;
}
return SDL_FALSE;
434
435
}
436
437
438
439
440
441
#ifdef TEST_MAIN
#include <stdio.h>
int main()
{
442
printf("RDTSC: %d\n", SDL_HasRDTSC());
443
printf("MMX: %d\n", SDL_HasMMX());
444
printf("MMXExt: %d\n", SDL_HasMMXExt());
445
printf("3DNow: %d\n", SDL_Has3DNow());
446
printf("3DNowExt: %d\n", SDL_Has3DNowExt());
447
printf("SSE: %d\n", SDL_HasSSE());
448
printf("SSE2: %d\n", SDL_HasSSE2());
449
printf("AltiVec: %d\n", SDL_HasAltiVec());
450
return 0;
451
452
453
}
#endif /* TEST_MAIN */