2010-01-06 23:39:22 -05:00
|
|
|
! Copyright (C) 2009, 2010 Slava Pestov.
|
2009-05-31 16:02:14 -04:00
|
|
|
! See http://factorcode.org/license.txt for BSD license.
|
2012-09-19 11:40:18 -04:00
|
|
|
USING: alien alien.c-types arrays assocs combinators
|
|
|
|
compiler.codegen.labels cpu.architecture cpu.x86.assembler
|
|
|
|
cpu.x86.assembler.operands init kernel math math.order
|
|
|
|
math.parser memoize namespaces sequences
|
2012-09-19 13:12:25 -04:00
|
|
|
specialized-arrays system math.bitwise combinators.smart ;
|
2012-09-18 21:40:29 -04:00
|
|
|
SPECIALIZED-ARRAY: uint
|
2009-05-31 16:02:14 -04:00
|
|
|
IN: cpu.x86.features
|
|
|
|
|
|
|
|
<PRIVATE
|
|
|
|
|
2010-05-16 03:43:02 -04:00
|
|
|
: return-reg ( -- reg ) int-regs return-regs at first ;
|
|
|
|
|
2010-01-06 23:39:22 -05:00
|
|
|
: (sse-version) ( -- n )
|
2010-03-31 22:20:35 -04:00
|
|
|
int { } cdecl [
|
2010-01-06 23:39:22 -05:00
|
|
|
"sse-42" define-label
|
|
|
|
"sse-41" define-label
|
|
|
|
"ssse-3" define-label
|
|
|
|
"sse-3" define-label
|
|
|
|
"sse-2" define-label
|
|
|
|
"sse-1" define-label
|
|
|
|
"end" define-label
|
2009-05-31 16:02:14 -04:00
|
|
|
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 1 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
|
|
|
|
CPUID
|
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 20 BT
|
|
|
|
"sse-42" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 19 BT
|
|
|
|
"sse-41" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 9 BT
|
|
|
|
"ssse-3" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 0 BT
|
|
|
|
"sse-3" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
EDX 26 BT
|
|
|
|
"sse-2" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
EDX 25 BT
|
|
|
|
"sse-1" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 0 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-42" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 42 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-41" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 41 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"ssse-3" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 33 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-3" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 30 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-2" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 20 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-1" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 10 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
|
|
|
|
"end" resolve-label
|
|
|
|
] alien-assembly ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
|
|
|
PRIVATE>
|
|
|
|
|
2009-09-23 06:13:15 -04:00
|
|
|
MEMO: sse-version ( -- n )
|
2010-01-06 23:39:22 -05:00
|
|
|
(sse-version) "sse-version" get string>number [ min ] when* ;
|
2009-09-23 06:13:15 -04:00
|
|
|
|
|
|
|
: sse? ( -- ? ) sse-version 10 >= ;
|
|
|
|
: sse2? ( -- ? ) sse-version 20 >= ;
|
|
|
|
: sse3? ( -- ? ) sse-version 30 >= ;
|
|
|
|
: ssse3? ( -- ? ) sse-version 33 >= ;
|
|
|
|
: sse4.1? ( -- ? ) sse-version 41 >= ;
|
|
|
|
: sse4.2? ( -- ? ) sse-version 42 >= ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
2012-09-19 14:30:54 -04:00
|
|
|
HOOK: (cpuid) cpu ( rax rcx regs -- )
|
2012-09-18 21:40:29 -04:00
|
|
|
|
2012-09-19 14:30:54 -04:00
|
|
|
|
|
|
|
: cpuid-extended ( rax rcx -- 4array )
|
2012-09-18 21:40:29 -04:00
|
|
|
4 <uint-array> [ (cpuid) ] keep >array ;
|
|
|
|
|
2012-09-19 14:30:54 -04:00
|
|
|
: cpuid ( rax -- 4array ) 0 cpuid-extended ;
|
|
|
|
|
2012-09-19 13:12:25 -04:00
|
|
|
: cpu-stepping ( -- n ) 1 cpuid first 4 bits ;
|
|
|
|
: cpu-model ( -- n ) 1 cpuid first -4 shift 4 bits ;
|
|
|
|
: cpu-family ( -- n ) 1 cpuid first -8 shift 4 bits ;
|
|
|
|
: cpu-processor-type ( -- n ) 1 cpuid first -12 shift 2 bits ;
|
|
|
|
: cpu-extended-model ( -- n ) 1 cpuid first -16 shift 4 bits ;
|
|
|
|
: cpu-extended-family ( -- n ) 1 cpuid first -20 shift 8 bits ;
|
|
|
|
|
|
|
|
: cpu-family-model-string ( -- string )
|
|
|
|
[
|
|
|
|
cpu-extended-family cpu-family [ >hex ] bi@
|
|
|
|
"_"
|
|
|
|
cpu-extended-model cpu-model [ >hex ] bi@
|
|
|
|
] "" append-outputs-as ;
|
|
|
|
|
2012-09-19 13:41:54 -04:00
|
|
|
: popcnt? ( -- ? )
|
|
|
|
bool { } cdecl [
|
|
|
|
return-reg 1 MOV
|
|
|
|
CPUID
|
|
|
|
return-reg dup XOR
|
|
|
|
ECX 23 BT
|
|
|
|
return-reg SETB
|
|
|
|
] alien-assembly ;
|
|
|
|
|
2012-09-19 13:12:25 -04:00
|
|
|
: tscdeadline? ( -- ? ) 1 cpuid third 24 bit? ;
|
|
|
|
: aes? ( -- ? ) 1 cpuid third 25 bit? ;
|
|
|
|
: xsave? ( -- ? ) 1 cpuid third 26 bit? ;
|
|
|
|
: osxsave? ( -- ? ) 1 cpuid third 27 bit? ;
|
|
|
|
: avx? ( -- ? ) 1 cpuid third 28 bit? ;
|
|
|
|
: f16c? ( -- ? ) 1 cpuid third 29 bit? ;
|
|
|
|
: rdrnd? ( -- ? ) 1 cpuid third 30 bit? ;
|
|
|
|
|
|
|
|
: msr? ( -- ? ) 1 cpuid fourth 5 bit? ;
|
|
|
|
: tm1? ( -- ? ) 1 cpuid fourth 29 bit? ;
|
|
|
|
: tm2? ( -- ? ) 1 cpuid third 8 bit? ;
|
2010-05-15 16:26:14 -04:00
|
|
|
|
2011-12-12 19:43:49 -05:00
|
|
|
MEMO: enable-popcnt? ( -- ? )
|
2012-09-18 20:14:31 -04:00
|
|
|
popcnt? "disable-popcnt" get not and ;
|
2011-12-12 19:43:49 -05:00
|
|
|
|
|
|
|
[ { sse-version enable-popcnt? } [ reset-memoized ] each ]
|
|
|
|
"cpu.x86.features" add-startup-hook
|
|
|
|
|
2009-09-03 04:28:38 -04:00
|
|
|
: sse-string ( version -- string )
|
|
|
|
{
|
|
|
|
{ 00 [ "no SSE" ] }
|
|
|
|
{ 10 [ "SSE1" ] }
|
|
|
|
{ 20 [ "SSE2" ] }
|
|
|
|
{ 30 [ "SSE3" ] }
|
|
|
|
{ 33 [ "SSSE3" ] }
|
|
|
|
{ 41 [ "SSE4.1" ] }
|
|
|
|
{ 42 [ "SSE4.2" ] }
|
|
|
|
} case ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
|
|
|
HOOK: instruction-count cpu ( -- n )
|
|
|
|
|
2010-01-06 23:39:22 -05:00
|
|
|
M: x86.32 instruction-count
|
2010-03-31 22:20:35 -04:00
|
|
|
longlong { } cdecl [
|
2010-01-06 23:39:22 -05:00
|
|
|
RDTSC
|
|
|
|
] alien-assembly ;
|
|
|
|
|
|
|
|
M: x86.64 instruction-count
|
2010-03-31 22:20:35 -04:00
|
|
|
longlong { } cdecl [
|
2010-01-06 23:39:22 -05:00
|
|
|
RAX 0 MOV
|
|
|
|
RDTSC
|
|
|
|
RDX 32 SHL
|
|
|
|
RAX RDX OR
|
|
|
|
] alien-assembly ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
|
|
|
: count-instructions ( quot -- n )
|
2010-01-06 23:39:22 -05:00
|
|
|
instruction-count [ call instruction-count ] dip - ; inline
|