2010-01-06 23:39:22 -05:00
|
|
|
! Copyright (C) 2009, 2010 Slava Pestov.
|
2009-05-31 16:02:14 -04:00
|
|
|
! See http://factorcode.org/license.txt for BSD license.
|
2015-08-16 00:37:33 -04:00
|
|
|
USING: alien alien.c-types alien.data arrays assocs combinators
|
2012-09-19 11:40:18 -04:00
|
|
|
compiler.codegen.labels cpu.architecture cpu.x86.assembler
|
|
|
|
cpu.x86.assembler.operands init kernel math math.order
|
|
|
|
math.parser memoize namespaces sequences
|
2012-09-19 13:12:25 -04:00
|
|
|
specialized-arrays system math.bitwise combinators.smart ;
|
2012-09-18 21:40:29 -04:00
|
|
|
SPECIALIZED-ARRAY: uint
|
2009-05-31 16:02:14 -04:00
|
|
|
IN: cpu.x86.features
|
|
|
|
|
|
|
|
<PRIVATE
|
|
|
|
|
2010-05-16 03:43:02 -04:00
|
|
|
: return-reg ( -- reg ) int-regs return-regs at first ;
|
|
|
|
|
2010-01-06 23:39:22 -05:00
|
|
|
: (sse-version) ( -- n )
|
2010-03-31 22:20:35 -04:00
|
|
|
int { } cdecl [
|
2010-01-06 23:39:22 -05:00
|
|
|
"sse-42" define-label
|
|
|
|
"sse-41" define-label
|
|
|
|
"ssse-3" define-label
|
|
|
|
"sse-3" define-label
|
|
|
|
"sse-2" define-label
|
|
|
|
"sse-1" define-label
|
|
|
|
"end" define-label
|
2009-05-31 16:02:14 -04:00
|
|
|
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 1 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
|
|
|
|
CPUID
|
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 20 BT
|
|
|
|
"sse-42" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 19 BT
|
|
|
|
"sse-41" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 9 BT
|
|
|
|
"ssse-3" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
ECX 0 BT
|
|
|
|
"sse-3" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
EDX 26 BT
|
|
|
|
"sse-2" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-15 16:26:14 -04:00
|
|
|
EDX 25 BT
|
|
|
|
"sse-1" get JB
|
2010-01-06 23:39:22 -05:00
|
|
|
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 0 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-42" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 42 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-41" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 41 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"ssse-3" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 33 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-3" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 30 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-2" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 20 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
"end" get JMP
|
|
|
|
|
|
|
|
"sse-1" resolve-label
|
2010-05-16 03:43:02 -04:00
|
|
|
return-reg 10 MOV
|
2010-01-06 23:39:22 -05:00
|
|
|
|
|
|
|
"end" resolve-label
|
|
|
|
] alien-assembly ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
|
|
|
PRIVATE>
|
|
|
|
|
2009-09-23 06:13:15 -04:00
|
|
|
MEMO: sse-version ( -- n )
|
2010-01-06 23:39:22 -05:00
|
|
|
(sse-version) "sse-version" get string>number [ min ] when* ;
|
2009-09-23 06:13:15 -04:00
|
|
|
|
|
|
|
: sse? ( -- ? ) sse-version 10 >= ;
|
|
|
|
: sse2? ( -- ? ) sse-version 20 >= ;
|
|
|
|
: sse3? ( -- ? ) sse-version 30 >= ;
|
|
|
|
: ssse3? ( -- ? ) sse-version 33 >= ;
|
|
|
|
: sse4.1? ( -- ? ) sse-version 41 >= ;
|
|
|
|
: sse4.2? ( -- ? ) sse-version 42 >= ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
2012-09-19 14:30:54 -04:00
|
|
|
HOOK: (cpuid) cpu ( rax rcx regs -- )
|
2012-09-18 21:40:29 -04:00
|
|
|
|
2012-09-19 14:30:54 -04:00
|
|
|
|
|
|
|
: cpuid-extended ( rax rcx -- 4array )
|
2015-08-16 00:37:33 -04:00
|
|
|
4 uint <c-array> [ (cpuid) ] keep >array ;
|
2012-09-18 21:40:29 -04:00
|
|
|
|
2012-09-19 14:30:54 -04:00
|
|
|
: cpuid ( rax -- 4array ) 0 cpuid-extended ;
|
|
|
|
|
2012-09-19 17:55:28 -04:00
|
|
|
: cpuid-processor-info ( -- eax ) 1 cpuid first ; inline
|
|
|
|
|
|
|
|
: parse-stepping ( eax -- n ) 3 0 bit-range ; inline
|
|
|
|
: parse-model ( eax -- n ) 7 4 bit-range ; inline
|
|
|
|
: parse-family ( eax -- n ) 11 8 bit-range ; inline
|
|
|
|
: parse-processor-type ( eax -- n ) 13 12 bit-range ; inline
|
|
|
|
: parse-extended-model ( eax -- n ) 19 16 bit-range ; inline
|
|
|
|
: parse-extended-family ( eax -- n ) 27 20 bit-range ; inline
|
|
|
|
|
|
|
|
: cpu-stepping ( -- n ) cpuid-processor-info parse-stepping ;
|
|
|
|
: cpu-model ( -- n ) cpuid-processor-info parse-model ;
|
|
|
|
: cpu-family ( -- n ) cpuid-processor-info parse-family ;
|
|
|
|
: cpu-processor-type ( -- n ) cpuid-processor-info parse-processor-type ;
|
|
|
|
: cpu-extended-model ( -- n ) cpuid-processor-info parse-extended-model ;
|
|
|
|
: cpu-extended-family ( -- n ) cpuid-processor-info parse-extended-family ;
|
2012-09-19 13:12:25 -04:00
|
|
|
|
|
|
|
: cpu-family-model-string ( -- string )
|
|
|
|
[
|
2012-09-19 17:55:28 -04:00
|
|
|
cpuid-processor-info {
|
|
|
|
[ parse-extended-family >hex ]
|
|
|
|
[ parse-family >hex ]
|
|
|
|
[ drop "_" ]
|
|
|
|
[ parse-extended-model >hex ]
|
|
|
|
[ parse-model >hex ]
|
|
|
|
} cleave
|
2012-09-19 13:12:25 -04:00
|
|
|
] "" append-outputs-as ;
|
|
|
|
|
2012-09-19 13:41:54 -04:00
|
|
|
: popcnt? ( -- ? )
|
|
|
|
bool { } cdecl [
|
|
|
|
return-reg 1 MOV
|
|
|
|
CPUID
|
|
|
|
return-reg dup XOR
|
|
|
|
ECX 23 BT
|
|
|
|
return-reg SETB
|
|
|
|
] alien-assembly ;
|
|
|
|
|
2012-09-19 13:12:25 -04:00
|
|
|
: tscdeadline? ( -- ? ) 1 cpuid third 24 bit? ;
|
|
|
|
: aes? ( -- ? ) 1 cpuid third 25 bit? ;
|
|
|
|
: xsave? ( -- ? ) 1 cpuid third 26 bit? ;
|
|
|
|
: osxsave? ( -- ? ) 1 cpuid third 27 bit? ;
|
|
|
|
: avx? ( -- ? ) 1 cpuid third 28 bit? ;
|
|
|
|
: f16c? ( -- ? ) 1 cpuid third 29 bit? ;
|
2012-09-20 15:03:10 -04:00
|
|
|
: rdrand? ( -- ? ) 1 cpuid third 30 bit? ;
|
2012-09-19 13:12:25 -04:00
|
|
|
|
|
|
|
: msr? ( -- ? ) 1 cpuid fourth 5 bit? ;
|
|
|
|
: tm1? ( -- ? ) 1 cpuid fourth 29 bit? ;
|
|
|
|
: tm2? ( -- ? ) 1 cpuid third 8 bit? ;
|
2010-05-15 16:26:14 -04:00
|
|
|
|
2012-09-20 14:54:44 -04:00
|
|
|
: rdrand8 ( -- x )
|
|
|
|
uchar { } cdecl [
|
|
|
|
AL RDRAND
|
|
|
|
] alien-assembly ;
|
|
|
|
|
|
|
|
: rdrand16 ( -- x )
|
|
|
|
ushort { } cdecl [
|
|
|
|
AX RDRAND
|
|
|
|
] alien-assembly ;
|
|
|
|
|
|
|
|
: rdrand32 ( -- x )
|
|
|
|
uint { } cdecl [
|
|
|
|
EAX RDRAND
|
|
|
|
] alien-assembly ;
|
|
|
|
|
|
|
|
: rdrand64 ( -- x )
|
|
|
|
ulonglong { } cdecl [
|
|
|
|
RAX RDRAND
|
|
|
|
] alien-assembly ;
|
|
|
|
|
2011-12-12 19:43:49 -05:00
|
|
|
MEMO: enable-popcnt? ( -- ? )
|
2012-09-18 20:14:31 -04:00
|
|
|
popcnt? "disable-popcnt" get not and ;
|
2011-12-12 19:43:49 -05:00
|
|
|
|
|
|
|
[ { sse-version enable-popcnt? } [ reset-memoized ] each ]
|
|
|
|
"cpu.x86.features" add-startup-hook
|
|
|
|
|
2009-09-03 04:28:38 -04:00
|
|
|
: sse-string ( version -- string )
|
|
|
|
{
|
|
|
|
{ 00 [ "no SSE" ] }
|
|
|
|
{ 10 [ "SSE1" ] }
|
|
|
|
{ 20 [ "SSE2" ] }
|
|
|
|
{ 30 [ "SSE3" ] }
|
|
|
|
{ 33 [ "SSSE3" ] }
|
|
|
|
{ 41 [ "SSE4.1" ] }
|
|
|
|
{ 42 [ "SSE4.2" ] }
|
|
|
|
} case ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
|
|
|
HOOK: instruction-count cpu ( -- n )
|
|
|
|
|
2010-01-06 23:39:22 -05:00
|
|
|
M: x86.32 instruction-count
|
2010-03-31 22:20:35 -04:00
|
|
|
longlong { } cdecl [
|
2010-01-06 23:39:22 -05:00
|
|
|
RDTSC
|
|
|
|
] alien-assembly ;
|
|
|
|
|
|
|
|
M: x86.64 instruction-count
|
2010-03-31 22:20:35 -04:00
|
|
|
longlong { } cdecl [
|
2010-01-06 23:39:22 -05:00
|
|
|
RAX 0 MOV
|
|
|
|
RDTSC
|
|
|
|
RDX 32 SHL
|
|
|
|
RAX RDX OR
|
|
|
|
] alien-assembly ;
|
2009-05-31 16:02:14 -04:00
|
|
|
|
|
|
|
: count-instructions ( quot -- n )
|
2010-01-06 23:39:22 -05:00
|
|
|
instruction-count [ call instruction-count ] dip - ; inline
|