198 lines
		
	
	
		
			4.8 KiB
		
	
	
	
		
			Factor
		
	
	
			
		
		
	
	
			198 lines
		
	
	
		
			4.8 KiB
		
	
	
	
		
			Factor
		
	
	
! Copyright (C) 2009, 2010 Slava Pestov.
 | 
						|
! See http://factorcode.org/license.txt for BSD license.
 | 
						|
USING: alien alien.c-types arrays assocs combinators
 | 
						|
compiler.codegen.labels cpu.architecture cpu.x86.assembler
 | 
						|
cpu.x86.assembler.operands init kernel math math.order
 | 
						|
math.parser memoize namespaces sequences
 | 
						|
specialized-arrays system math.bitwise combinators.smart ;
 | 
						|
SPECIALIZED-ARRAY: uint
 | 
						|
IN: cpu.x86.features
 | 
						|
 | 
						|
<PRIVATE
 | 
						|
 | 
						|
: return-reg ( -- reg ) int-regs return-regs at first ;
 | 
						|
 | 
						|
: (sse-version) ( -- n )
 | 
						|
    int { } cdecl [
 | 
						|
        "sse-42" define-label
 | 
						|
        "sse-41" define-label
 | 
						|
        "ssse-3" define-label
 | 
						|
        "sse-3" define-label
 | 
						|
        "sse-2" define-label
 | 
						|
        "sse-1" define-label
 | 
						|
        "end" define-label
 | 
						|
 | 
						|
        return-reg 1 MOV
 | 
						|
 | 
						|
        CPUID
 | 
						|
 | 
						|
        ECX 20 BT
 | 
						|
        "sse-42" get JB
 | 
						|
 | 
						|
        ECX 19 BT
 | 
						|
        "sse-41" get JB
 | 
						|
 | 
						|
        ECX  9 BT
 | 
						|
        "ssse-3" get JB
 | 
						|
 | 
						|
        ECX  0 BT
 | 
						|
        "sse-3" get JB
 | 
						|
 | 
						|
        EDX 26 BT
 | 
						|
        "sse-2" get JB
 | 
						|
 | 
						|
        EDX 25 BT
 | 
						|
        "sse-1" get JB
 | 
						|
 | 
						|
        return-reg 0 MOV
 | 
						|
        "end" get JMP
 | 
						|
 | 
						|
        "sse-42" resolve-label
 | 
						|
        return-reg 42 MOV
 | 
						|
        "end" get JMP
 | 
						|
 | 
						|
        "sse-41" resolve-label
 | 
						|
        return-reg 41 MOV
 | 
						|
        "end" get JMP
 | 
						|
 | 
						|
        "ssse-3" resolve-label
 | 
						|
        return-reg 33 MOV
 | 
						|
        "end" get JMP
 | 
						|
 | 
						|
        "sse-3" resolve-label
 | 
						|
        return-reg 30 MOV
 | 
						|
        "end" get JMP
 | 
						|
 | 
						|
        "sse-2" resolve-label
 | 
						|
        return-reg 20 MOV
 | 
						|
        "end" get JMP
 | 
						|
 | 
						|
        "sse-1" resolve-label
 | 
						|
        return-reg 10 MOV
 | 
						|
 | 
						|
        "end" resolve-label
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
PRIVATE>
 | 
						|
 | 
						|
MEMO: sse-version ( -- n )
 | 
						|
    (sse-version) "sse-version" get string>number [ min ] when* ;
 | 
						|
 | 
						|
: sse? ( -- ? ) sse-version 10 >= ;
 | 
						|
: sse2? ( -- ? ) sse-version 20 >= ;
 | 
						|
: sse3? ( -- ? ) sse-version 30 >= ;
 | 
						|
: ssse3? ( -- ? ) sse-version 33 >= ;
 | 
						|
: sse4.1? ( -- ? ) sse-version 41 >= ;
 | 
						|
: sse4.2? ( -- ? ) sse-version 42 >= ;
 | 
						|
 | 
						|
HOOK: (cpuid) cpu ( rax rcx regs -- )
 | 
						|
 | 
						|
 | 
						|
: cpuid-extended ( rax rcx -- 4array )
 | 
						|
   4 <uint-array> [ (cpuid) ] keep >array ;
 | 
						|
 | 
						|
: cpuid ( rax -- 4array ) 0 cpuid-extended ;
 | 
						|
 | 
						|
: cpuid-processor-info ( -- eax ) 1 cpuid first ; inline
 | 
						|
 | 
						|
: parse-stepping ( eax -- n ) 3 0 bit-range ; inline
 | 
						|
: parse-model ( eax -- n ) 7 4 bit-range ; inline
 | 
						|
: parse-family ( eax -- n ) 11 8 bit-range ; inline
 | 
						|
: parse-processor-type ( eax -- n ) 13 12 bit-range ; inline
 | 
						|
: parse-extended-model ( eax -- n ) 19 16 bit-range ; inline
 | 
						|
: parse-extended-family ( eax -- n ) 27 20 bit-range ; inline
 | 
						|
 | 
						|
: cpu-stepping ( -- n ) cpuid-processor-info parse-stepping ;
 | 
						|
: cpu-model ( -- n ) cpuid-processor-info parse-model ;
 | 
						|
: cpu-family ( -- n ) cpuid-processor-info parse-family ;
 | 
						|
: cpu-processor-type ( -- n ) cpuid-processor-info parse-processor-type ;
 | 
						|
: cpu-extended-model ( -- n ) cpuid-processor-info parse-extended-model ;
 | 
						|
: cpu-extended-family ( -- n ) cpuid-processor-info parse-extended-family ;
 | 
						|
 | 
						|
: cpu-family-model-string ( -- string )
 | 
						|
    [
 | 
						|
        cpuid-processor-info {
 | 
						|
            [ parse-extended-family >hex ]
 | 
						|
            [ parse-family >hex ]
 | 
						|
            [ drop "_" ]
 | 
						|
            [ parse-extended-model >hex ]
 | 
						|
            [ parse-model >hex ]
 | 
						|
        } cleave
 | 
						|
    ] "" append-outputs-as ;
 | 
						|
 | 
						|
: popcnt? ( -- ? )
 | 
						|
    bool { } cdecl [
 | 
						|
        return-reg 1 MOV
 | 
						|
        CPUID
 | 
						|
        return-reg dup XOR
 | 
						|
        ECX 23 BT
 | 
						|
        return-reg SETB
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
: tscdeadline? ( -- ? ) 1 cpuid third 24 bit? ;
 | 
						|
: aes? ( -- ? ) 1 cpuid third 25 bit? ;
 | 
						|
: xsave? ( -- ? ) 1 cpuid third 26 bit? ;
 | 
						|
: osxsave? ( -- ? ) 1 cpuid third 27 bit? ;
 | 
						|
: avx? ( -- ? ) 1 cpuid third 28 bit? ;
 | 
						|
: f16c? ( -- ? ) 1 cpuid third 29 bit? ;
 | 
						|
: rdrand? ( -- ? ) 1 cpuid third 30 bit? ;
 | 
						|
 | 
						|
: msr? ( -- ? ) 1 cpuid fourth 5 bit? ;
 | 
						|
: tm1? ( -- ? ) 1 cpuid fourth 29 bit? ;
 | 
						|
: tm2? ( -- ? ) 1 cpuid third 8 bit? ;
 | 
						|
 | 
						|
: rdrand8 ( -- x )
 | 
						|
    uchar { } cdecl [
 | 
						|
        AL RDRAND
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
: rdrand16 ( -- x )
 | 
						|
    ushort { } cdecl [
 | 
						|
        AX RDRAND
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
: rdrand32 ( -- x )
 | 
						|
    uint { } cdecl [
 | 
						|
        EAX RDRAND
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
: rdrand64 ( -- x )
 | 
						|
    ulonglong { } cdecl [
 | 
						|
        RAX RDRAND
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
MEMO: enable-popcnt? ( -- ? )
 | 
						|
    popcnt? "disable-popcnt" get not and ;
 | 
						|
 | 
						|
[ { sse-version enable-popcnt? } [ reset-memoized ] each ]
 | 
						|
"cpu.x86.features" add-startup-hook
 | 
						|
 | 
						|
: sse-string ( version -- string )
 | 
						|
    {
 | 
						|
        { 00 [ "no SSE" ] }
 | 
						|
        { 10 [ "SSE1" ] }
 | 
						|
        { 20 [ "SSE2" ] }
 | 
						|
        { 30 [ "SSE3" ] }
 | 
						|
        { 33 [ "SSSE3" ] }
 | 
						|
        { 41 [ "SSE4.1" ] }
 | 
						|
        { 42 [ "SSE4.2" ] }
 | 
						|
    } case ;
 | 
						|
 | 
						|
HOOK: instruction-count cpu ( -- n )
 | 
						|
 | 
						|
M: x86.32 instruction-count
 | 
						|
    longlong { } cdecl [
 | 
						|
        RDTSC
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
M: x86.64 instruction-count
 | 
						|
    longlong { } cdecl [
 | 
						|
        RAX 0 MOV
 | 
						|
        RDTSC
 | 
						|
        RDX 32 SHL
 | 
						|
        RAX RDX OR
 | 
						|
    ] alien-assembly ;
 | 
						|
 | 
						|
: count-instructions ( quot -- n )
 | 
						|
    instruction-count [ call instruction-count ] dip - ; inline
 |