From d655c3c9cca88d9cd952082c9ae24d7e2bfa8b38 Mon Sep 17 00:00:00 2001
From: Joe Groff
Date: Tue, 3 Nov 2009 21:38:29 -0600
Subject: [PATCH] make horizontal shift available to float vectors (it'd still be faster than the software fallback despite pipeline penalty)

---
 basis/cpu/x86/x86.factor | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/basis/cpu/x86/x86.factor b/basis/cpu/x86/x86.factor
index 53c9c98ed3..b0a5dc0897 100644
--- a/basis/cpu/x86/x86.factor
+++ b/basis/cpu/x86/x86.factor
@@ -1166,7 +1166,7 @@ M: x86 %horizontal-shl-vector-imm ( dst src1 src2 rep -- )
 
 M: x86 %horizontal-shl-vector-imm-reps
     {
-        { sse2? { char-16-rep uchar-16-rep short-8-rep ushort-8-rep int-4-rep uint-4-rep longlong-2-rep ulonglong-2-rep } }
+        { sse2? { char-16-rep uchar-16-rep short-8-rep ushort-8-rep int-4-rep uint-4-rep longlong-2-rep ulonglong-2-rep float-4-rep double-2-rep } }
     } available-reps ;
 
 M: x86 %horizontal-shr-vector-imm ( dst src1 src2 rep -- )
@@ -1174,7 +1174,7 @@ M: x86 %horizontal-shr-vector-imm ( dst src1 src2 rep -- )
 
 M: x86 %horizontal-shr-vector-imm-reps
     {
-        { sse2? { char-16-rep uchar-16-rep short-8-rep ushort-8-rep int-4-rep uint-4-rep longlong-2-rep ulonglong-2-rep } }
+        { sse2? { char-16-rep uchar-16-rep short-8-rep ushort-8-rep int-4-rep uint-4-rep longlong-2-rep ulonglong-2-rep float-4-rep double-2-rep } }
     } available-reps ;
 
 M: x86 %abs-vector ( dst src rep -- )