math.vectors.simd: add v<< and v>> intrinsics for bitwise shifts on elements

author Slava Pestov <slava@slava-pestovs-macbook-pro.local>

Thu, 24 Sep 2009 08:32:39 +0000 (03:32 -0500)

committer Slava Pestov <slava@slava-pestovs-macbook-pro.local>

Thu, 24 Sep 2009 08:32:39 +0000 (03:32 -0500)
author Slava Pestov <slava@slava-pestovs-macbook-pro.local>
Thu, 24 Sep 2009 08:32:39 +0000 (03:32 -0500)
committer Slava Pestov <slava@slava-pestovs-macbook-pro.local>
Thu, 24 Sep 2009 08:32:39 +0000 (03:32 -0500)
diff --git a/basis/compiler/cfg/instructions/instructions.factor b/basis/compiler/cfg/instructions/instructions.factor

index 874093ed40f371a25997a80ca0a8fa0cef46b121..c366682092d7bf2c8510aba2192a6e7c00246563 100644 (file)
--- a/basis/compiler/cfg/instructions/instructions.factor
+++ b/basis/compiler/cfg/instructions/instructions.factor
@@ -380,6 +380,27 @@ def: dst
  use: src1 src2
  literal: rep ;
  
+PURE-INSN: ##shl-vector
+def: dst
+use: src1 src2/scalar-rep
+literal: rep ;
+
+PURE-INSN: ##shr-vector
+def: dst
+use: src1 src2/scalar-rep
+literal: rep ;
+
+! Scalar/integer conversion
+PURE-INSN: ##scalar>integer
+def: dst/int-rep
+use: src
+literal: rep ;
+
+PURE-INSN: ##integer>scalar
+def: dst
+use: src/int-rep
+literal: rep ;
+
  ! Boxing and unboxing aliens
  PURE-INSN: ##box-alien
  def: dst/int-rep
diff --git a/basis/compiler/cfg/intrinsics/intrinsics.factor b/basis/compiler/cfg/intrinsics/intrinsics.factor

index d2f158f06d0c603bad463abba570ff923d12b8c3..98f5ed9a85b07079ddbf7dd9cbf4f603ed578350 100644 (file)
--- a/basis/compiler/cfg/intrinsics/intrinsics.factor
+++ b/basis/compiler/cfg/intrinsics/intrinsics.factor
@@ -169,6 +169,8 @@ IN: compiler.cfg.intrinsics
          { math.vectors.simd.intrinsics:(simd-vbitand) [ [ ^^and-vector ] emit-binary-vector-op ] }
          { math.vectors.simd.intrinsics:(simd-vbitor) [ [ ^^or-vector ] emit-binary-vector-op ] }
          { math.vectors.simd.intrinsics:(simd-vbitxor) [ [ ^^xor-vector ] emit-binary-vector-op ] }
+        { math.vectors.simd.intrinsics:(simd-v<<) [ [ ^^shl-vector ] emit-binary-vector-op ] }
+        { math.vectors.simd.intrinsics:(simd-v>>) [ [ ^^shr-vector ] emit-binary-vector-op ] }
          { math.vectors.simd.intrinsics:(simd-broadcast) [ [ ^^broadcast-vector ] emit-unary-vector-op ] }
          { math.vectors.simd.intrinsics:(simd-gather-2) [ emit-gather-vector-2 ] }
          { math.vectors.simd.intrinsics:(simd-gather-4) [ emit-gather-vector-4 ] }
diff --git a/basis/compiler/cfg/representations/preferred/preferred.factor b/basis/compiler/cfg/representations/preferred/preferred.factor

index 389b78c33362d4f6880ba5359d5c70f7d6ad5a20..4444290f057ece86c2a2c0a43ee2899c209e2b8e 100644 (file)
--- a/basis/compiler/cfg/representations/preferred/preferred.factor
+++ b/basis/compiler/cfg/representations/preferred/preferred.factor
@@ -3,8 +3,8 @@
  USING: kernel accessors sequences arrays fry namespaces generic
  words sets combinators generalizations cpu.architecture compiler.units
  compiler.cfg.utilities compiler.cfg compiler.cfg.rpo
-compiler.cfg.instructions compiler.cfg.instructions.syntax
-compiler.cfg.def-use ;
+compiler.cfg.instructions compiler.cfg.def-use ;
+FROM: compiler.cfg.instructions.syntax => insn-def-slot insn-use-slots insn-temp-slots scalar-rep ;
  IN: compiler.cfg.representations.preferred
  
  GENERIC: defs-vreg-rep ( insn -- rep/f )
diff --git a/basis/compiler/cfg/representations/representations.factor b/basis/compiler/cfg/representations/representations.factor

index ec2856f6476569d652288ef95a80cfc0e5b8353b..d9c2eab6c3369f31c08764d1d626fefbd305ed55 100644 (file)
--- a/basis/compiler/cfg/representations/representations.factor
+++ b/basis/compiler/cfg/representations/representations.factor
@@ -1,7 +1,7 @@
  ! Copyright (C) 2009 Slava Pestov
  ! See http://factorcode.org/license.txt for BSD license.
  USING: kernel fry accessors sequences assocs sets namespaces
-arrays combinators make locals deques dlists
+arrays combinators make locals deques dlists layouts
  cpu.architecture compiler.utilities
  compiler.cfg
  compiler.cfg.rpo
@@ -22,19 +22,18 @@ ERROR: bad-conversion dst src dst-rep src-rep ;
  GENERIC: emit-box ( dst src rep -- )
  GENERIC: emit-unbox ( dst src rep -- )
  
-M: float-rep emit-box
-    drop
-    [ double-rep next-vreg-rep dup ] dip ##single>double-float
-    int-rep next-vreg-rep ##box-float ;
+M:: float-rep emit-box ( dst src rep -- )
+    double-rep next-vreg-rep :> temp
+    temp src ##single>double-float
+    dst temp int-rep next-vreg-rep ##box-float ;
  
-M: float-rep emit-unbox
-    drop
-    [ double-rep next-vreg-rep dup ] dip ##unbox-float
-    ##double>single-float ;
+M:: float-rep emit-unbox ( dst src rep -- )
+    double-rep next-vreg-rep :> temp
+    temp src ##unbox-float
+    dst temp ##double>single-float ;
  
  M: double-rep emit-box
-    drop
-    int-rep next-vreg-rep ##box-float ;
+    drop int-rep next-vreg-rep ##box-float ;
  
  M: double-rep emit-unbox
      drop ##unbox-float ;
@@ -45,6 +44,16 @@ M: vector-rep emit-box
  M: vector-rep emit-unbox
      ##unbox-vector ;
  
+M:: scalar-rep emit-box ( dst src rep -- )
+    int-rep next-vreg-rep :> temp
+    temp src rep ##scalar>integer
+    dst temp tag-bits get ##shl-imm ;
+
+M:: scalar-rep emit-unbox ( dst src rep -- )
+    int-rep next-vreg-rep :> temp
+    temp src tag-bits get ##sar-imm
+    dst temp rep ##integer>scalar ;
+
  : emit-conversion ( dst src dst-rep src-rep -- )
      {
          { [ 2dup eq? ] [ drop ##copy ] }
diff --git a/basis/compiler/cfg/two-operand/two-operand.factor b/basis/compiler/cfg/two-operand/two-operand.factor

index 45d248f8f4c020059dbf6efcca7218e4be609b57..4434e0b7b851594f61d048516117221c08b644b0 100644 (file)
--- a/basis/compiler/cfg/two-operand/two-operand.factor
+++ b/basis/compiler/cfg/two-operand/two-operand.factor
@@ -58,7 +58,9 @@ UNION: two-operand-insn
      ##max-vector
      ##and-vector
      ##or-vector
-    ##xor-vector ;
+    ##xor-vector
+    ##shl-vector
+    ##shr-vector ;
  
  GENERIC: convert-two-operand* ( insn -- )
  
diff --git a/basis/compiler/codegen/codegen.factor b/basis/compiler/codegen/codegen.factor

index 43d11b5d4fe4550142b27f3a772e608fb458452b..bff640d93b6c6320a2ee1d5ed6a90754ee6c8799 100755 (executable)
--- a/basis/compiler/codegen/codegen.factor
+++ b/basis/compiler/codegen/codegen.factor
@@ -184,6 +184,10 @@ CODEGEN: ##abs-vector %abs-vector
  CODEGEN: ##and-vector %and-vector
  CODEGEN: ##or-vector %or-vector
  CODEGEN: ##xor-vector %xor-vector
+CODEGEN: ##shl-vector %shl-vector
+CODEGEN: ##shr-vector %shr-vector
+CODEGEN: ##integer>scalar %integer>scalar
+CODEGEN: ##scalar>integer %scalar>integer
  CODEGEN: ##box-alien %box-alien
  CODEGEN: ##box-displaced-alien %box-displaced-alien
  CODEGEN: ##unbox-alien %unbox-alien
diff --git a/basis/compiler/tree/propagation/simd/simd.factor b/basis/compiler/tree/propagation/simd/simd.factor

index fadb382398eac557fde5e72cd29cbfe07060e74f..c0651d106b34d63c8bf496cd65cc5c595712e9c3 100644 (file)
--- a/basis/compiler/tree/propagation/simd/simd.factor
+++ b/basis/compiler/tree/propagation/simd/simd.factor
@@ -19,6 +19,8 @@ IN: compiler.tree.propagation.simd
      (simd-vbitand)
      (simd-vbitor)
      (simd-vbitxor)
+    (simd-v<<)
+    (simd-v>>)
      (simd-broadcast)
      (simd-gather-2)
      (simd-gather-4)
@@ -30,7 +32,7 @@ IN: compiler.tree.propagation.simd
          literal>> scalar-rep-of {
              { float-rep [ float ] }
              { double-rep [ float ] }
-            { int-rep [ integer ] }
+            [ integer ]
          } case
      ] [ drop real ] if
      <class-info>
diff --git a/basis/cpu/architecture/architecture.factor b/basis/cpu/architecture/architecture.factor

index dd817117b6b3e7c6564106b95f622db66114a347..3c5abf668aaa63edd6922f983cf0da5f2d42173d 100644 (file)
--- a/basis/cpu/architecture/architecture.factor
+++ b/basis/cpu/architecture/architecture.factor
@@ -31,6 +31,17 @@ uint-4-rep
  longlong-2-rep
  ulonglong-2-rep ;
  
+! Scalar values in the high component of a vector register
+SINGLETONS:
+char-scalar-rep
+uchar-scalar-rep
+short-scalar-rep
+ushort-scalar-rep
+int-scalar-rep
+uint-scalar-rep
+longlong-scalar-rep
+ulonglong-scalar-rep ;
+
  SINGLETONS:
  float-4-rep
  double-2-rep ;
@@ -45,6 +56,16 @@ uint-4-rep
  longlong-2-rep
  ulonglong-2-rep ;
  
+UNION: scalar-rep
+char-scalar-rep
+uchar-scalar-rep
+short-scalar-rep
+ushort-scalar-rep
+int-scalar-rep
+uint-scalar-rep
+longlong-scalar-rep
+ulonglong-scalar-rep ;
+
  UNION: float-vector-rep
  float-4-rep
  double-2-rep ;
@@ -59,7 +80,8 @@ tagged-rep
  int-rep
  float-rep
  double-rep
-vector-rep ;
+vector-rep
+scalar-rep ;
  
  ! Register classes
  SINGLETONS: int-regs float-regs ;
@@ -70,13 +92,18 @@ CONSTANT: reg-classes { int-regs float-regs }
  ! A pseudo-register class for parameters spilled on the stack
  SINGLETON: stack-params
  
+! On x86, vectors and floats are stored in the same register bank
+! On PowerPC they are distinct
+HOOK: vector-regs cpu ( -- reg-class )
+
  GENERIC: reg-class-of ( rep -- reg-class )
  
  M: tagged-rep reg-class-of drop int-regs ;
  M: int-rep reg-class-of drop int-regs ;
  M: float-rep reg-class-of drop float-regs ;
  M: double-rep reg-class-of drop float-regs ;
-M: vector-rep reg-class-of drop float-regs ;
+M: vector-rep reg-class-of drop vector-regs ;
+M: scalar-rep reg-class-of drop vector-regs ;
  M: stack-params reg-class-of drop stack-params ;
  
  GENERIC: rep-size ( rep -- n ) foldable
@@ -96,7 +123,14 @@ GENERIC: scalar-rep-of ( rep -- rep' )
  
  M: float-4-rep scalar-rep-of drop float-rep ;
  M: double-2-rep scalar-rep-of drop double-rep ;
-M: int-vector-rep scalar-rep-of drop int-rep ;
+M: char-16-rep scalar-rep-of drop char-scalar-rep ;
+M: uchar-16-rep scalar-rep-of drop uchar-scalar-rep ;
+M: short-8-rep scalar-rep-of drop short-scalar-rep ;
+M: ushort-8-rep scalar-rep-of drop ushort-scalar-rep ;
+M: int-4-rep scalar-rep-of drop int-scalar-rep ;
+M: uint-4-rep scalar-rep-of drop uint-scalar-rep ;
+M: longlong-2-rep scalar-rep-of drop longlong-scalar-rep ;
+M: ulonglong-2-rep scalar-rep-of drop ulonglong-scalar-rep ;
  
  ! Mapping from register class to machine registers
  HOOK: machine-registers cpu ( -- assoc )
@@ -200,6 +234,11 @@ HOOK: %abs-vector cpu ( dst src rep -- )
  HOOK: %and-vector cpu ( dst src1 src2 rep -- )
  HOOK: %or-vector cpu ( dst src1 src2 rep -- )
  HOOK: %xor-vector cpu ( dst src1 src2 rep -- )
+HOOK: %shl-vector cpu ( dst src1 src2 rep -- )
+HOOK: %shr-vector cpu ( dst src1 src2 rep -- )
+
+HOOK: %integer>scalar cpu ( dst src rep -- )
+HOOK: %scalar>integer cpu ( dst src rep -- )
  
  HOOK: %broadcast-vector-reps cpu ( -- reps )
  HOOK: %gather-vector-2-reps cpu ( -- reps )
@@ -220,6 +259,8 @@ HOOK: %abs-vector-reps cpu ( -- reps )
  HOOK: %and-vector-reps cpu ( -- reps )
  HOOK: %or-vector-reps cpu ( -- reps )
  HOOK: %xor-vector-reps cpu ( -- reps )
+HOOK: %shl-vector-reps cpu ( -- reps )
+HOOK: %shr-vector-reps cpu ( -- reps )
  
  HOOK: %unbox-alien cpu ( dst src -- )
  HOOK: %unbox-any-c-ptr cpu ( dst src temp -- )
diff --git a/basis/cpu/x86/x86.factor b/basis/cpu/x86/x86.factor

index 5bed068a7a6cf67d8755dc275b94991055699f49..07234ff83caa1b477e3d56d81a501c02adf29fd8 100644 (file)
--- a/basis/cpu/x86/x86.factor
+++ b/basis/cpu/x86/x86.factor
@@ -22,6 +22,8 @@ M: label JUMPcc [ 0 ] dip JUMPcc rc-relative label-fixup ;
  
  M: x86 two-operand? t ;
  
+M: x86 vector-regs float-regs ;
+
  HOOK: stack-reg cpu ( -- reg )
  
  HOOK: reserved-area-size cpu ( -- n )
@@ -523,6 +525,39 @@ M: x86 %xor-vector-reps
          { sse2? { double-2-rep char-16-rep uchar-16-rep short-8-rep ushort-8-rep int-4-rep uint-4-rep longlong-2-rep ulonglong-2-rep } }
      } available-reps ;
  
+M: x86 %shl-vector ( dst src1 src2 rep -- )
+    {
+        { short-8-rep [ PSLLW ] }
+        { ushort-8-rep [ PSLLW ] }
+        { int-4-rep [ PSLLD ] }
+        { uint-4-rep [ PSLLD ] }
+        { longlong-2-rep [ PSLLQ ] }
+        { ulonglong-2-rep [ PSLLQ ] }
+    } case drop ;
+
+M: x86 %shl-vector-reps
+    {
+        { sse2? { short-8-rep ushort-8-rep int-4-rep uint-4-rep longlong-2-rep ulonglong-2-rep } }
+    } available-reps ;
+
+M: x86 %shr-vector ( dst src1 src2 rep -- )
+    {
+        { short-8-rep [ PSRAW ] }
+        { ushort-8-rep [ PSRLW ] }
+        { int-4-rep [ PSRAD ] }
+        { uint-4-rep [ PSRLD ] }
+        { ulonglong-2-rep [ PSRLQ ] }
+    } case drop ;
+
+M: x86 %shr-vector-reps
+    {
+        { sse2? { short-8-rep ushort-8-rep int-4-rep uint-4-rep ulonglong-2-rep } }
+    } available-reps ;
+
+M: x86 %integer>scalar drop MOVD ;
+
+M: x86 %scalar>integer drop MOVD ;
+
  M: x86 %unbox-alien ( dst src -- )
      alien-offset [+] MOV ;
  
diff --git a/basis/math/vectors/simd/functor/functor.factor b/basis/math/vectors/simd/functor/functor.factor

index e934a641c49ea4e67b39ffe65e33fd0430fb713f..c76ed573d5ef218d29f0e21406ed0dd094f9e4b7 100644 (file)
--- a/basis/math/vectors/simd/functor/functor.factor
+++ b/basis/math/vectors/simd/functor/functor.factor
@@ -78,12 +78,13 @@ ERROR: bad-schema schema ;
          } append
      ] when ;
  
-:: simd-vector-words ( class ctor rep vv->v v->v v->n -- )
+:: simd-vector-words ( class ctor rep vv->v vn->v v->v v->n -- )
      rep rep-component-type c-type-boxed-class :> elt-class
      class
      elt-class
      {
          { { +vector+ +vector+ -> +vector+ } vv->v }
+        { { +vector+ +scalar+ -> +vector+ } vn->v }
          { { +vector+ -> +vector+ } v->v }
          { { +vector+ -> +scalar+ } v->n }
          { { +vector+ -> +nonnegative+ } v->n }
@@ -118,6 +119,7 @@ SET-NTH      [ T dup c-setter array-accessor ]
  
  A-rep        [ A name>> "-rep" append "cpu.architecture" lookup ]
  A-vv->v-op   DEFINES-PRIVATE ${A}-vv->v-op
+A-vn->v-op   DEFINES-PRIVATE ${A}-vn->v-op
  A-v->v-op    DEFINES-PRIVATE ${A}-v->v-op
  A-v->n-op    DEFINES-PRIVATE ${A}-v->n-op
  
@@ -175,13 +177,16 @@ INSTANCE: A sequence
  : A-vv->v-op ( v1 v2 quot -- v3 )
      [ [ underlying>> ] bi@ A-rep ] dip call \ A boa ; inline
  
+: A-vn->v-op ( v1 v2 quot -- v3 )
+    [ [ underlying>> ] dip A-rep ] dip call \ A boa ; inline
+
  : A-v->v-op ( v1 quot -- v2 )
      [ underlying>> A-rep ] dip call \ A boa ; inline
  
  : A-v->n-op ( v quot -- n )
      [ underlying>> A-rep ] dip call ; inline
  
-\ A \ A-with \ A-rep \ A-vv->v-op \ A-v->v-op \ A-v->n-op simd-vector-words
+\ A \ A-with \ A-rep \ A-vv->v-op \ A-vn->v-op \ A-v->v-op \ A-v->n-op simd-vector-words
  \ A \ A-rep define-simd-128-type
  
  PRIVATE>
@@ -230,6 +235,7 @@ A-deref      DEFINES-PRIVATE ${A}-deref
  
  A-rep        [ A/2 name>> "-rep" append "cpu.architecture" lookup ]
  A-vv->v-op   DEFINES-PRIVATE ${A}-vv->v-op
+A-vn->v-op   DEFINES-PRIVATE ${A}-vn->v-op
  A-v->v-op    DEFINES-PRIVATE ${A}-v->v-op
  A-v->n-op    DEFINES-PRIVATE ${A}-v->n-op
  
@@ -296,6 +302,11 @@ INSTANCE: A sequence
      [ [ [ underlying2>> ] bi@ A-rep ] dip call ] 3bi
      \ A boa ; inline
  
+: A-vn->v-op ( v1 v2 quot -- v3 )
+    [ [ [ underlying1>> ] dip A-rep ] dip call ]
+    [ [ [ underlying2>> ] dip A-rep ] dip call ] 3bi
+    \ A boa ; inline
+
  : A-v->v-op ( v1 combine-quot -- v2 )
      [ [ underlying1>> A-rep ] dip call ]
      [ [ underlying2>> A-rep ] dip call ] 2bi
@@ -304,7 +315,7 @@ INSTANCE: A sequence
  : A-v->n-op ( v1 combine-quot -- v2 )
      [ [ underlying1>> ] [ underlying2>> ] bi A-rep (simd-v+) A-rep ] dip call ; inline
  
-\ A \ A-with \ A-rep \ A-vv->v-op \ A-v->v-op \ A-v->n-op simd-vector-words
+\ A \ A-with \ A-rep \ A-vv->v-op \ A-vn->v-op \ A-v->v-op \ A-v->n-op simd-vector-words
  \ A \ A-rep define-simd-256-type
  
  ;FUNCTOR
diff --git a/basis/math/vectors/simd/intrinsics/intrinsics.factor b/basis/math/vectors/simd/intrinsics/intrinsics.factor

index 2c1f76cfe1f08c10815f716177a02764c7cf5bae..2dc034551c685cf8838c3d3579ba44a3428aefc9 100644 (file)
--- a/basis/math/vectors/simd/intrinsics/intrinsics.factor
+++ b/basis/math/vectors/simd/intrinsics/intrinsics.factor
@@ -42,6 +42,8 @@ SIMD-OP: vabs
  SIMD-OP: vbitand
  SIMD-OP: vbitor
  SIMD-OP: vbitxor
+SIMD-OP: v<<
+SIMD-OP: v>>
  
  : (simd-broadcast) ( x rep -- v ) bad-simd-call ;
  : (simd-gather-2) ( a b rep -- v ) bad-simd-call ;
@@ -110,6 +112,8 @@ M: vector-rep supported-simd-op?
          { \ (simd-vbitand)   [ %and-vector-reps            ] }
          { \ (simd-vbitor)    [ %or-vector-reps             ] }
          { \ (simd-vbitxor)   [ %xor-vector-reps            ] }
+        { \ (simd-v<<)       [ %shl-vector-reps            ] }
+        { \ (simd-v>>)       [ %shr-vector-reps            ] }
          { \ (simd-broadcast) [ %broadcast-vector-reps      ] }
          { \ (simd-gather-2)  [ %gather-vector-2-reps       ] }
          { \ (simd-gather-4)  [ %gather-vector-4-reps       ] }
diff --git a/basis/math/vectors/simd/simd-tests.factor b/basis/math/vectors/simd/simd-tests.factor

index 312dfc2cbd1f58fda74765e5bb31a3219915dadd..284aa3a9aefd3987e28d65477c80042473bbe7cb 100644 (file)
--- a/basis/math/vectors/simd/simd-tests.factor
+++ b/basis/math/vectors/simd/simd-tests.factor
@@ -141,9 +141,12 @@ CONSTANT: simd-classes
  : remove-float-words ( alist -- alist' )
      [ drop { vsqrt n/v v/n v/ normalize } member? not ] assoc-filter ;
  
+: remove-integer-words ( alist -- alist' )
+    [ drop { v<< v>> } member? not ] assoc-filter ;
+
  : ops-to-check ( elt-class -- alist )
      [ vector-words >alist ] dip
-    float = [ remove-float-words ] unless ;
+    float = [ remove-integer-words ] [ remove-float-words ] if ;
  
  : check-vector-ops ( class elt-class compare-quot -- )
      [
@@ -168,7 +171,7 @@ CONSTANT: simd-classes
      simd-classes [
          {
              { [ dup name>> "float" head? ] [ float [ approx= ] ] }
-            { [ dup name>> "double" tail? ] [ float [ = ] ] }
+            { [ dup name>> "double" head? ] [ float [ = ] ] }
              [ fixnum [ = ] ]
          } cond 3array
      ] map ;
diff --git a/basis/math/vectors/specialization/specialization.factor b/basis/math/vectors/specialization/specialization.factor

index bf2dac29d65d75884bdc77e9a465aa04f7d16b19..07099df23c8050ce7536dc1e2e876be10b71da87 100644 (file)
--- a/basis/math/vectors/specialization/specialization.factor
+++ b/basis/math/vectors/specialization/specialization.factor
@@ -1,9 +1,9 @@
  ! Copyright (C) 2009 Slava Pestov.
  ! See http://factorcode.org/license.txt for BSD license.
-USING: alien.c-types words kernel make sequences effects
-kernel.private accessors combinators math math.intervals
-math.vectors namespaces assocs fry splitting classes.algebra
-generalizations locals compiler.tree.propagation.info ;
+USING: words kernel make sequences effects sets kernel.private
+accessors combinators math math.intervals math.vectors
+namespaces assocs fry splitting classes.algebra generalizations
+locals compiler.tree.propagation.info ;
  IN: math.vectors.specialization
  
  SYMBOLS: -> +vector+ +scalar+ +nonnegative+ ;
@@ -77,6 +77,8 @@ H{
      { vbitand { +vector+ +vector+ -> +vector+ } }
      { vbitor { +vector+ +vector+ -> +vector+ } }
      { vbitxor { +vector+ +vector+ -> +vector+ } }
+    { v>> { +vector+ +scalar+ -> +vector+ } }
+    { v<< { +vector+ +scalar+ -> +vector+ } }
  }
  
  PREDICATE: vector-word < word vector-words key? ;
@@ -107,15 +109,22 @@ M: vector-word subwords specializations values [ word? ] filter ;
  :: input-signature ( word array-type elt-type -- signature )
      array-type elt-type word word-schema inputs signature-for-schema ;
  
+: vector-words-for-type ( elt-type -- alist )
+    {
+        ! Can't do shifts on floats
+        { [ dup float class<= ] [ vector-words keys { v<< v>> } diff ] }
+        ! Can't divide integers
+        { [ dup integer class<= ] [ vector-words keys { vsqrt n/v v/n v/ normalize } diff ] }
+        [ { } ]
+    } cond nip ;
+
  :: specialize-vector-words ( array-type elt-type simd -- )
-    elt-type number class<= [
-        vector-words keys [
-            [ array-type elt-type simd specialize-vector-word ]
-            [ array-type elt-type input-signature ]
-            [ ]
-            tri add-specialization
-        ] each
-    ] when ;
+    elt-type vector-words-for-type [
+        [ array-type elt-type simd specialize-vector-word ]
+        [ array-type elt-type input-signature ]
+        [ ]
+        tri add-specialization
+    ] each ;
  
  : find-specialization ( classes word -- word/f )
      specializations
diff --git a/basis/math/vectors/vectors-docs.factor b/basis/math/vectors/vectors-docs.factor

index 3790e38d55976da573c8f56f980579bfcdcef025..13175ea8d1f6d1d5ea6e6e12c4899b91908dfa2c 100644 (file)
--- a/basis/math/vectors/vectors-docs.factor
+++ b/basis/math/vectors/vectors-docs.factor
@@ -38,6 +38,8 @@ $nl
  { $subsection vbitand }
  { $subsection vbitor }
  { $subsection vbitxor }
+{ $subsection v<< }
+{ $subsection v>> }
  "Inner product and norm:"
  { $subsection v. }
  { $subsection norm }
@@ -209,6 +211,14 @@ HELP: vbitxor
  { $description "Takes the bitwise exclusive or of " { $snippet "u" } " and " { $snippet "v" } " component-wise." }
  { $notes "Unlike " { $link bitxor } ", this word may be used on a specialized array of floats or doubles, in which case the bitwise representation of the floating point numbers is operated upon." } ;
  
+HELP: v<<
+{ $values { "u" "a sequence of integers" } { "n" "a non-negative integer" } { "w" "a sequence of integers" } }
+{ $description "Shifts each element of " { $snippet "u" } " to the left by " { $snippet "n" } " bits." } ;
+
+HELP: v>>
+{ $values { "u" "a sequence of integers" } { "n" "a non-negative integer" } { "w" "a sequence of integers" } }
+{ $description "Shifts each element of " { $snippet "u" } " to the right by " { $snippet "n" } " bits." } ;
+
  HELP: norm-sq
  { $values { "v" "a sequence of numbers" } { "x" "a non-negative real number" } }
  { $description "Computes the squared length of a mathematical vector." } ;
diff --git a/basis/math/vectors/vectors.factor b/basis/math/vectors/vectors.factor

index 4b6f67544a9a705c031c17778fa77dde42092794..adaed6abdd322259dfe587c88ee4337f81d71201 100644 (file)
--- a/basis/math/vectors/vectors.factor
+++ b/basis/math/vectors/vectors.factor
@@ -61,6 +61,9 @@ PRIVATE>
  : vbitor ( u v -- w ) over '[ _ [ bitor ] fp-bitwise-op ] 2map ;
  : vbitxor ( u v -- w ) over '[ _ [ bitxor ] fp-bitwise-op ] 2map ;
  
+: v<< ( u n -- w ) '[ _ shift ] map ;
+: v>> ( u n -- w ) neg '[ _ shift ] map ;
+
  : vfloor    ( u -- v ) [ floor ] map ;
  : vceiling  ( u -- v ) [ ceiling ] map ;
  : vtruncate ( u -- v ) [ truncate ] map ;
author	Slava Pestov <slava@slava-pestovs-macbook-pro.local>
	Thu, 24 Sep 2009 08:32:39 +0000 (03:32 -0500)
committer	Slava Pestov <slava@slava-pestovs-macbook-pro.local>
	Thu, 24 Sep 2009 08:32:39 +0000 (03:32 -0500)
basis/compiler/cfg/instructions/instructions.factor		patch \| blob \| history
basis/compiler/cfg/intrinsics/intrinsics.factor		patch \| blob \| history
basis/compiler/cfg/representations/preferred/preferred.factor		patch \| blob \| history
basis/compiler/cfg/representations/representations.factor		patch \| blob \| history
basis/compiler/cfg/two-operand/two-operand.factor		patch \| blob \| history
basis/compiler/codegen/codegen.factor		patch \| blob \| history
basis/compiler/tree/propagation/simd/simd.factor		patch \| blob \| history
basis/cpu/architecture/architecture.factor		patch \| blob \| history
basis/cpu/x86/x86.factor		patch \| blob \| history
basis/math/vectors/simd/functor/functor.factor		patch \| blob \| history
basis/math/vectors/simd/intrinsics/intrinsics.factor		patch \| blob \| history
basis/math/vectors/simd/simd-tests.factor		patch \| blob \| history
basis/math/vectors/specialization/specialization.factor		patch \| blob \| history
basis/math/vectors/vectors-docs.factor		patch \| blob \| history
basis/math/vectors/vectors.factor		patch \| blob \| history