1 ! Copyright (C) 2009 Slava Pestov.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors byte-arrays fry cpu.architecture kernel math
4 sequences math.vectors.simd.intrinsics macros generalizations
5 combinators combinators.short-circuit arrays locals
6 compiler.tree.propagation.info compiler.cfg.builder.blocks
7 compiler.cfg.comparisons
8 compiler.cfg.stacks compiler.cfg.stacks.local compiler.cfg.hats
9 compiler.cfg.instructions compiler.cfg.registers
10 compiler.cfg.intrinsics.alien
12 FROM: alien.c-types => float double ;
13 SPECIALIZED-ARRAYS: float double ;
14 IN: compiler.cfg.intrinsics.simd
! Macro over a sequence of quotations (quots).
! Visible pieces: a quotation that unpacks `length` elements with firstn,
! and a quotation made of (length - 1) copies of the word `and`.
! NOTE(review): the embedded numbering skips 18 and 20-21, so the
! combinators joining these pieces and the terminating `;` are not
! visible in this view -- confirm against the full file.
16 MACRO: check-elements ( quots -- )
17 [ length '[ _ firstn ] ]
19 [ length 1 - \ and <repetition> [ ] like ]
! Macro over a sequence of predicate quotations (quots).
! Visible pieces: the length of quots is taken twice alongside quots
! itself; a trailing slice of some sequence is mapped through literal>>;
! and the false branch of the final `if` drops two values and calls
! emit-primitive.
! NOTE(review): the embedded numbering skips 24-28 and 30-35 and nothing
! after 36 is shown, so the condition, the true branch and the closing
! `;` are not visible here -- confirm against the full file.
22 MACRO: if-literals-match ( quots -- )
23 [ length ] [ ] [ length ] tri
29 _ tail-slice* [ literal>> ] map
36 ] [ 2drop emit-primitive ] if
! Hands node and quot to if-literals-match with the single predicate
! representation?. The declared effect of quot is ( rep -- ).
! NOTE(review): if-literals-match is only partly visible in this view;
! presumably quot runs when the node's trailing literal input satisfies
! the predicate and emit-primitive is used otherwise -- confirm.
39 : emit-vector-op ( node quot: ( rep -- ) -- )
40 { [ representation? ] } if-literals-match ; inline
! Wraps quot into a new callable that, in order:
!   1. beneath the top stack item, calls ds-drop and then 2inputs;
!   2. calls quot;
!   3. calls ds-push.
! Built with explicit prepose/compose rather than a fried quotation.
42 : [binary] ( quot -- quot' )
43 [ [ ds-drop 2inputs ] dip ] prepose [ ds-push ] compose ; inline
! Wraps quot with [binary] and passes node plus the wrapped quotation
! to emit-vector-op.
45 : emit-binary-vector-op ( node quot -- )
46 [binary] emit-vector-op ; inline
! Wraps quot into a new callable that, in order:
!   1. beneath the top stack item, calls ds-drop and then ds-pop;
!   2. calls quot;
!   3. calls ds-push.
! Built with explicit prepose/compose rather than a fried quotation.
48 : [unary] ( quot -- quot' )
49 [ [ ds-drop ds-pop ] dip ] prepose [ ds-push ] compose ; inline
! Wraps quot with [unary] and passes node plus the wrapped quotation
! to emit-vector-op.
51 : emit-unary-vector-op ( node quot -- )
52 [unary] emit-vector-op ; inline
! Wraps quot into a new callable that, in order:
!   1. beneath the top two stack items, calls `-2 inc-d` and then ds-pop;
!   2. calls quot;
!   3. calls ds-push.
! Built with explicit prepose/compose rather than a fried quotation.
54 : [unary/param] ( quot -- quot' )
55 [ [ -2 inc-d ds-pop ] 2dip ] prepose [ ds-push ] compose ; inline
! Passes node and quot to if-literals-match with the predicates
! integer? and representation?.
! NOTE(review): the embedded numbering skips 58. The sibling words
! emit-broadcast-vector and emit-select-vector apply [unary/param] to
! their quotation before if-literals-match; confirm whether the missing
! line does the same here.
57 : emit-horizontal-shift ( node quot -- )
59 { [ integer? ] [ representation? ] } if-literals-match ; inline
! Emits ^^gather-vector-2 for node through emit-binary-vector-op.
61 : emit-gather-vector-2 ( node -- )
62 [ ^^gather-vector-2 ] emit-binary-vector-op ;
! NOTE(review): only the header of this word is visible; the embedded
! numbering jumps from 64 to 78, so the body and the terminating `;`
! are missing from this view -- consult the full file.
64 : emit-gather-vector-4 ( node -- )
! True when obj is an array whose elements are all integers; f otherwise.
! An empty array counts as a match, since all? holds vacuously.
78 : shuffle? ( obj -- ? ) dup array? [ [ integer? ] all? ] [ drop f ] if ;
! Emits a vector shuffle for node when its literal inputs satisfy
! shuffle? and representation? (checked via if-literals-match).
! The quotation pads the permutation at the tail with 0 up to
! rep-components of the representation, keeps the representation on the
! stack, and then calls ^^shuffle-vector. It is wrapped with
! [unary/param] before being handed to if-literals-match.
80 : emit-shuffle-vector ( node -- )
81 ! Pad the permutation with zeroes if it's too short, since we
82 ! can't throw an error at this point.
83 [ [ rep-components 0 pad-tail ] keep ^^shuffle-vector ] [unary/param]
84 { [ shuffle? ] [ representation? ] } if-literals-match ;
! Visible part: builds an array holding rep-components copies of n,
! leaving src, that array and rep on the stack.
! NOTE(review): the embedded numbering skips 88, so the rest of the body
! and the terminating `;` are not visible here. Presumably the array is
! used as a shuffle permutation -- confirm against the full file.
86 : ^^broadcast-vector ( src n rep -- dst )
87 [ rep-components swap <array> ] keep
! Emits ^^broadcast-vector for node when its literal inputs satisfy
! integer? and representation? (checked via if-literals-match).
! The quotation is wrapped with [unary/param] first.
90 : emit-broadcast-vector ( node -- )
91 [ ^^broadcast-vector ] [unary/param]
92 { [ integer? ] [ representation? ] } if-literals-match ;
! Converts src to a vector with ^^scalar>vector, then calls
! ^^broadcast-vector on that vector with element index 0 and the same
! representation.
94 : ^^with-vector ( src rep -- dst )
95 [ ^^scalar>vector ] keep 0 swap ^^broadcast-vector ;
! Calls ^^broadcast-vector with src, n and rep, then converts the result
! to a scalar with ^^vector>scalar using the same representation.
97 : ^^select-vector ( src n rep -- dst )
98 dup [ ^^broadcast-vector ] dip ^^vector>scalar ;
! Emits ^^select-vector for node when its literal inputs satisfy
! integer? and representation? (checked via if-literals-match).
! The quotation is wrapped with [unary/param] first.
100 : emit-select-vector ( node -- )
101 [ ^^select-vector ] [unary/param]
102 { [ integer? ] [ representation? ] } if-literals-match ; inline
! Emits a vector load from an alien through emit-vector-op.
! Visible pieces: a fried quotation that calls ds-drop and
! prepare-alien-getter, then ^^alien-vector with a curried value and
! ds-push; it is passed to inline-alien together with the guard
! [ inline-alien-getter? ]. `with` then binds one value into the outer
! quotation before emit-vector-op is called.
! NOTE(review): the embedded numbering skips 105-106 and 109, so the
! opening brackets and any stack shuffling on those lines are not
! visible -- confirm against the full file.
104 : emit-alien-vector ( node -- )
107 ds-drop prepare-alien-getter
108 _ ^^alien-vector ds-push
110 [ inline-alien-getter? ] inline-alien
111 ] with emit-vector-op ;
! Emits a vector store to an alien through emit-vector-op.
! Visible pieces: ds-drop, prepare-alien-setter and ds-pop inside a
! quotation; a guard quotation [ byte-array inline-alien-setter? ];
! and `with` binding one value before emit-vector-op is called.
! NOTE(review): the embedded numbering skips 114-115, 117-118 and 120,
! so the instruction that performs the store and the combinator that
! consumes the guard are not visible -- confirm against the full file.
113 : emit-set-alien-vector ( node -- )
116 ds-drop prepare-alien-setter ds-pop
119 [ byte-array inline-alien-setter? ]
121 ] with emit-vector-op ;
! Produces the complement of vector src for representation rep.
! Tests whether rep is a member of %not-vector-reps. In the false
! branch, the result of `rep ^^fill-vector` is combined with src using
! ^^xor-vector.
! NOTE(review): the embedded numbering skips 125, so the true branch is
! not visible here; presumably it uses a direct not-vector instruction
! -- confirm against the full file.
123 : generate-not-vector ( src rep -- dst )
124 dup %not-vector-reps member?
126 [ [ ^^fill-vector ] [ ^^xor-vector ] bi ] if ;
! Emits one ^^compare-vector for a { cc swap? } pair.
! The pair is split into cc (first element) and swap? (second element).
! The first branch compares with the operands reversed (src2 src1); the
! second compares them in the given order (src1 src2).
! NOTE(review): the embedded numbering skips 130, so the value tested by
! `if` is not visible; presumably it is swap? -- confirm.
128 :: (generate-compare-vector) ( src1 src2 rep {cc,swap} -- dst )
129 {cc,swap} first2 :> swap? :> cc
131 [ src2 src1 rep cc ^^compare-vector ]
132 [ src1 src2 rep cc ^^compare-vector ] if ;
! Emits a vector comparison of src1 and src2 for condition orig-cc.
! `rep orig-cc %compare-vector-ccs` yields two values: ccs and not?
! (not? is on top of the stack).
! Visible pieces:
!   - a quotation that yields ^^fill-vector when not? is true and
!     ^^zero-vector otherwise;
!   - ccs is split with unclip into first-cc and rest-ccs;
!   - first-dst is the comparison for first-cc;
!   - a quotation that compares for a further cc and merges the result
!     with ^^or-vector;
!   - when not? is true, the result goes through generate-not-vector.
! NOTE(review): the embedded numbering skips 136-137, 139, 142-143,
! 145-146 and everything after 147, so the control flow joining these
! pieces and the terminating `;` are not visible -- confirm against the
! full file.
134 :: generate-compare-vector ( src1 src2 rep orig-cc -- dst )
135 rep orig-cc %compare-vector-ccs :> not? :> ccs
138 [ rep not? [ ^^fill-vector ] [ ^^zero-vector ] if ]
140 ccs unclip :> first-cc :> rest-ccs
141 src1 src2 rep first-cc (generate-compare-vector) :> first-dst
144 [ [ src1 src2 rep ] dip (generate-compare-vector) rep ^^or-vector ]
147 not? [ rep generate-not-vector ] when
! Unpacks the head of vector src for representation rep.
! Visible pieces:
!   - when rep is a member of %unpack-vector-head-reps, the result is
!     `src rep ^^unpack-vector-head`;
!   - otherwise a zero vector is compared against src with cc> to give
!     `sign`, and src is merged with sign by ^^merge-vector-head.
! NOTE(review): presumably the fallback is a manual sign extension --
! confirm. The embedded numbering skips 151-152, 155-156 and everything
! after 159, so the conditional scaffolding and the terminating `;` are
! not visible here.
150 :: generate-unpack-vector-head ( src rep -- dst )
153 [ rep %unpack-vector-head-reps member? ]
154 [ src rep ^^unpack-vector-head ]
157 rep ^^zero-vector :> zero
158 zero src rep cc> ^^compare-vector :> sign
159 src sign rep ^^merge-vector-head
! Unpacks the tail of vector src for representation rep.
! Visible pieces, in order:
!   - when rep is a member of %unpack-vector-tail-reps, the result is
!     `src rep ^^unpack-vector-tail`;
!   - when rep is a member of %unpack-vector-head-reps, the tail is
!     first moved with ^^tail>head-vector and then unpacked with
!     ^^unpack-vector-head;
!   - otherwise a zero vector is compared against src with cc> to give
!     `sign`, and src is merged with sign by ^^merge-vector-tail.
! NOTE(review): the embedded numbering skips 164-165, 168-169, 171,
! 174-176 and everything after 179, so the conditional scaffolding and
! the terminating `;` are not visible -- confirm against the full file.
163 :: generate-unpack-vector-tail ( src rep -- dst )
166 [ rep %unpack-vector-tail-reps member? ]
167 [ src rep ^^unpack-vector-tail ]
170 [ rep %unpack-vector-head-reps member? ]
172 src rep ^^tail>head-vector :> tail
173 tail rep ^^unpack-vector-head
177 rep ^^zero-vector :> zero
178 zero src rep cc> ^^compare-vector :> sign
179 src sign rep ^^merge-vector-tail
! Negates vector src by subtracting it from a constant chosen per
! representation, using ^^sub-vector:
!   - float-4-rep: a loaded constant of four -0.0 values;
!   - double-2-rep: a loaded constant of two -0.0 values;
!   - any other rep: `rep ^^zero-vector`.
! NOTE(review): presumably -0.0 is used for the float reps so that
! negating +0.0 gives -0.0 -- confirm. The embedded numbering skips 184
! and 188, so the dispatch around these clauses is not visible here;
! presumably it is a `case` on rep.
183 :: generate-neg-vector ( src rep -- dst )
185 { float-4-rep [ float-array{ -0.0 -0.0 -0.0 -0.0 } underlying>> ^^load-constant ] }
186 { double-2-rep [ double-array{ -0.0 -0.0 } underlying>> ^^load-constant ] }
187 [ drop rep ^^zero-vector ]
189 src rep ^^sub-vector ;