1 ! Copyright (C) 2009 Joe Groff.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors arrays classes combinators
4 compiler.cfg.instructions compiler.cfg.registers
5 compiler.cfg.stacks compiler.cfg.stacks.local
6 compiler.tree.propagation.info cpu.architecture fry
7 generalizations kernel locals macros make math quotations
8 sequences sequences.generalizations ;
9 IN: compiler.cfg.intrinsics.simd.backend
11 ! Selection of implementation based on available CPU instructions
! Generic predicate over compiler instructions. Every method in this file
! leaves a single boolean (either t or the result of member?), so the
! output is declared as ? rather than as a list of representations.
GENERIC: insn-available? ( ## -- ? )
<PRIVATE

! Shared tail of the per-instruction methods: true when the rep slot of
! insn is an element of reps.
: rep-supported? ( insn reps -- ? )
    [ rep>> ] dip member? ; inline

PRIVATE>

! Fallback: any object without a more specific method answers t.
M: object insn-available? drop t ;

! Each method below asks the matching %...-reps word for a list of
! representations and checks the instruction's own rep against it.
M: ##zero-vector insn-available?
    %zero-vector-reps rep-supported? ;
M: ##fill-vector insn-available?
    %fill-vector-reps rep-supported? ;
M: ##gather-vector-2 insn-available?
    %gather-vector-2-reps rep-supported? ;
M: ##gather-vector-4 insn-available?
    %gather-vector-4-reps rep-supported? ;
M: ##gather-int-vector-2 insn-available?
    %gather-int-vector-2-reps rep-supported? ;
M: ##gather-int-vector-4 insn-available?
    %gather-int-vector-4-reps rep-supported? ;
M: ##select-vector insn-available?
    %select-vector-reps rep-supported? ;
! ##store-memory-imm is checked against %alien-vector-reps.
M: ##store-memory-imm insn-available?
    %alien-vector-reps rep-supported? ;
M: ##shuffle-vector insn-available?
    %shuffle-vector-reps rep-supported? ;
M: ##shuffle-vector-imm insn-available?
    %shuffle-vector-imm-reps rep-supported? ;
M: ##shuffle-vector-halves-imm insn-available?
    %shuffle-vector-halves-imm-reps rep-supported? ;
! The head and tail merges share one list, %merge-vector-reps.
M: ##merge-vector-head insn-available?
    %merge-vector-reps rep-supported? ;
M: ##merge-vector-tail insn-available?
    %merge-vector-reps rep-supported? ;
M: ##float-pack-vector insn-available?
    %float-pack-vector-reps rep-supported? ;
M: ##signed-pack-vector insn-available?
    %signed-pack-vector-reps rep-supported? ;
M: ##unsigned-pack-vector insn-available?
    %unsigned-pack-vector-reps rep-supported? ;
M: ##unpack-vector-head insn-available?
    %unpack-vector-head-reps rep-supported? ;
M: ##unpack-vector-tail insn-available?
    %unpack-vector-tail-reps rep-supported? ;
! ##tail>head-vector is checked against the unpack-head list.
M: ##tail>head-vector insn-available?
    %unpack-vector-head-reps rep-supported? ;
M: ##integer>float-vector insn-available?
    %integer>float-vector-reps rep-supported? ;
M: ##float>integer-vector insn-available?
    %float>integer-vector-reps rep-supported? ;
! The compare list depends on the condition code, so cc is read from the
! instruction and passed to %compare-vector-reps first.
M: ##compare-vector insn-available?
    dup cc>> %compare-vector-reps rep-supported? ;
M: ##move-vector-mask insn-available?
    %move-vector-mask-reps rep-supported? ;
M: ##test-vector insn-available?
    %test-vector-reps rep-supported? ;
M: ##add-vector insn-available?
    %add-vector-reps rep-supported? ;
M: ##saturated-add-vector insn-available?
    %saturated-add-vector-reps rep-supported? ;
M: ##add-sub-vector insn-available?
    %add-sub-vector-reps rep-supported? ;
M: ##sub-vector insn-available?
    %sub-vector-reps rep-supported? ;
M: ##saturated-sub-vector insn-available?
    %saturated-sub-vector-reps rep-supported? ;
M: ##mul-vector insn-available?
    %mul-vector-reps rep-supported? ;
M: ##mul-high-vector insn-available?
    %mul-high-vector-reps rep-supported? ;
M: ##mul-horizontal-add-vector insn-available?
    %mul-horizontal-add-vector-reps rep-supported? ;
M: ##saturated-mul-vector insn-available?
    %saturated-mul-vector-reps rep-supported? ;
M: ##div-vector insn-available?
    %div-vector-reps rep-supported? ;
M: ##min-vector insn-available?
    %min-vector-reps rep-supported? ;
M: ##max-vector insn-available?
    %max-vector-reps rep-supported? ;
M: ##avg-vector insn-available?
    %avg-vector-reps rep-supported? ;
M: ##dot-vector insn-available?
    %dot-vector-reps rep-supported? ;
M: ##sad-vector insn-available?
    %sad-vector-reps rep-supported? ;
M: ##sqrt-vector insn-available?
    %sqrt-vector-reps rep-supported? ;
M: ##horizontal-add-vector insn-available?
    %horizontal-add-vector-reps rep-supported? ;
M: ##horizontal-sub-vector insn-available?
    %horizontal-sub-vector-reps rep-supported? ;
M: ##abs-vector insn-available?
    %abs-vector-reps rep-supported? ;
M: ##and-vector insn-available?
    %and-vector-reps rep-supported? ;
M: ##andn-vector insn-available?
    %andn-vector-reps rep-supported? ;
M: ##or-vector insn-available?
    %or-vector-reps rep-supported? ;
M: ##xor-vector insn-available?
    %xor-vector-reps rep-supported? ;
M: ##not-vector insn-available?
    %not-vector-reps rep-supported? ;
M: ##shl-vector insn-available?
    %shl-vector-reps rep-supported? ;
M: ##shr-vector insn-available?
    %shr-vector-reps rep-supported? ;
M: ##shl-vector-imm insn-available?
    %shl-vector-imm-reps rep-supported? ;
M: ##shr-vector-imm insn-available?
    %shr-vector-imm-reps rep-supported? ;
M: ##horizontal-shl-vector-imm insn-available?
    %horizontal-shl-vector-imm-reps rep-supported? ;
M: ##horizontal-shr-vector-imm insn-available?
    %horizontal-shr-vector-imm-reps rep-supported? ;
! Builds a quotation from a count and an emitter quotation. When called,
! the result duplicates the top #dup stack items, runs quot inside
! { } make, and leaves the collected array together with a boolean that
! is true only if every collected element answers t to insn-available?.
: [vector-op-checked] ( #dup quot -- quot )
    '[
        ! work on copies of the top #dup items
        _ ndup
        ! run the emitter, gathering whatever it adds into an array
        _ { } make
        ! keep the array and report whether all of it is available
        dup [ insn-available? ] all?
    ] ;
! Turns one trial into the value named quotpair. The *-vector-op macros
! map this word over their trials and hand the results to cond.
! The dispatch position 2 selects the third item from the top of the
! stack, i.e. the first input rather than #pick or #dup. Methods exist
! for callable and for pair.
75 GENERIC#: >vector-op-cond 2 ( quot #pick #dup -- quotpair )
76 M:: callable >vector-op-cond ( quot #pick #dup -- quotpair )
77 #dup quot [vector-op-checked] '[ 2drop @ ]
81 M:: pair >vector-op-cond ( pair #pick #dup -- quotpair )
82 pair first2 :> ( class quot )
83 #pick class #dup quot [vector-op-checked]
84 '[ 2drop _ npick _ instance? _ [ f f f ] if ]
<PRIVATE

! Common body of the *-vector-op macros: convert each trial with
! >vector-op-cond using the given #pick and #dup counts, then wrap the
! resulting clauses in a quotation that pushes two f values and runs cond.
: trials>cond-quot ( trials #pick #dup -- quot )
    '[ _ _ >vector-op-cond ] map
    '[ f f _ cond ] ;

PRIVATE>

! Each macro only fixes the ( #pick, #dup ) pair passed to the helper.
MACRO: v-vector-op ( trials -- quot )
    1 2 trials>cond-quot ;

MACRO: vl-vector-op ( trials -- quot )
    1 3 trials>cond-quot ;

MACRO: vvl-vector-op ( trials -- quot )
    1 4 trials>cond-quot ;

MACRO: vv-vector-op ( trials -- quot )
    1 3 trials>cond-quot ;

MACRO: vv-cc-vector-op ( trials -- quot )
    2 4 trials>cond-quot ;

MACRO: vvvv-vector-op ( trials -- quot )
    1 5 trials>cond-quot ;
101 ! Intrinsic code emission
103 MACRO: check-elements ( quots -- quot )
104 [ length '[ _ firstn ] ]
106 [ length 1 - \ and <repetition> [ ] like ]
! Error class with a single slot, node. if-literals-match invokes it in
! its failure branch, after a 2drop.
109 ERROR: bad-simd-intrinsic node ;
111 MACRO: if-literals-match ( quots -- quot )
112 [ length ] [ ] [ length ] tri
118 _ tail-slice* [ literal>> ] map
123 [ _ firstn ] dip call
125 ] [ 2drop bad-simd-intrinsic ] if
! Parameter quotations passed to emit-vector-op as params-quot by the
! emit-*-vector-op macros. emit-vector-op runs them with dip, before the
! trials are pushed and the op quotation is called.
! unary is used by emit-v-vector-op.
128 CONSTANT: unary [ ds-drop ds-pop ]
! unary/param is used by emit-vl-vector-op. Its inner quotation runs
! under a further dip, so the item on top of the stack is left alone.
129 CONSTANT: unary/param [ [ -2 <ds-loc> inc-stack ds-pop ] dip ]
! binary is used by emit-vv-vector-op.
130 CONSTANT: binary [ ds-drop 2inputs ]
! binary/param is used by emit-vvl-vector-op, with the same dip wrapping
! as unary/param.
131 CONSTANT: binary/param [ [ -2 <ds-loc> inc-stack 2inputs ] dip ]
139 -4 <ds-loc> inc-stack
! Assembles the emission quotation shared by the emit-*-vector-op macros.
! The generated code gives if-literals-match the literal-preds plus a
! body that runs params-quot under dip, pushes trials, calls op-quot and
! finishes with ds-push.
: emit-vector-op ( trials params-quot op-quot literal-preds -- quot )
    ! reorder to: params-quot trials op-quot literal-preds
    [ swap ] 2dip
    '[ [ _ dip _ @ ds-push ] _ if-literals-match ] ;
! Calls emit-vector-op with the unary parameter quotation, the
! v-vector-op selector and a single literal predicate, representation?.
MACRO: emit-v-vector-op ( trials -- quot )
    unary [ v-vector-op ]
    [ representation? ] 1array
    emit-vector-op ;
! Calls emit-vector-op with the unary/param parameter quotation, the
! vl-vector-op selector and two literal predicates: literal-pred first,
! then representation?.
MACRO: emit-vl-vector-op ( trials literal-pred -- quot )
    ! { literal-pred [ representation? ] }
    [ representation? ] 2array
    [ unary/param [ vl-vector-op ] ] dip
    emit-vector-op ;
! Calls emit-vector-op with the binary parameter quotation, the
! vv-vector-op selector and a single literal predicate, representation?.
MACRO: emit-vv-vector-op ( trials -- quot )
    binary [ vv-vector-op ]
    [ representation? ] 1array
    emit-vector-op ;
! Calls emit-vector-op with the binary/param parameter quotation, the
! vvl-vector-op selector and two literal predicates: literal-pred first,
! then representation?.
MACRO: emit-vvl-vector-op ( trials literal-pred -- quot )
    ! { literal-pred [ representation? ] }
    [ representation? ] 2array
    [ binary/param [ vvl-vector-op ] ] dip
    emit-vector-op ;
! Calls emit-vector-op with the quaternary parameter quotation, the
! vvvv-vector-op selector and a single literal predicate, representation?.
MACRO: emit-vvvv-vector-op ( trials -- quot )
    quaternary [ vvvv-vector-op ]
    [ representation? ] 1array
    emit-vector-op ;
157 MACRO:: emit-vv-or-vl-vector-op ( var-trials imm-trials literal-pred -- quot )
158 literal-pred imm-trials literal-pred var-trials
160 dup node-input-infos 2 tail-slice* first literal>> @
161 [ _ _ emit-vl-vector-op ]
162 [ _ emit-vv-vector-op ] if