]> gitweb.factorcode.org Git - factor.git/blob - basis/compiler/tree/propagation/simd/simd.factor
More integer SIMD work
[factor.git] / basis / compiler / tree / propagation / simd / simd.factor
1 ! Copyright (C) 2009 Slava Pestov.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors byte-arrays combinators fry
4 compiler.tree.propagation.info cpu.architecture kernel words math
5 math.intervals math.vectors.simd.intrinsics ;
6 IN: compiler.tree.propagation.simd
7
8 \ (simd-v+) { byte-array } "default-output-classes" set-word-prop
9
10 \ (simd-v-) { byte-array } "default-output-classes" set-word-prop
11
12 \ (simd-v*) { byte-array } "default-output-classes" set-word-prop
13
14 \ (simd-v/) { byte-array } "default-output-classes" set-word-prop
15
16 \ (simd-vmin) { byte-array } "default-output-classes" set-word-prop
17
18 \ (simd-vmax) { byte-array } "default-output-classes" set-word-prop
19
20 \ (simd-vsqrt) { byte-array } "default-output-classes" set-word-prop
21
22 \ (simd-sum) [
23     nip dup literal?>> [
24         literal>> scalar-rep-of {
25             { float-rep [ float ] }
26             { double-rep [ float ] }
27             { int-rep [ integer ] }
28         } case
29     ] [ drop real ] if
30     <class-info>
31 ] "outputs" set-word-prop
32
33 \ (simd-broadcast) { byte-array } "default-output-classes" set-word-prop
34
35 \ (simd-gather-2) { byte-array } "default-output-classes" set-word-prop
36
37 \ (simd-gather-4) { byte-array } "default-output-classes" set-word-prop
38
39 \ assert-positive [
40     real [0,inf] <class/interval-info> value-info-intersect
41 ] "outputs" set-word-prop
42
43 \ alien-vector { byte-array } "default-output-classes" set-word-prop
44
45 ! If SIMD is not available, inline alien-vector and set-alien-vector
46 ! to get a speedup
47 : inline-unless-intrinsic ( word -- )
48     dup '[ drop _ dup "intrinsic" word-prop [ drop f ] [ def>> ] if ]
49     "custom-inlining" set-word-prop ;
50
51 \ alien-vector inline-unless-intrinsic
52
53 \ set-alien-vector inline-unless-intrinsic