1 USING: accessors arrays classes compiler compiler.tree.debugger
2 effects fry io kernel kernel.private math math.functions
3 math.private math.vectors math.vectors.simd
4 math.vectors.simd.private prettyprint random sequences system
5 tools.test vocabs assocs compiler.cfg.debugger words
6 locals combinators cpu.architecture namespaces byte-arrays alien
7 specialized-arrays classes.struct eval classes.algebra sets
8 quotations math.constants compiler.units splitting ;
9 FROM: math.vectors.simd.intrinsics => alien-vector set-alien-vector ;
10 QUALIFIED-WITH: alien.c-types c
11 SPECIALIZED-ARRAY: c:float
12 IN: math.vectors.simd.tests
14 ! Test type propagation
! float-4: reductions and element access produce floats, while
! element-wise operations keep the vector class.
[ V{ float } ]
[ [ { float-4 } declare norm-sq ] final-classes ] unit-test

[ V{ float } ]
[ [ { float-4 } declare norm ] final-classes ] unit-test

[ V{ float-4 } ]
[ [ { float-4 } declare normalize ] final-classes ] unit-test

[ V{ float-4 } ]
[ [ { float-4 float-4 } declare v+ ] final-classes ] unit-test

[ V{ float } ]
[ [ { float-4 } declare second ] final-classes ] unit-test

! int-4: addition keeps the vector class; the class inferred for an
! element is only required to be a subclass of integer.
[ V{ int-4 } ]
[ [ { int-4 int-4 } declare v+ ] final-classes ] unit-test

[ t ]
[ [ { int-4 } declare second ] final-classes first integer class<= ] unit-test

! longlong-2: addition keeps the vector class; an element is inferred
! as integer.
[ V{ longlong-2 } ]
[ [ { longlong-2 longlong-2 } declare v+ ] final-classes ] unit-test

[ V{ integer } ]
[ [ { longlong-2 } declare second ] final-classes ] unit-test
33 ! Test puns; only on x86
35 [ double-2{ 4 1024 } ] [
37 [ { float-4 } declare dup v+ underlying>> double-2 boa dup v+ ] compile-call
42 CONSTANT: simd-classes
56 SYMBOLS: -> +vector+ +any-vector+ +scalar+ +boolean+ +nonnegative+ +literal+ ;
58 CONSTANT: vector-words
60 { [v-] { +vector+ +vector+ -> +vector+ } }
61 { distance { +vector+ +vector+ -> +nonnegative+ } }
62 { n*v { +scalar+ +vector+ -> +vector+ } }
63 { n+v { +scalar+ +vector+ -> +vector+ } }
64 { n-v { +scalar+ +vector+ -> +vector+ } }
65 { n/v { +scalar+ +vector+ -> +vector+ } }
66 { norm { +vector+ -> +nonnegative+ } }
67 { norm-sq { +vector+ -> +nonnegative+ } }
68 { normalize { +vector+ -> +vector+ } }
69 { v* { +vector+ +vector+ -> +vector+ } }
70 { vs* { +vector+ +vector+ -> +vector+ } }
71 { v*n { +vector+ +scalar+ -> +vector+ } }
72 { v*high { +vector+ +vector+ -> +vector+ } }
73 { v*hs+ { +vector+ +vector+ -> +vector+ } }
74 { v+ { +vector+ +vector+ -> +vector+ } }
75 { vs+ { +vector+ +vector+ -> +vector+ } }
76 { v+- { +vector+ +vector+ -> +vector+ } }
77 { v+n { +vector+ +scalar+ -> +vector+ } }
78 { v- { +vector+ +vector+ -> +vector+ } }
79 { vneg { +vector+ -> +vector+ } }
80 { vs- { +vector+ +vector+ -> +vector+ } }
81 { v-n { +vector+ +scalar+ -> +vector+ } }
82 { v. { +vector+ +vector+ -> +scalar+ } }
83 { vsad { +vector+ +vector+ -> +scalar+ } }
84 { v/ { +vector+ +vector+ -> +vector+ } }
85 { v/n { +vector+ +scalar+ -> +vector+ } }
86 { vceiling { +vector+ -> +vector+ } }
87 { vfloor { +vector+ -> +vector+ } }
88 { vmax { +vector+ +vector+ -> +vector+ } }
89 { vmin { +vector+ +vector+ -> +vector+ } }
90 { vavg { +vector+ +vector+ -> +vector+ } }
91 { vneg { +vector+ -> +vector+ } }
92 { vtruncate { +vector+ -> +vector+ } }
93 { sum { +vector+ -> +scalar+ } }
94 { vabs { +vector+ -> +vector+ } }
95 { vsqrt { +vector+ -> +vector+ } }
96 { vbitand { +vector+ +vector+ -> +vector+ } }
97 { vbitandn { +vector+ +vector+ -> +vector+ } }
98 { vbitor { +vector+ +vector+ -> +vector+ } }
99 { vbitxor { +vector+ +vector+ -> +vector+ } }
100 { vbitnot { +vector+ -> +vector+ } }
101 { vand { +vector+ +vector+ -> +vector+ } }
102 { vandn { +vector+ +vector+ -> +vector+ } }
103 { vor { +vector+ +vector+ -> +vector+ } }
104 { vxor { +vector+ +vector+ -> +vector+ } }
105 { vnot { +vector+ -> +vector+ } }
106 { vlshift { +vector+ +scalar+ -> +vector+ } }
107 { vrshift { +vector+ +scalar+ -> +vector+ } }
108 { (vmerge-head) { +vector+ +vector+ -> +vector+ } }
109 { (vmerge-tail) { +vector+ +vector+ -> +vector+ } }
110 { v<= { +vector+ +vector+ -> +vector+ } }
111 { v< { +vector+ +vector+ -> +vector+ } }
112 { v= { +vector+ +vector+ -> +vector+ } }
113 { v> { +vector+ +vector+ -> +vector+ } }
114 { v>= { +vector+ +vector+ -> +vector+ } }
115 { vunordered? { +vector+ +vector+ -> +vector+ } }
! Returns the part of a word schema that comes before the `->`
! separator, i.e. the list of input slots.
: vector-word-inputs ( schema -- seq )
    -> 1array split first ;
! For every class in simd-classes, looks up the word named
! "<class-name>-with" in that class's own vocabulary.
: with-ctors ( -- seq )
    simd-classes [
        dup name>> "-with" append
        swap vocabulary>> lookup
    ] map ;
! For every class in simd-classes, looks up the word named
! "<class-name>-boa" in that class's own vocabulary.
: boa-ctors ( -- seq )
    simd-classes [
        [ name>> "-boa" append ] keep
        vocabulary>> lookup
    ] map ;
126 : check-optimizer ( seq quot eq-quot -- failures )
129 [ dup [ class ] { } map-as ] dip '[ _ declare @ ]
131 [ "print-mr" get [ nip test-mr mr. ] [ 2drop ] if ]
132 [ "print-checks" get [ [ . ] bi@ ] [ 2drop ] if ]
133 [ [ [ call ] dip call ] call( quot quot -- result ) ]
134 [ [ [ call ] dip compile-call ] call( quot quot -- result ) ]
135 [ [ t "always-inline-simd-intrinsics" [ [ call ] dip compile-call ] with-variable ] call( quot quot -- result ) ]
137 [ drop @ ] [ nip @ ] 3bi and not
140 "== Checking -new constructors" print
143 simd-classes [ [ [ ] ] dip '[ _ new ] ] [ = ] check-optimizer
147 simd-classes [ '[ _ new ] compile-call [ zero? ] all? not ] filter
150 "== Checking -with constructors" print
154 [ 1000 random '[ _ ] ] dip '[ _ execute ]
155 ] [ = ] check-optimizer
! uint-4-with must keep the full unsigned 32-bit value whether it is
! interpreted, compiled with a runtime argument, or compiled with a
! literal argument.
[ HEX: ffffffff ]
[ HEX: ffffffff uint-4-with first ] unit-test

[ HEX: ffffffff ]
[ HEX: ffffffff [ uint-4-with ] compile-call first ] unit-test

[ HEX: ffffffff ]
[ [ HEX: ffffffff uint-4-with ] compile-call first ] unit-test
164 "== Checking -boa constructors" print
168 [ stack-effect in>> length [ 1000 random ] [ ] replicate-as ] keep
170 ] [ = ] check-optimizer
173 [ HEX: ffffffff ] [ HEX: ffffffff 2 3 4 [ uint-4-boa ] compile-call first ] unit-test
175 "== Checking vector operations" print
! Instantiates `class` with `new` and replaces every element with a
! random integer drawn from `1000 random`.
: random-int-vector ( class -- vec )
    new [ 1000 random nip ] map ;
179 : random-float-vector ( class -- vec )
183 10 swap <array> 0/0. suffix random
186 : random-vector ( class elt-class -- vec )
188 [ random-float-vector ]
189 [ random-int-vector ] if ;
191 :: check-vector-op ( word inputs class elt-class -- inputs quot )
194 { +vector+ [ class elt-class random-vector ] }
195 { +scalar+ [ 1000 random elt-class float = [ >float ] when ] }
198 word '[ _ execute ] ;
! Drops the entries keyed by vsqrt, n/v, v/n, v/ and normalize from
! the given assoc.
: remove-float-words ( alist -- alist' )
    { vsqrt n/v v/n v/ normalize }
    [ dup ] H{ } map>assoc
    assoc-diff ;
! Drops the entries keyed by vlshift, vrshift, v*high and v*hs+ from
! the given assoc.
: remove-integer-words ( alist -- alist' )
    [ drop { vlshift vrshift v*high v*hs+ } member? not ] assoc-filter ;
! The vector words that are exercised by the boolean-operation checks
! and excluded from the general vector-operation checks.
: boolean-ops ( -- words )
    {
        vand
        vandn
        vor
        vxor
        vnot
    } ;
! Drops every entry keyed by one of the boolean-ops words from the
! given assoc.
: remove-boolean-words ( alist -- alist' )
    boolean-ops [ dup ] H{ } map>assoc assoc-diff ;
! Builds the alist of vector words to test for an element class.
! When elt-class is float the integer-only words are removed,
! otherwise the float-only words are removed; the boolean words are
! removed in both cases.
: ops-to-check ( elt-class -- alist )
    float =
    vector-words >alist swap
    [ remove-integer-words ] [ remove-float-words ] if
    remove-boolean-words ;
217 : check-vector-ops ( class elt-class compare-quot -- )
219 [ nip ops-to-check ] 2keep
220 '[ first2 vector-word-inputs _ _ check-vector-op ]
221 ] dip check-optimizer ; inline
223 : (approx=) ( x y -- ? )
225 { [ 2dup [ fp-nan? ] both? ] [ 2drop t ] }
226 { [ 2dup [ fp-nan? ] either? ] [ 2drop f ] }
227 { [ 2dup [ fp-infinity? ] either? ] [ fp-bitwise= ] }
228 { [ 2dup [ float? ] both? ] [ -1.e8 ~ ] }
! Approximate equality. When both operands are sequences they are
! compared element by element with (approx=); otherwise (approx=) is
! applied to the two operands directly.
: approx= ( x y -- ? )
    2dup [ sequence? ] bi@ and [
        [ (approx=) ] 2all?
    ] [
        (approx=)
    ] if ;
235 : exact= ( x y -- ? )
237 { [ 2dup [ float? ] both? ] [ fp-bitwise= ] }
238 { [ 2dup [ sequence? ] both? ] [ [ fp-bitwise= ] 2all? ] }
241 : simd-classes&reps ( -- alist )
244 { [ dup name>> "float" head? ] [ float [ approx= ] ] }
245 { [ dup name>> "double" head? ] [ float [ exact= ] ] }
251 [ [ { } ] ] dip first3 '[ _ _ _ check-vector-ops ] unit-test
254 "== Checking boolean operations" print
! Instantiates `class` with `new` and replaces every element with the
! result of `2 random zero?`, i.e. a random boolean.
: random-boolean-vector ( class -- vec )
    new [ 2 random zero? nip ] map ;
259 :: check-boolean-op ( word inputs class elt-class -- inputs quot )
262 { +vector+ [ class random-boolean-vector ] }
263 { +scalar+ [ 1000 random elt-class float = [ >float ] when ] }
266 word '[ _ execute ] ;
268 : check-boolean-ops ( class elt-class compare-quot -- seq )
270 [ boolean-ops [ dup vector-words at ] { } map>assoc ] 2dip
271 '[ first2 vector-word-inputs _ _ check-boolean-op ]
272 ] dip check-optimizer ; inline
275 [ [ { } ] ] dip first3 '[ _ _ _ check-boolean-ops ] unit-test
278 "== Checking vector blend" print
280 [ char-16{ 0 1 22 33 4 5 6 77 8 99 110 121 12 143 14 15 } ]
282 char-16{ t t f f t t t f t f f f t f t t }
283 char-16{ 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 }
284 char-16{ 0 11 22 33 44 55 66 77 88 99 110 121 132 143 154 165 } v?
287 [ char-16{ 0 1 22 33 4 5 6 77 8 99 110 121 12 143 14 15 } ]
289 char-16{ t t f f t t t f t f f f t f t t }
290 char-16{ 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 }
291 char-16{ 0 11 22 33 44 55 66 77 88 99 110 121 132 143 154 165 }
292 [ { char-16 char-16 char-16 } declare v? ] compile-call
295 [ int-4{ 1 22 33 4 } ]
296 [ int-4{ t f f t } int-4{ 1 2 3 4 } int-4{ 11 22 33 44 } v? ] unit-test
298 [ int-4{ 1 22 33 4 } ]
300 int-4{ t f f t } int-4{ 1 2 3 4 } int-4{ 11 22 33 44 }
301 [ { int-4 int-4 int-4 } declare v? ] compile-call
304 [ float-4{ 1.0 22.0 33.0 4.0 } ]
305 [ float-4{ t f f t } float-4{ 1.0 2.0 3.0 4.0 } float-4{ 11.0 22.0 33.0 44.0 } v? ] unit-test
307 [ float-4{ 1.0 22.0 33.0 4.0 } ]
309 float-4{ t f f t } float-4{ 1.0 2.0 3.0 4.0 } float-4{ 11.0 22.0 33.0 44.0 }
310 [ { float-4 float-4 float-4 } declare v? ] compile-call
313 "== Checking shifts and permutations" print
! hlshift by 1: interpreted, compiled with a literal shift count, and
! compiled with the shift count passed as a fixnum argument.
[ char-16{ 0 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 } ]
[ char-16{ 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 } 1 hlshift ] unit-test

[ char-16{ 0 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 } ]
[
    char-16{ 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 }
    [ { char-16 } declare 1 hlshift ] compile-call
] unit-test

[ char-16{ 0 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 } ]
[
    char-16{ 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 } 1
    [ { char-16 fixnum } declare hlshift ] compile-call
] unit-test

! hrshift by 1: the same three variants.
[ char-16{ 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 0 } ]
[ char-16{ 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 } 1 hrshift ] unit-test

[ char-16{ 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 0 } ]
[
    char-16{ 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 }
    [ { char-16 } declare 1 hrshift ] compile-call
] unit-test

[ char-16{ 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 0 } ]
[
    char-16{ 1 2 4 8 1 2 4 8 1 2 4 8 1 2 4 8 } 1
    [ { char-16 fixnum } declare hrshift ] compile-call
] unit-test
333 ! Invalid inputs should not cause the compiler to throw errors
335 [ [ { int-4 } declare t hrshift ] (( a -- b )) define-temp drop ] with-compilation-unit
339 [ [ { int-4 } declare { 3 2 1 } vshuffle ] (( a -- b )) define-temp drop ] with-compilation-unit
343 : shuffles-for ( n -- shuffles )
374 [ dup '[ _ random ] replicate 1array ]
379 [ new length shuffles-for ] keep
381 _ [ [ _ new [ length iota ] keep like 1quotation ] dip '[ _ vshuffle ] ]
382 [ = ] check-optimizer
386 "== Checking variable shuffles" print
! Instantiates `class` with `new` and replaces every element with a
! random integer drawn from `16 random`.
: random-shift-vector ( class -- vec )
    new [ 16 random nip ] map ;
391 :: test-shift-vector ( class -- ? )
393 class random-int-vector :> src
394 char-16 random-shift-vector :> perm
395 { class char-16 } :> decl
398 src perm [ decl declare vshuffle ] compile-call
! Run test-shift-vector ten times for each listed integer vector
! class; every run must yield t.
{ char-16 uchar-16 short-8 ushort-8 int-4 uint-4 longlong-2 ulonglong-2 } [
    '[ [ t ] [ _ test-shift-vector ] unit-test ] 10 swap times
] each
405 "== Checking vector tests" print
407 :: test-vector-tests-bool ( vector declaration -- none? any? all? )
410 [ [ declaration declare vnone? ] compile-call ]
411 [ [ declaration declare vany? ] compile-call ]
412 [ [ declaration declare vall? ] compile-call ] tri
413 ] call( -- none? any? all? ) ;
418 :: test-vector-tests-branch ( vector declaration -- none? any? all? )
421 [ [ declaration declare vnone? [ yes ] [ no ] if ] compile-call ]
422 [ [ declaration declare vany? [ yes ] [ no ] if ] compile-call ]
423 [ [ declaration declare vall? [ yes ] [ no ] if ] compile-call ] tri
424 ] call( -- none? any? all? ) ;
! Records a disagreement between the value-returning form of a vector
! test (`bool`) and its branching form (`branch`).
TUPLE: inconsistent-vector-test bool branch ;

! Yields the shared value when both inputs are equal; otherwise wraps
! the pair in an inconsistent-vector-test tuple.
: ?inconsistent ( bool branch -- ?/inconsistent )
    2dup = not
    [ inconsistent-vector-test boa ]
    [ drop ] if ;
431 :: test-vector-tests ( vector decl -- none? any? all? )
433 vector decl test-vector-tests-bool :> ( bool-none bool-any bool-all )
434 vector decl test-vector-tests-branch :> ( branch-none branch-any branch-all )
436 bool-none branch-none ?inconsistent
437 bool-any branch-any ?inconsistent
438 bool-all branch-all ?inconsistent
439 ] call( -- none? any? all? ) ;
442 [ float-4{ t t t t } { float-4 } test-vector-tests ] unit-test
444 [ float-4{ f t t t } { float-4 } test-vector-tests ] unit-test
446 [ float-4{ f f f f } { float-4 } test-vector-tests ] unit-test
449 [ double-2{ t t } { double-2 } test-vector-tests ] unit-test
451 [ double-2{ f t } { double-2 } test-vector-tests ] unit-test
453 [ double-2{ f f } { double-2 } test-vector-tests ] unit-test
456 [ int-4{ t t t t } { int-4 } test-vector-tests ] unit-test
458 [ int-4{ f t t t } { int-4 } test-vector-tests ] unit-test
460 [ int-4{ f f f f } { int-4 } test-vector-tests ] unit-test
462 "== Checking element access" print
464 ! Test element access -- it should box bignums for int-4 on x86
! Checks `nth` on a SIMD vector through check-optimizer.
! One test case is generated per valid index of `seq`: the input
! quotation pushes `seq` itself and the tested quotation is
! `[ n swap nth ]`. Results are compared with `=`.
! The index list is built with `iota` (as the shuffle checks in this
! file do) rather than by converting the bare length integer to an
! array, so it does not depend on integers behaving as sequences.
: test-accesses ( seq -- failures )
    [ length iota >array ] keep
    '[ [ _ 1quotation ] dip '[ _ swap nth ] ] [ = ] check-optimizer ; inline
! 32-bit element types: no check-optimizer failures are expected.
[ { } ]
[ float-4{ 1.0 2.0 3.0 4.0 } test-accesses ] unit-test

[ { } ]
[ int-4{ HEX: 7fffffff 3 4 -8 } test-accesses ] unit-test

[ { } ]
[ uint-4{ HEX: ffffffff 2 3 4 } test-accesses ] unit-test

! Direct reads of extreme values must round-trip unchanged.
[ HEX: 7fffffff ]
[ int-4{ HEX: 7fffffff 3 4 -8 } first ] unit-test

[ -8 ]
[ int-4{ HEX: 7fffffff 3 4 -8 } last ] unit-test

[ HEX: ffffffff ]
[ uint-4{ HEX: ffffffff 2 3 4 } first ] unit-test

! 64-bit element types.
[ { } ]
[ double-2{ 1.0 2.0 } test-accesses ] unit-test

[ { } ]
[ longlong-2{ 1 2 } test-accesses ] unit-test

[ { } ]
[ ulonglong-2{ 1 2 } test-accesses ] unit-test
481 "== Checking broadcast" print
! Checks `vbroadcast` on a SIMD vector through check-optimizer.
! One test case is generated per valid index of `seq`: the input
! quotation pushes `seq` itself and the tested quotation is
! `[ n vbroadcast ]`. Results are compared with `=`.
! The index list is built with `iota` (as the shuffle checks in this
! file do) rather than by converting the bare length integer to an
! array, so it does not depend on integers behaving as sequences.
: test-broadcast ( seq -- failures )
    [ length iota >array ] keep
    '[ [ _ 1quotation ] dip '[ _ vbroadcast ] ] [ = ] check-optimizer ;
! 32-bit element types: no check-optimizer failures are expected.
[ { } ]
[ float-4{ 1.0 2.0 3.0 4.0 } test-broadcast ] unit-test

[ { } ]
[ int-4{ HEX: 7fffffff 3 4 -8 } test-broadcast ] unit-test

[ { } ]
[ uint-4{ HEX: ffffffff 2 3 4 } test-broadcast ] unit-test

! 64-bit element types.
[ { } ]
[ double-2{ 1.0 2.0 } test-broadcast ] unit-test

[ { } ]
[ longlong-2{ 1 2 } test-broadcast ] unit-test

[ { } ]
[ ulonglong-2{ 1 2 } test-broadcast ] unit-test
494 ! Make sure we use the fallback in the correct situations
! The broadcast index is only declared as a fixnum here, not given as
! a literal; element 2 (the value 3) must fill every lane.
[ int-4{ 3 3 3 3 } ]
[
    int-4{ 12 34 3 17 } 2
    [ { int-4 fixnum } declare vbroadcast ] compile-call
] unit-test
497 "== Checking alien operations" print
499 [ float-4{ 1 2 3 4 } ] [
502 underlying>> 0 float-4-rep alien-vector
503 ] compile-call float-4 boa
506 [ B{ 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 } ] [
507 16 [ 1 ] B{ } replicate-as 16 <byte-array>
510 { byte-array c-ptr fixnum } declare
511 float-4-rep set-alien-vector
516 [ float-array{ 1 2 3 4 } ] [
518 float-array{ 1 2 3 4 } underlying>>
519 float-array{ 4 3 2 1 } clone
520 [ underlying>> 0 float-4-rep set-alien-vector ] keep
530 [ t ] [ [ simd-struct <struct> ] compile-call >c-ptr [ 0 = ] all? ] unit-test
539 float-4{ 1 2 3 4 } >>x
540 longlong-2{ 2 1 } >>y
543 { [ x>> ] [ y>> ] [ z>> ] [ w>> ] } cleave
554 float-4{ 1 2 3 4 } >>x
555 longlong-2{ 2 1 } >>y
558 { [ x>> ] [ y>> ] [ z>> ] [ w>> ] } cleave
562 "== Misc tests" print
! Printing a stack that holds a freshly created char-16 must run
! without leaving anything on the data stack.
[ ]
[ char-16 new 1array stack. ] unit-test
568 int-4{ 1000 1000 1000 1000 }
569 [ { int-4 } declare dup [ * ] [ + ] 2map-reduce ] compile-call
572 ! Coalescing was too aggressive
! Takes a float-4 `axis` and a float `theta` and returns three
! vectors: axis plus the broadcast cosine of theta, the broadcast
! cosine itself, and the broadcast sine.
! The statement order is deliberately kept as-is, since this word
! exists to exercise the compiler.
:: broken ( axis theta -- a b c )
    axis { float-4 } declare drop
    theta { float } declare drop

    theta cos float-4-with :> cos-vec
    theta sin float-4-with :> sin-vec

    axis cos-vec v+ :> shifted

    shifted cos-vec sin-vec ; inline
585 float-4{ 1.0 0.0 1.0 0.0 } pi [ broken 3array ]
586 [ compile-call ] [ call ] 3bi =
589 ! Spilling SIMD values -- this basically just tests that the
590 ! stack was aligned properly by the runtime
592 : simd-spill-test-1 ( a b c -- v )
593 { float-4 float-4 float } declare
! With a final argument of 0.0 the result is expected to be the zero
! vector.
[ float-4{ 0 0 0 0 } ]
[
    float-4{ 1 2 3 4 } float-4{ 4 5 6 7 } 0.0
    simd-spill-test-1
] unit-test
! Computes (a + 3.0) * ((b + d) * sin(c)), where a and c are floats
! and b and d are float-4 vectors.
! The token sequence is kept as in the original because this word is
! used to exercise the compiler.
: simd-spill-test-2 ( a b d c -- v )
    { float float-4 float-4 float } declare
    [
        [ 3.0 + ] 2dip v+
    ] dip
    sin v*n n*v ;
! sin(0.0) is 0.0, so every lane of the product must be zero.
[ float-4{ 0 0 0 0 } ]
[
    5.0 float-4{ 1 2 3 4 } float-4{ 4 5 6 7 } 0.0
    simd-spill-test-2
] unit-test