1 ! Copyright (C) 2005, 2009 Slava Pestov.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors assocs sequences kernel combinators make math
4 math.order math.ranges system namespaces locals layouts words
5 alien alien.accessors alien.c-types literals cpu.architecture
6 cpu.ppc.assembler cpu.ppc.assembler.backend literals compiler.cfg.registers
7 compiler.cfg.instructions compiler.constants compiler.codegen
8 compiler.codegen.fixup compiler.cfg.intrinsics
9 compiler.cfg.stack-frame compiler.units ;
12 ! PowerPC register assignments:
13 ! r2-r12: integer vregs
15 ! r30: integer scratch
19 ! Add some methods to the assembler that are useful to us
! Label-aware methods on the (B) and BC assembler words. Each one assembles
! the branch with a placeholder displacement of 0 and then registers a label
! fixup for the label argument (rc-relative-ppc-3 for (B), rc-relative-ppc-2
! for BC).
20 M: label (B) [ 0 ] 2dip (B) rc-relative-ppc-3 label-fixup ;
21 M: label BC [ 0 BC ] dip rc-relative-ppc-2 label-fixup ;
! Top-level setup. Turns on the float intrinsics and sets the frame-required?
! word property to t on the two integer<->float conversion instructions; their
! code generators in this file go through scratch@ and address memory
! relative to r1.
23 enable-float-intrinsics
26 \ ##integer>float t frame-required? set-word-prop
27 \ ##float>integer t frame-required? set-word-prop
! Lists the register numbers in each register class: integer registers 2-12
! and 15-29, double-float registers 0-29.
! NOTE(review): source lines 31 and 34 (presumably the delimiters around this
! table and the closing ;) are absent from this excerpt.
30 M: ppc machine-registers
32 { int-regs $[ 2 12 [a,b] 15 29 [a,b] append ] }
33 { double-float-regs $[ 0 29 [a,b] ] }
! Register number 30 serves as the scratch register for both integer and
! floating-point code; it lies outside the ranges listed in machine-registers.
36 CONSTANT: scratch-reg 30
37 CONSTANT: fp-scratch-reg 30
! This backend answers f to two-operand?.
39 M: ppc two-operand? f ;
! Load the immediate n into reg; LOAD takes the value before the register,
! hence the swap.
41 M: ppc %load-immediate ( reg n -- ) swap LOAD ;
! Load an object reference into reg: assemble a LOAD32 of a placeholder 0 into
! reg, then record an rc-absolute-ppc-2/2 immediate relocation for obj.
43 M: ppc %load-reference ( reg obj -- )
44 [ 0 swap LOAD32 ] [ rc-absolute-ppc-2/2 rel-immediate ] bi* ;
! Same shape for a symbol looked up in a dll: placeholder LOAD32 into
! register, then an rc-absolute-ppc-2/2 rel-dlsym relocation for symbol/dll.
46 M: ppc %alien-global ( register symbol dll -- )
47 [ 0 swap LOAD32 ] 2dip rc-absolute-ppc-2/2 rel-dlsym ;
! Map a stack location object to its base register: ds-reg for a ds-loc,
! rs-reg for an rs-loc.
52 GENERIC: loc-reg ( loc -- reg )
54 M: ds-loc loc-reg drop ds-reg ;
55 M: rs-loc loc-reg drop rs-reg ;
! Turn a location into a base register plus byte displacement. The
! displacement is the location's n slot converted to cells and negated.
57 : loc>operand ( loc -- reg n )
58 [ loc-reg ] [ n>> cells neg ] bi ; inline
! Load from (LWZ) and store to (STW) a stack location.
60 M: ppc %peek loc>operand LWZ ;
61 M: ppc %replace loc>operand STW ;
! Add n cells to reg in place. The shuffle turns ( n reg ) into
! ( reg reg n-in-bytes ) before ADDI.
63 : (%inc) ( n reg -- ) dup rot cells ADDI ; inline
! Adjust the data stack register / retain stack register by n cells.
65 M: ppc %inc-d ( n -- ) ds-reg (%inc) ;
66 M: ppc %inc-r ( n -- ) rs-reg (%inc) ;
! Hook dispatching on os; it supplies the size that param@ adds to every
! parameter offset.
68 HOOK: reserved-area-size os ( -- n )
70 ! The start of the stack frame contains the size of this frame
71 ! as well as the currently executing XT
72 : factor-area-size ( -- n ) 2 cells ; foldable
! Offsets one cell and two cells below n. %prologue calls both with the frame
! size to place its two STW stores of r11.
73 : next-save ( n -- i ) cell - ;
74 : xt-save ( n -- i ) 2 cells - ;
76 ! Next, we have the spill area as well as the FFI parameter area.
77 ! They overlap, since basic blocks with FFI calls will never
! NOTE(review): the sentence above is cut off; source line 78 is absent from
! this excerpt.
! Offset of byte n of the parameter area: n plus reserved-area-size.
79 : param@ ( n -- x ) reserved-area-size + ; inline
! Size of the parameter save area: eight cells.
81 : param-save-size ( -- n ) 8 cells ; foldable
! NOTE(review): the line below is the body of a word whose header (source
! line 83) is absent from this excerpt. It adds reserved-area-size and
! param-save-size to the two values already on the stack.
84 reserved-area-size param-save-size + + ; inline
! Byte size of the double-float spill slots of the current stack frame:
! the double-float-regs entry of spill-counts>> times that class's reg-size.
! Integer spill slots are addressed starting at this offset.
86 : spill-integer-base ( -- n )
87 stack-frame get spill-counts>> double-float-regs swap at
88 double-float-regs reg-size * ;
! Offset of integer spill slot n: n cells past spill-integer-base, then
! passed through param@.
90 : spill-integer@ ( n -- offset )
91 cells spill-integer-base + param@ ;
! Offset of float spill slot n: n double-float register sizes, then passed
! through param@.
93 : spill-float@ ( n -- offset )
94 double-float-regs reg-size * param@ ;
96 ! Some FP intrinsics need a temporary scratch area in the stack
97 ! frame, 8 bytes in size
! The computation starts from the current frame's total-size>>.
! NOTE(review): the remainder of this word (source lines 100-102) is absent
! from this excerpt, so the final formula is not visible here.
98 : scratch@ ( n -- offset )
99 stack-frame get total-size>>
104 ! Finally we have the linkage area
! Hook dispatching on os; %prologue and %epilogue add its result to the frame
! size to address the slot where r0 is stored and reloaded.
105 HOOK: lr-save os ( -- n )
! The visible first step totals the spill area: for every entry of
! spill-counts>> it multiplies the count by the register class's reg-size and
! sums the products.
! NOTE(review): the remaining steps (source lines 109 onward) are absent
! from this excerpt.
107 M: ppc stack-frame-size ( stack-frame -- i )
108 [ spill-counts>> [ swap reg-size * ] { } assoc>map sum ]
! Call a word: BL with a placeholder target of 0 plus an rc-relative-ppc-3
! rel-word-pic relocation for the word.
117 M: ppc %call ( word -- ) 0 BL rc-relative-ppc-3 rel-word-pic ;
! Tail-jump to a word. First a LOAD32 of a placeholder into r6 with a rel-here
! relocation at offset 8, then B with a placeholder target and an
! rc-relative-ppc-3 rel-word-pic-tail relocation.
! NOTE(review): what the callee expects in r6 is not visible in this file.
119 M: ppc %jump ( word -- )
120 0 6 LOAD32 8 rc-absolute-ppc-2/2 rel-here
121 0 B rc-relative-ppc-3 rel-word-pic-tail ;
! Branch to a label (uses the label method of B's underlying word).
123 M: ppc %jump-label ( label -- ) B ;
! Return through the link register.
124 M: ppc %return ( -- ) BLR ;
! NOTE(review): only the header and one relocation line of %dispatch survive
! in this excerpt (source lines 127 and 129-131 are absent). The visible line
! records an rc-absolute-ppc-2/2 rel-here relocation at ( 4 + offset ) cells.
126 M:: ppc %dispatch ( src temp offset -- )
128 4 offset + cells rc-absolute-ppc-2/2 rel-here
! Emit one jump-table entry: four zero bytes plus an rc-absolute-cell
! relocation for the word.
133 M: ppc %dispatch-label ( word -- )
134 B{ 0 0 0 0 } % rc-absolute-cell rel-word ;
! Compute the operand pair for a slot access with a register index. The
! result is temp as base register and the negated tag as displacement.
! NOTE(review): source line 137, which presumably computes temp from obj and
! slot, is absent from this excerpt.
136 :: (%slot) ( obj slot tag temp -- reg offset )
138 temp tag neg ; inline
! Immediate-index variant: base register is obj itself, displacement is
! slot cells minus tag.
140 : (%slot-imm) ( obj slot tag -- reg offset )
141 [ cells ] dip - ; inline
! Slot loads (LWZ) and stores (STW) built on the two helpers above.
143 M: ppc %slot ( dst obj slot tag temp -- ) (%slot) LWZ ;
144 M: ppc %slot-imm ( dst obj slot tag -- ) (%slot-imm) LWZ ;
145 M: ppc %set-slot ( src obj slot tag temp -- ) (%slot) STW ;
146 M: ppc %set-slot-imm ( src obj slot tag -- ) (%slot-imm) STW ;
! Fetch a character from a string. The visible instructions load a byte at
! string-offset from temp into dst, load the word at string-aux-offset of src
! into temp, and load a halfword at byte-array-offset from temp.
! NOTE(review): source lines 149-151, 153-154, 156-157 and 159-162 are absent
! from this excerpt, so the address arithmetic and the way the two loads are
! combined cannot be seen here.
148 M:: ppc %string-nth ( dst src index temp -- )
152 dst temp string-offset LBZ
155 temp src string-aux-offset LWZ
158 temp temp byte-array-offset LHZ
! Store the byte ch at string-offset from temp.
! NOTE(review): source line 165, which presumably forms temp from obj and
! index, is absent from this excerpt.
164 M:: ppc %set-string-nth-fast ( ch obj index temp -- )
166 ch temp string-offset STB ;
! Integer arithmetic methods; most map directly onto one assembler word.
! NOTE(review): source lines 168, 172, 174 and 176-178 are absent from this
! excerpt, so the register-register forms other than %sub are not shown.
169 M: ppc %add-imm ADDI ;
! SUBF is the PowerPC "subtract from" form, so the two sources are swapped.
170 M: ppc %sub swap SUBF ;
171 M: ppc %sub-imm SUBI ;
173 M: ppc %mul-imm MULLI ;
175 M: ppc %and-imm ANDI ;
179 M: ppc %xor-imm XORI ;
! swapd exchanges the first two operands (dst and src) before the shift
! word; %sar-imm passes its operands through unchanged.
180 M: ppc %shl-imm swapd SLWI ;
181 M: ppc %shr-imm swapd SRWI ;
182 M: ppc %sar-imm SRAWI ;
! Tail-call a C function: load the symbol into scratch-reg with
! %alien-global, move it to the count register (MTCTR) and branch through it
! (BCTR). Unlike %alien-invoke, no linking branch is used.
185 : %alien-invoke-tail ( func dll -- )
186 [ scratch-reg ] 2dip %alien-global scratch-reg MTCTR BCTR ;
! NOTE(review): only the header of exchange-regs survives in this excerpt
! (source lines 189-191 are absent).
188 :: exchange-regs ( r1 r2 -- )
! Emit a register move only when the two register numbers differ.
193 : ?MR ( r1 r2 -- ) 2dup = [ 2drop ] [ MR ] if ;
! Place src1 in r3 and src2 in r4. The first four clauses handle the cases
! where a source already sits in r3 or r4, so that a plain pair of moves
! would overwrite a value before it is read; the default clause is the plain
! pair of moves.
! NOTE(review): source lines 196 and 202 (presumably the opening delimiter
! and the closing "} cond ;") are absent from this excerpt.
195 :: move>args ( src1 src2 -- )
197 { [ src1 4 = ] [ 3 src2 ?MR 3 4 exchange-regs ] }
198 { [ src1 3 = ] [ 4 src2 ?MR ] }
199 { [ src2 3 = ] [ 4 src1 ?MR 3 4 exchange-regs ] }
200 { [ src2 4 = ] [ 3 src1 ?MR ] }
201 [ 3 src1 MR 4 src2 MR ]
! Shared code shape for overflow-checked fixnum arithmetic. insn is a
! quotation that assembles the arithmetic instruction; its result goes to
! scratch-reg and is stored at offset 0 from ds-reg. If the overflow bit is
! clear (BNO) the slow path is skipped.
! NOTE(review): source lines 210, 214 and 216 are absent from this excerpt;
! the use of func (presumably an %alien-invoke after
! %prepare-alien-invoke) is therefore not visible.
208 :: overflow-template ( src1 src2 insn func -- )
209 "no-overflow" define-label
211 scratch-reg src2 src1 insn call
212 scratch-reg ds-reg 0 STW
213 "no-overflow" get BNO
215 %prepare-alien-invoke
217 "no-overflow" resolve-label ; inline
! Tail-position variant: after the "overflow" label it tail-calls func via
! %alien-invoke-tail.
! NOTE(review): source lines 221, 223, 225 and 227 are absent from this
! excerpt, including the branch to "overflow" and whatever ends the
! non-overflow path.
219 :: overflow-template-tail ( src1 src2 insn func -- )
220 "overflow" define-label
222 scratch-reg src2 src1 insn call
224 scratch-reg ds-reg 0 STW
226 "overflow" resolve-label
228 %prepare-alien-invoke
229 func f %alien-invoke-tail ; inline
! Overflow-checked fixnum add and subtract, in normal and tail position.
! Each passes the overflow-recording instruction (ADDO. or SUBFO.) and the
! name of the C routine to call on overflow to the matching template.
231 M: ppc %fixnum-add ( src1 src2 -- )
232 [ ADDO. ] "overflow_fixnum_add" overflow-template ;
234 M: ppc %fixnum-add-tail ( src1 src2 -- )
235 [ ADDO. ] "overflow_fixnum_add" overflow-template-tail ;
237 M: ppc %fixnum-sub ( src1 src2 -- )
238 [ SUBFO. ] "overflow_fixnum_subtract" overflow-template ;
240 M: ppc %fixnum-sub-tail ( src1 src2 -- )
241 [ SUBFO. ] "overflow_fixnum_subtract" overflow-template-tail ;
! Overflow-checked fixnum multiply. src1 is shifted right arithmetically by
! tag-bits into temp1, then multiplied by src2 with MULLWO. into temp2. When
! no overflow is recorded (BNO) the slow path is skipped; otherwise src2 is
! shifted right by tag-bits as well and "overflow_fixnum_multiply" is called.
! NOTE(review): source lines 245, 248 and 251 are absent from this excerpt
! (presumably argument setup and the store of the result).
243 M:: ppc %fixnum-mul ( src1 src2 temp1 temp2 -- )
244 "no-overflow" define-label
246 temp1 src1 tag-bits get SRAWI
247 temp2 temp1 src2 MULLWO.
249 "no-overflow" get BNO
250 src2 src2 tag-bits get SRAWI
252 %prepare-alien-invoke
253 "overflow_fixnum_multiply" f %alien-invoke
254 "no-overflow" resolve-label ;
! Tail-position variant; the overflow path ends in %alien-invoke-tail.
! NOTE(review): source lines 258, 261-263 and 266 are absent from this
! excerpt, including the branch to "overflow" and the non-overflow exit.
256 M:: ppc %fixnum-mul-tail ( src1 src2 temp1 temp2 -- )
257 "overflow" define-label
259 temp1 src1 tag-bits get SRAWI
260 temp2 temp1 src2 MULLWO.
264 "overflow" resolve-label
265 src2 src2 tag-bits get SRAWI
267 %prepare-alien-invoke
268 "overflow_fixnum_multiply" f %alien-invoke-tail ;
! Byte displacement of cell n of a bignum, measured from a pointer that
! carries the bignum tag: n cells minus the bignum tag number.
270 : bignum@ ( n -- offset ) cells bignum tag-number - ; inline
! Convert an integer to a freshly allotted bignum. dst starts out as a
! reference to the bignum zero; otherwise a 4-cell bignum is allotted and
! temp is stored into cells 1, 2 and 3 at different stages.
! NOTE(review): source lines 273-274, 277-279, 281-282, 284-285, 287-288,
! 291-295 and 297-298 are absent from this excerpt, so what temp holds at
! each store is not visible here.
272 M:: ppc %integer>bignum ( dst src temp -- )
275 dst 0 >bignum %load-reference
276 ! Is it zero? Then just go to the end and return this zero
280 dst 4 cells bignum temp %allot
283 temp dst 1 bignum@ STW
! Arithmetic shift right by cell-bits - 1.
286 temp temp cell-bits 1- SRAWI
289 temp dst 2 bignum@ STW
290 ! Make negative value positive
296 temp dst 3 bignum@ STW
! Convert a bignum to an integer. The visible instructions read cell 1 of
! src into temp and compare it with the tagged fixnum 1, read cell 3 into
! dst, and read cell 2 into temp.
! NOTE(review): source lines 301-302, 305-306, 308-309, 311, 314-317 and
! 319-321 are absent from this excerpt, including the branches and the final
! multiplication that the surviving comments describe.
300 M:: ppc %bignum>integer ( dst src temp -- )
303 temp src 1 bignum@ LWZ
304 ! if the length is 1, it's just the sign and nothing else,
307 0 temp 1 tag-fixnum CMPI
310 dst src 3 bignum@ LWZ
312 temp src 2 bignum@ LWZ
313 ! branchless arithmetic: we want to turn 0 into 1,
318 ! multiply value by sign
! Double-precision float arithmetic; each method is a single assembler word
! taking the operands unchanged.
323 M: ppc %add-float FADD ;
324 M: ppc %sub-float FSUB ;
325 M: ppc %mul-float FMUL ;
326 M: ppc %div-float FDIV ;
! Convert an integer to a double through the 8-byte scratch slot addressed
! off r1. The word HEX: 4330 << 16 goes to scratch offset 0; scratch-reg with
! its top bit flipped (XORIS HEX: 8000) goes to scratch offset 4. The float
! constant loaded afterwards equals 2^52 + 2^31, and it is subtracted from dst.
! NOTE(review): source lines 331 and 334 are absent from this excerpt
! (presumably the copy of src into scratch-reg and the LFD that reads the
! slot back into dst).
328 M:: ppc %integer>float ( dst src -- )
329 HEX: 4330 scratch-reg LIS
330 scratch-reg 1 0 scratch@ STW
332 scratch-reg dup HEX: 8000 XORIS
333 scratch-reg 1 4 scratch@ STW
335 scratch-reg 4503601774854144.0 %load-reference
336 fp-scratch-reg scratch-reg float-offset LFD
337 dst dst fp-scratch-reg FSUB ;
! Convert a double to an integer: FCTIWZ puts the converted value in
! fp-scratch-reg, STFD writes that register to the scratch slot, and the
! word at offset 4 of the slot is loaded into dst.
339 M:: ppc %float>integer ( dst src -- )
340 fp-scratch-reg src FCTIWZ
341 fp-scratch-reg 1 0 scratch@ STFD
342 dst 1 4 scratch@ LWZ ;
! Register-to-register moves for integer (MR) and float (FMR) registers.
344 M: ppc %copy ( dst src -- ) MR ;
346 M: ppc %copy-float ( dst src -- ) FMR ;
! Load the double stored at float-offset from the boxed float src.
348 M: ppc %unbox-float ( dst src -- ) float-offset LFD ;
! Allot a 16-byte float object in dst (temp is handed to %allot as its
! nursery-ptr register) and store src at float-offset from it.
350 M:: ppc %box-float ( dst src temp -- )
351 dst 16 float temp %allot
352 src dst float-offset STFD ;
! Compute the raw address denoted by a c-ptr, accumulating it in dst while
! scratch-reg walks the object chain: the object is compared against the f
! tag, its header is checked against the alien type, an alien's offset is
! loaded and its underlying object followed, and finally the base address
! plus byte-array-offset is added.
! NOTE(review): source lines 355, 358, 360, 363, 365-366, 374, 377 and
! 383-384 are absent from this excerpt, including the initialisation of dst,
! the branches back to "start" and out to "end", and the closing ;.
354 M:: ppc %unbox-any-c-ptr ( dst src temp -- )
356 { "is-byte-array" "end" "start" } [ define-label ] each
357 ! Address is computed in dst
359 ! Load object into scratch-reg
361 ! We come back here with displaced aliens
362 "start" resolve-label
364 0 scratch-reg \ f tag-number CMPI
367 ! Is the object an alien?
368 0 scratch-reg header-offset LWZ
369 0 0 alien type-number tag-fixnum CMPI
370 "is-byte-array" get BNE
371 ! If so, load the offset
372 0 scratch-reg alien-offset LWZ
373 ! Add it to address being computed
375 ! Now recurse on the underlying alien
376 scratch-reg scratch-reg underlying-alien-offset LWZ
378 "is-byte-array" resolve-label
379 ! Add byte array address to address being computed
380 dst dst scratch-reg ADD
381 ! Add an offset to start of byte array's data area
382 dst dst byte-array-offset ADDI
! Byte displacement of cell n of an alien, measured from a pointer that
! carries the object tag: n cells minus the object tag number.
386 : alien@ ( n -- n' ) cells object tag-number - ;
! Box a raw address as an alien. dst starts out as f; otherwise a 4-cell
! alien is allotted and temp (set to f) is stored into cells 1 and 2.
! NOTE(review): source lines 389-390, 392-393, 395-397 and 402-403 are absent
! from this excerpt, including the test that skips allocation, the store of
! src, and the closing ;.
388 M:: ppc %box-alien ( dst src temp -- )
391 dst \ f tag-number %load-immediate
394 dst 4 cells alien temp %allot
398 temp \ f tag-number %load-immediate
399 temp dst 1 alien@ STW
400 ! Store underlying-alien slot
401 temp dst 2 alien@ STW
! Raw memory loads, all at displacement 0 from the address register.
! NOTE(review): source lines 407, 410, 412, 415, 418 and 420 are absent from
! this excerpt.
405 M: ppc %alien-unsigned-1 0 LBZ ;
406 M: ppc %alien-unsigned-2 0 LHZ ;
! There is no sign-extending byte load here: load with LBZ, then sign-extend
! dst in place with EXTSB.
408 M: ppc %alien-signed-1 dupd 0 LBZ dup EXTSB ;
409 M: ppc %alien-signed-2 0 LHA ;
411 M: ppc %alien-cell 0 LWZ ;
413 M: ppc %alien-float 0 LFS ;
414 M: ppc %alien-double 0 LFD ;
! Raw memory stores at displacement 0; the two incoming operands are swapped
! to match the store words' operand order.
416 M: ppc %set-alien-integer-1 swap 0 STB ;
417 M: ppc %set-alien-integer-2 swap 0 STH ;
419 M: ppc %set-alien-cell swap 0 STW ;
421 M: ppc %set-alien-float swap 0 STFS ;
422 M: ppc %set-alien-double swap 0 STFD ;
! Load the "nursery" symbol into reg via %alien-global.
424 : load-zone-ptr ( reg -- )
425 "nursery" f %alien-global ;
! Point nursery-ptr at the nursery, then load the word at offset 4 from it
! into allot-ptr.
427 : load-allot-ptr ( nursery-ptr allot-ptr -- )
428 [ drop load-zone-ptr ] [ swap 4 LWZ ] 2bi ;
! Bump the allocation pointer: scratch-reg = allot-ptr + n rounded up to a
! multiple of 8, written back to offset 4 from nursery-ptr.
430 :: inc-allot-ptr ( nursery-ptr allot-ptr n -- )
431 scratch-reg allot-ptr n 8 align ADDI
432 scratch-reg nursery-ptr 4 STW ;
! Write the object header: the class's type number, tagged as a fixnum, is
! stored at offset 0 from dst.
434 :: store-header ( dst class -- )
435 class type-number tag-fixnum scratch-reg LI
436 scratch-reg dst 0 STW ;
! OR the tag number into dst in place.
438 : store-tagged ( dst tag -- )
439 dupd tag-number ORI ;
! Allot size bytes of the given class, leaving a tagged pointer in dst.
! Order matters: the header is stored through the untagged dst before the
! tag bits are ORed in.
441 M:: ppc %allot ( dst size class nursery-ptr -- )
442 nursery-ptr dst load-allot-ptr
443 nursery-ptr dst size inc-allot-ptr
444 dst class store-header
445 dst class store-tagged ;
! Load the "cards_offset" / "decks_offset" symbol into dst, then replace dst
! with the word stored at offset 0 from it.
447 : load-cards-offset ( dst -- )
448 [ "cards_offset" f %alien-global ] [ dup 0 LWZ ] bi ;
450 : load-decks-offset ( dst -- )
451 [ "decks_offset" f %alien-global ] [ dup 0 LWZ ] bi ;
! Write barrier for src. scratch-reg holds card-mark. The same three steps
! run twice, once for cards and once for decks: load the table offset,
! shift src right by card-bits or deck-bits into card#, and store the mark
! byte with STBX using table and card#.
! NOTE(review): source lines 455-456 and 460-461 are absent from this
! excerpt; they may be comments or blank lines, but that cannot be confirmed.
453 M:: ppc %write-barrier ( src card# table -- )
454 card-mark scratch-reg LI
457 table load-cards-offset
458 src card# card-bits SRWI
459 table scratch-reg card# STBX
462 table load-decks-offset
463 src card# deck-bits SRWI
464 table scratch-reg card# STBX ;
! NOTE(review): this is the tail of a word whose header and first lines
! (source lines 466-468) are absent from this excerpt, as is line 473
! (presumably the conditional branch to "end"). The name used for this block
! is a guess. The visible code loads two nursery fields through r12, adds
! 1024 to the first, compares the two, and calls "minor_gc" on the
! fall-through path.
469 11 12 cell LWZ ! nursery.here -> r11
470 12 12 3 cells LWZ ! nursery.end -> r12
471 11 11 1024 ADDI ! add ALLOT_BUFFER_ZONE to here
472 11 0 12 CMP ! is here >= end?
474 %prepare-alien-invoke
475 "minor_gc" f %alien-invoke
476 "end" resolve-label ;
! Set up a stack frame of n bytes. r11 gets a placeholder LOAD32 with a
! rel-this relocation. The visible quotations then lower r1 by n, store r11
! at xt-save and next-save of n, and store r0 at n + lr-save, all relative
! to r1.
! NOTE(review): source lines 480-481, 484 and 487 are absent from this
! excerpt, including the combinator that applies these quotations, whatever
! is loaded into r11 and r0 in between, and the closing ;.
478 M: ppc %prologue ( n -- )
479 0 11 LOAD32 rc-absolute-ppc-2/2 rel-this
482 [ [ 1 1 ] dip neg ADDI ]
483 [ [ 11 1 ] dip xt-save STW ]
485 [ [ 11 1 ] dip next-save STW ]
486 [ [ 0 1 ] dip lr-save + STW ]
! Tear the frame down: reload r0 from n + lr-save off r1, then raise r1 by n.
! NOTE(review): source lines 495-496 (presumably the move of r0 to the link
! register and the closing ;) are absent from this excerpt.
489 M: ppc %epilogue ( n -- )
490 #! At the end of each word that calls a subroutine, we store
491 #! the previous link register value in r0 by popping it off
492 #! the stack, set the link register to the contents of r0,
493 #! and jump to the link register.
494 [ [ 0 1 ] dip lr-save + LWZ ]
495 [ [ 1 1 ] dip ADDI ] bi
! Materialise a condition as a boolean in dst. dst is first set to f; the
! conditional branch assembled by executing `word` jumps to "end" and so
! skips the load of t.
! NOTE(review): source line 499 (presumably the definition of the "end"
! label) is absent from this excerpt.
498 :: (%boolean) ( dst temp word -- )
500 dst \ f tag-number %load-immediate
501 "end" get word execute
502 dst \ t %load-reference
503 "end" get resolve-label ; inline
! Select the branch word for a condition code and hand it to (%boolean).
! NOTE(review): source lines 506 and 513 are absent from this excerpt; line
! 506 opens the case table and may transform cc first, so the pairing of
! condition codes with branch words shown here may not be the whole story.
505 : %boolean ( dst temp cc -- )
507 { cc< [ \ BLT (%boolean) ] }
508 { cc<= [ \ BLE (%boolean) ] }
509 { cc> [ \ BGT (%boolean) ] }
510 { cc>= [ \ BGE (%boolean) ] }
511 { cc= [ \ BEQ (%boolean) ] }
512 { cc/= [ \ BNE (%boolean) ] }
! Assemble the comparison instruction only; each helper inserts the
! literal 0 that the compare words take as an extra operand.
515 : (%compare) ( src1 src2 -- ) [ 0 ] dip CMP ; inline
516 : (%compare-imm) ( src1 src2 -- ) [ 0 ] 2dip CMPI ; inline
517 : (%compare-float) ( src1 src2 -- ) [ 0 ] dip FCMPU ; inline
! Compare, then turn the outcome into a boolean value with %boolean.
519 M: ppc %compare (%compare) %boolean ;
520 M: ppc %compare-imm (%compare-imm) %boolean ;
521 M: ppc %compare-float (%compare-float) %boolean ;
! NOTE(review): only the header of %branch survives in this excerpt (source
! lines 524-531 are absent).
523 : %branch ( label cc -- )
! Compare, then branch to a label with %branch.
533 M: ppc %compare-branch (%compare) %branch ;
534 M: ppc %compare-imm-branch (%compare-imm) %branch ;
535 M: ppc %compare-float-branch (%compare-float) %branch ;
! Spill and reload registers to numbered spill slots. The slot number is
! turned into an offset, and "1 swap" supplies r1 as the base register ahead
! of that offset.
537 M: ppc %spill-integer ( src n -- ) spill-integer@ 1 swap STW ;
538 M: ppc %reload-integer ( dst n -- ) spill-integer@ 1 swap LWZ ;
540 M: ppc %spill-float ( src n -- ) spill-float@ 1 swap STFD ;
541 M: ppc %reload-float ( dst n -- ) spill-float@ 1 swap LFD ;
! Return and parameter registers: integers return in r3 and are passed in
! r3-r10; floats return in register 1.
! NOTE(review): source line 548 is absent from this excerpt (presumably the
! float parameter register list).
545 M: int-regs return-reg drop 3 ;
546 M: int-regs param-regs drop { 3 4 5 6 7 8 9 10 } ;
547 M: float-regs return-reg drop 1 ;
! Store / load an integer parameter register to / from the local@ slot for
! the given stack index, relative to r1.
549 M: int-regs %save-param-reg drop 1 rot local@ STW ;
550 M: int-regs %load-param-reg drop 1 rot local@ LWZ ;
! Float store that picks the single- or double-precision instruction from
! the register class.
552 GENERIC: STF ( src dst off reg-class -- )
554 M: single-float-regs STF drop STFS ;
555 M: double-float-regs STF drop STFD ;
557 M: float-regs %save-param-reg [ 1 rot local@ ] dip STF ;
! Float load counterpart of STF.
559 GENERIC: LF ( dst src off reg-class -- )
561 M: single-float-regs LF drop LFS ;
562 M: double-float-regs LF drop LFD ;
564 M: float-regs %load-param-reg [ 1 rot local@ ] dip LF ;
! Copy one word from the local@ slot of `stack` to the param@ slot of `reg`,
! both relative to r1, going through r0.
566 M: stack-params %load-param-reg ( stack reg reg-class -- )
567 drop [ 0 1 rot local@ LWZ 0 1 ] dip param@ STW ;
! A param@ offset advanced by the current frame's total-size>>.
569 : next-param@ ( n -- x ) param@ stack-frame get total-size>> + ;
! Copy one word from a next-param@ slot to a local@ slot, both relative to
! r1, going through r0.
! NOTE(review): source line 574 is absent from this excerpt; it presumably
! drops reg-class and arranges the two remaining inputs, so the exact
! operands of the two quotations below cannot be confirmed here.
571 M: stack-params %save-param-reg ( stack reg reg-class -- )
572 #! Funky. Read the parameter from the caller's stack frame.
573 #! This word is used in callbacks
575 [ 0 1 ] dip next-param@ LWZ
576 [ 0 1 ] dip local@ STW ;
! Prepare for an unbox call; the visible instruction lowers ds-reg by one
! cell.
! NOTE(review): source line 580 (presumably the load of the top of stack into
! a register) is absent from this excerpt.
578 M: ppc %prepare-unbox ( -- )
579 ! First parameter is top of stack
581 ds-reg dup cell SUBI ;
! Unbox a value. When n is not f, the class's return register is saved with
! %save-param-reg; when n is f, both remaining inputs are dropped.
! NOTE(review): source lines 585-586 (presumably the call to func) are absent
! from this excerpt.
583 M: ppc %unbox ( n reg-class func -- )
584 ! Value must be in r3
587 ! Store the return value on the C stack
588 over [ [ return-reg ] keep %save-param-reg ] [ 2drop ] if ;
! Unbox a two-register value: r3 is stored at local@ of n and r4 one cell
! above it, relative to r1.
! NOTE(review): source lines 592-593, 595 and 598 are absent from this
! excerpt, including the call to func, the guard around the stores, and the
! closing ;.
590 M: ppc %unbox-long-long ( n func -- )
591 ! Value must be in r3:r4
594 ! Store the return value on the C stack
596 [ [ 3 1 ] dip local@ STW ]
597 [ [ 4 1 ] dip cell + local@ STW ] bi
! Copy a struct out of an alien: r4 = r1 + local@ of n (the destination),
! r5 = heap-size of the c-type, then call "to_value_struct".
! NOTE(review): source line 604 is absent from this excerpt; it is most
! likely a comment, but that cannot be confirmed.
600 M: ppc %unbox-large-struct ( n c-type -- )
601 ! Value must be in r3
602 ! Compute destination address and load struct size
603 [ [ 4 1 ] dip local@ ADDI ] [ heap-size 5 LI ] bi*
605 "to_value_struct" f %alien-invoke ;
! Box a value. When n is not f, the value is first loaded from its stack
! slot into parameter register 0 of the class; when n is f, nothing is
! loaded.
! NOTE(review): source lines 610 and 612 are absent from this excerpt
! (presumably the rest of the comment and the call to func).
607 M: ppc %box ( n reg-class func -- )
608 ! If the source is a stack location, load it into freg #0.
609 ! If the source is f, then we assume the value is already in
611 [ over [ 0 over param-reg swap %load-param-reg ] [ 2drop ] if ] dip
! Box a two-register value: r3 and r4 are loaded from local@ of n and the
! cell above it, then func is called.
! NOTE(review): source lines 615-616 and 619 are absent from this excerpt,
! including the opening of the quotation closed on the last line.
614 M: ppc %box-long-long ( n func -- )
617 [ [ 3 1 ] dip local@ LWZ ]
618 [ [ 4 1 ] dip cell + local@ LWZ ] bi
620 ] dip f %alien-invoke ;
! Offset of the struct return area: if n is f, the current frame's params>>
! is used in its place; the result goes through local@.
622 : struct-return@ ( n -- n )
623 [ stack-frame get params>> ] unless* local@ ;
! r3 = r1 + struct-return@ of f.
! NOTE(review): source line 628 (at least the closing ;) is absent from this
! excerpt.
625 M: ppc %prepare-box-struct ( -- )
626 #! Compute target address for value struct return
627 3 1 f struct-return@ ADDI
! Box a struct stored in the frame: r3 = r1 + struct-return@ of n,
! r4 = heap-size of the c-type, then call "box_value_struct".
! NOTE(review): source line 634 is absent from this excerpt; it is most
! likely a comment, but that cannot be confirmed.
630 M: ppc %box-large-struct ( n c-type -- )
631 ! If n = f, then we're boxing a returned struct
632 ! Compute destination address and load struct size
633 [ [ 3 1 ] dip struct-return@ ADDI ] [ heap-size 4 LI ] bi*
635 "box_value_struct" f %alien-invoke ;
! Publish the Factor stack pointers before calling into C: scratch-reg is
! loaded with the word stored at the "stack_chain" symbol, then ds-reg and
! rs-reg are stored at offsets 8 and 12 from it.
! NOTE(review): source lines 640 and 643 are absent from this excerpt; line
! 640 is the end of the comment sentence below.
637 M: ppc %prepare-alien-invoke
638 #! Save Factor stack pointers in case the C code calls a
639 #! callback which does a GC, which must reliably trace
641 scratch-reg "stack_chain" f %alien-global
642 scratch-reg scratch-reg 0 LWZ
644 ds-reg scratch-reg 8 STW
645 rs-reg scratch-reg 12 STW ;
! Call a C function: load the symbol into r11, move it to the link register
! (MTLR) and branch-and-link through it (BLRL).
647 M: ppc %alien-invoke ( symbol dll -- )
648 [ 11 ] 2dip %alien-global 11 MTLR BLRL ;
! Load the quotation reference into r3 and call "c_to_factor".
650 M: ppc %alien-callback ( quot -- )
651 3 swap %load-reference "c_to_factor" f %alien-invoke ;
! Calls "unbox_alien".
! NOTE(review): source lines 655 (the rest of this word) and 658 (the body of
! %alien-indirect) are absent from this excerpt.
653 M: ppc %prepare-alien-indirect ( -- )
654 "unbox_alien" f %alien-invoke
657 M: ppc %alien-indirect ( -- )
! Return a value from a callback; the only visible instruction is the call
! to "unnest_stacks".
! NOTE(review): source lines 662-663, 667 and 669 are absent from this
! excerpt, i.e. every step described by the comments other than that call.
660 M: ppc %callback-value ( ctype -- )
661 ! Save top of data stack
664 ! Restore data/call/retain stacks
665 "unnest_stacks" f %alien-invoke
666 ! Restore top of data stack
668 ! Unbox former top of data stack to return registers
! True when n lies in the signed 16-bit range -32768..32767.
671 M: ppc small-enough? ( n -- ? ) -32768 32767 between? ;
! Reads the return-in-registers?>> slot of the c-type.
673 M: ppc return-struct-in-registers? ( c-type -- ? )
674 c-type return-in-registers?>> ;
! Calls "box_medium_struct".
! NOTE(review): source line 678 is absent from this excerpt (presumably it
! consumes c-type to set up an argument).
676 M: ppc %box-small-struct ( c-type -- )
677 #! Box a <= 16-byte struct returned in r3:r4:r5:r6
679 "box_medium_struct" f %alien-invoke ;
! Helpers for unboxing a struct of 1, 2 or 4 cells. Each begins by calling
! "alien_offset".
! NOTE(review): source lines 684, 689-690 and 695-698 are absent from this
! excerpt, i.e. the loads that follow each call and the closing ; of each
! helper.
681 : %unbox-struct-1 ( -- )
682 ! Alien must be in r3.
683 "alien_offset" f %alien-invoke
686 : %unbox-struct-2 ( -- )
687 ! Alien must be in r3.
688 "alien_offset" f %alien-invoke
692 : %unbox-struct-4 ( -- )
693 ! Alien must be in r3.
694 "alien_offset" f %alien-invoke
! Dispatch on the struct size in cells: heap-size rounded up to a multiple
! of cell, divided by cell.
! NOTE(review): source lines 706-708 (presumably the closing "} case ;") are
! absent from this excerpt.
700 M: ppc %unbox-small-struct ( size -- )
701 #! Alien must be in r3 (see the %unbox-struct-N helpers).
702 heap-size cell align cell /i {
703 { 1 [ %unbox-struct-1 ] }
704 { 2 [ %unbox-struct-2 ] }
705 { 4 [ %unbox-struct-4 ] }
! Top-level fragments from the end of the file.
! NOTE(review): source lines 709-710, 713-714, 716-718 and 721-722 are absent
! from this excerpt, so the surrounding cond and the object being configured
! with >>getter / >>setter / >>boxer / >>unboxer are not visible.
! Load the OS-specific vocabulary for Mac OS X or Linux.
711 { [ os macosx? ] [ "cpu.ppc.macosx" require ] }
712 { [ os linux? ] [ "cpu.ppc.linux" require ] }
! Mark the "complex-double" c-type as returned in registers.
715 "complex-double" c-type t >>return-in-registers? drop
! Define the "bool" primitive type: a 4-byte unsigned getter/setter pair
! converting through c-bool> and >c-bool, boxed with "box_boolean" and
! unboxed with "to_boolean".
719 [ alien-unsigned-4 c-bool> ] >>getter
720 [ [ >c-bool ] 2dip set-alien-unsigned-4 ] >>setter
723 "box_boolean" >>boxer
724 "to_boolean" >>unboxer
725 "bool" define-primitive-type
726 ] with-compilation-unit