1 ! Copyright (C) 2005, 2009 Slava Pestov.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors assocs sequences kernel combinators make math
4 math.order math.ranges system namespaces locals layouts words
5 alien alien.accessors alien.c-types literals cpu.architecture
6 cpu.ppc.assembler cpu.ppc.assembler.backend compiler.cfg.registers
7 compiler.cfg.instructions compiler.cfg.comparisons
8 compiler.codegen.fixup compiler.cfg.intrinsics
9 compiler.cfg.stack-frame compiler.cfg.build-stack-frame
10 compiler.units compiler.constants compiler.codegen ;
11 FROM: cpu.ppc.assembler => B ;
14 ! PowerPC register assignments:
15 ! r2-r12: integer vregs
17 ! r30: integer scratch
21 ! Add some methods to the assembler that are useful to us
! Unconditional branch to a label: (B) is emitted with a 0 placeholder
! target, then the label is passed to label-fixup with relocation class
! rc-relative-ppc-3.
22 M: label (B) [ 0 ] 2dip (B) rc-relative-ppc-3 label-fixup ;
! Conditional branch to a label: BC is emitted with a 0 placeholder
! target, then the label is passed to label-fixup with relocation class
! rc-relative-ppc-2.
23 M: label BC [ 0 BC ] dip rc-relative-ppc-2 label-fixup ;
25 enable-float-intrinsics
! Set the frame-required? word property to t on both int<->float
! conversion instructions. Their implementations in this file store
! through scratch@ offsets from register 1.
28 \ ##integer>float t frame-required? set-word-prop
29 \ ##float>integer t frame-required? set-word-prop
! Registers made available per register class.
32 M: ppc machine-registers
! Integer registers: the inclusive ranges 2..12 and 15..29, appended.
34 { int-regs $[ 2 12 [a,b] 15 29 [a,b] append ] }
! Float registers: the inclusive range 0..29.
35 { float-regs $[ 0 29 [a,b] ] }
! Register number 30 is reserved as scratch in both register classes; it
! lies outside the integer (2..12, 15..29) and float (0..29) ranges
! listed in machine-registers.
38 CONSTANT: scratch-reg 30
39 CONSTANT: fp-scratch-reg 30
! This backend always answers f to two-operand?.
41 M: ppc two-operand? f ;

! Load the immediate n into reg. LOAD is called with the value first and
! the register second, hence the swap.
43 M: ppc %load-immediate ( reg n -- ) swap LOAD ;
! Load a reference to obj into reg: a LOAD32 of the placeholder value 0
! is emitted for reg, and obj is passed to rel-immediate with relocation
! class rc-absolute-ppc-2/2.
45 M: ppc %load-reference ( reg obj -- )
46 [ 0 swap LOAD32 ] [ rc-absolute-ppc-2/2 rel-immediate ] bi* ;
! Load the address of a symbol from a dll into register: a LOAD32 of the
! placeholder value 0 is emitted for the register, and symbol/dll are
! passed to rel-dlsym with relocation class rc-absolute-ppc-2/2.
48 M: ppc %alien-global ( register symbol dll -- )
49 [ 0 swap LOAD32 ] 2dip rc-absolute-ppc-2/2 rel-dlsym ;
! Map a stack location object to the register holding that stack's
! pointer: ds-reg for a ds-loc, rs-reg for an rs-loc.
54 GENERIC: loc-reg ( loc -- reg )
56 M: ds-loc loc-reg drop ds-reg ;
57 M: rs-loc loc-reg drop rs-reg ;
! Turn a stack location into a ( base-register offset ) pair. The offset
! is the location's n slot scaled to cells and negated.
59 : loc>operand ( loc -- reg n )
60 [ loc-reg ] [ n>> cells neg ] bi ; inline
! Read a stack location: LWZ from the address given by loc>operand.
62 M: ppc %peek loc>operand LWZ ;
! Write a stack location: STW to the address given by loc>operand.
63 M: ppc %replace loc>operand STW ;
! Add n cells to reg in place (ADDI with reg as both destination and
! source).
65 :: (%inc) ( n reg -- ) reg reg n cells ADDI ; inline
! Adjust the data stack pointer register by n cells.
67 M: ppc %inc-d ( n -- ) ds-reg (%inc) ;
! Adjust the retain stack pointer register by n cells.
68 M: ppc %inc-r ( n -- ) rs-reg (%inc) ;
! Size of the reserved area of a stack frame; dispatched on the os
! variable, so each OS-specific vocabulary supplies its own value.
70 HOOK: reserved-area-size os ( -- n )
72 ! The start of the stack frame contains the size of this frame
73 ! as well as the currently executing XT
! Two cells are set aside at the start of the frame.
74 : factor-area-size ( -- n ) 2 cells ; foldable
! Given frame size n, offset of the slot one cell below n.
75 : next-save ( n -- i ) cell - ;
! Given frame size n, offset of the slot two cells below n.
76 : xt-save ( n -- i ) 2 cells - ;
78 ! Next, we have the spill area as well as the FFI parameter area.
79 ! It is safe for them to overlap, since basic blocks with FFI calls
80 ! will never spill -- indeed, basic blocks with FFI calls do not
81 ! use vregs at all, and the FFI call is a stack analysis sync point.
82 ! In the future this will change and the stack frame logic will
83 ! need to be untangled somewhat.
! Offset of parameter-area position n: n plus reserved-area-size.
85 : param@ ( n -- x ) reserved-area-size + ; inline
! The parameter save area is 8 cells.
87 : param-save-size ( -- n ) 8 cells ; foldable
90 reserved-area-size param-save-size + + ; inline
92 : spill@ ( n -- offset )
95 ! Some FP intrinsics need a temporary scratch area in the stack
96 ! frame, 8 bytes in size. This is in the param-save area so it
97 ! does not overlap with spill slots.
98 : scratch@ ( n -- offset )
! Frame offset of GC root n: n is first mapped through gc-root-offset and
! the result through local@.
102 : gc-root@ ( n -- offset )
103 gc-root-offset local@ ;
105 ! Finally we have the linkage area
! Offset of the link register save slot; dispatched on the os variable.
106 HOOK: lr-save os ( -- n )
108 M: ppc stack-frame-size ( stack-frame -- i )
! Call a word: BL is emitted with a 0 placeholder target and the word is
! passed to rel-word-pic with relocation class rc-relative-ppc-3.
115 M: ppc %call ( word -- ) 0 BL rc-relative-ppc-3 rel-word-pic ;
! Tail-jump to a word.
117 M: ppc %jump ( word -- )
! LOAD32 of placeholder 0 into register 6, with a rel-here relocation
! (argument 8, class rc-absolute-ppc-2/2).
! NOTE(review): presumably this gives the callee a code address in r6 --
! confirm against the rel-word-pic-tail consumer.
118 0 6 LOAD32 8 rc-absolute-ppc-2/2 rel-here
! B with a 0 placeholder target; the word is passed to rel-word-pic-tail.
119 0 B rc-relative-ppc-3 rel-word-pic-tail ;
! Branch to a label with B.
121 M: ppc %jump-label ( label -- ) B ;
! Return with BLR (branch to link register).
122 M: ppc %return ( -- ) BLR ;
124 M:: ppc %dispatch ( src temp -- )
126 4 cells rc-absolute-ppc-2/2 rel-here
131 :: (%slot) ( obj slot tag temp -- reg offset )
133 temp tag neg ; inline
! Address operands for a constant slot index: the base register is obj
! unchanged, and the offset is slot scaled to cells minus tag.
135 : (%slot-imm) ( obj slot tag -- reg offset )
136 [ cells ] dip - ; inline
! Slot reads use LWZ and slot writes use STW. The register-index forms
! take their address from (%slot), the constant-index forms from
! (%slot-imm).
138 M: ppc %slot ( dst obj slot tag temp -- ) (%slot) LWZ ;
139 M: ppc %slot-imm ( dst obj slot tag -- ) (%slot-imm) LWZ ;
140 M: ppc %set-slot ( src obj slot tag temp -- ) (%slot) STW ;
141 M: ppc %set-slot-imm ( src obj slot tag -- ) (%slot-imm) STW ;
143 M:: ppc %string-nth ( dst src index temp -- )
147 dst temp string-offset LBZ
150 temp src string-aux-offset LWZ
153 temp temp byte-array-offset LHZ
159 M:: ppc %set-string-nth-fast ( ch obj index temp -- )
161 ch temp string-offset STB ;
! Integer arithmetic: each method forwards its operands to a single
! assembler word.
164 M: ppc %add-imm ADDI ;
! The two source operands are exchanged before SUBF.
165 M: ppc %sub swap SUBF ;
166 M: ppc %sub-imm SUBI ;
168 M: ppc %mul-imm MULLI ;
170 M: ppc %and-imm ANDI ;
174 M: ppc %xor-imm XORI ;
! The two logical shifts exchange dst and src (swapd) before calling the
! assembler word; the arithmetic shift passes its operands unchanged.
176 M: ppc %shl-imm swapd SLWI ;
178 M: ppc %shr-imm swapd SRWI ;
180 M: ppc %sar-imm SRAWI ;
183 :: overflow-template ( label dst src1 src2 insn -- )
186 dst src2 src1 insn call
! Overflow-checked fixnum arithmetic. Each method hands overflow-template
! a quotation containing the assembler word to use (ADDO., SUBFO.,
! MULLWO.).
189 M: ppc %fixnum-add ( label dst src1 src2 -- )
190 [ ADDO. ] overflow-template ;
192 M: ppc %fixnum-sub ( label dst src1 src2 -- )
193 [ SUBFO. ] overflow-template ;
195 M: ppc %fixnum-mul ( label dst src1 src2 -- )
196 [ MULLWO. ] overflow-template ;
! Offset of cell n of a bignum from a tagged pointer: n cells minus the
! bignum tag number.
198 : bignum@ ( n -- offset ) cells bignum tag-number - ; inline
200 M:: ppc %integer>bignum ( dst src temp -- )
203 dst 0 >bignum %load-reference
204 ! Is it zero? Then just go to the end and return this zero
208 dst 4 cells bignum temp %allot
211 temp dst 1 bignum@ STW
214 temp temp cell-bits 1 - SRAWI
217 temp dst 2 bignum@ STW
218 ! Make negative value positive
224 temp dst 3 bignum@ STW
! Extract an integer from the bignum in src into dst, using temp.
! NOTE(review): the branch and arithmetic instructions between the loads
! below are not present in the lines visible here.
228 M:: ppc %bignum>integer ( dst src temp -- )
! temp = bignum cell 1
231 temp src 1 bignum@ LWZ
232 ! if the length is 1, it's just the sign and nothing else,
235 0 temp 1 tag-fixnum CMPI
! dst = bignum cell 3
238 dst src 3 bignum@ LWZ
! temp = bignum cell 2
240 temp src 2 bignum@ LWZ
241 ! branchless arithmetic: we want to turn 0 into 1,
246 ! multiply value by sign
! Float arithmetic: each method forwards its operands to the matching
! assembler word.
251 M: ppc %add-float FADD ;
252 M: ppc %sub-float FSUB ;
253 M: ppc %mul-float FMUL ;
254 M: ppc %div-float FDIV ;
! Integer to float conversion, built in the stack-frame scratch area.
! NOTE(review): in the lines visible here src is never read and dst is
! not loaded before the final FSUB -- confirm no instructions are missing.
256 M:: ppc %integer>float ( dst src -- )
! Word at scratch offset 0: HEX: 4330 in the upper halfword (LIS).
257 HEX: 4330 scratch-reg LIS
258 scratch-reg 1 0 scratch@ STW
! XORIS with HEX: 8000 flips the top bit of scratch-reg; the result is
! stored as the word at scratch offset 4.
260 scratch-reg dup HEX: 8000 XORIS
261 scratch-reg 1 4 scratch@ STW
! 4503601774854144.0 is 2^52 + 2^31; it is loaded into fp-scratch-reg
! and subtracted.
263 scratch-reg 4503601774854144.0 %load-reference
264 fp-scratch-reg scratch-reg float-offset LFD
265 dst dst fp-scratch-reg FSUB ;
! Float to integer conversion through the stack-frame scratch area.
267 M:: ppc %float>integer ( dst src -- )
! Convert src with FCTIWZ into the FP scratch register.
268 fp-scratch-reg src FCTIWZ
! Spill the 8-byte result to scratch offset 0 (relative to register 1).
269 fp-scratch-reg 1 0 scratch@ STFD
! Read back the word at scratch offset 4 as the integer result.
270 dst 1 4 scratch@ LWZ ;
272 M: ppc %copy ( dst src rep -- )
275 { double-float-rep [ FMR ] }
! Load the double stored at float-offset from the boxed float src.
278 M: ppc %unbox-float ( dst src -- ) float-offset LFD ;
! Box the float register src into a newly allotted float object in dst.
280 M:: ppc %box-float ( dst src temp -- )
! Allot 16 bytes of class float; temp is handed to %allot as its
! nursery-pointer register.
281 dst 16 float temp %allot
! Store the double at float-offset from the new object.
282 src dst float-offset STFD ;
! Load the i-th float parameter register (per float-regs param-regs) from
! a spill slot: LFD from register 1 plus the slot's spill@ offset.
284 : float-function-param ( i spill-slot -- )
285 [ float-regs param-regs nth 1 ] [ n>> spill@ ] bi* LFD ;
! Copy the float return register into reg with FMR, unless reg already
! is the float return register, in which case nothing is emitted.
287 : float-function-return ( reg -- )
288 float-regs return-reg 2dup = [ 2drop ] [ FMR ] if ;
290 M:: ppc %unary-float-function ( dst src func -- )
291 0 src float-function-param
293 dst float-function-return ;
295 M:: ppc %binary-float-function ( dst src1 src2 func -- )
296 0 src1 float-function-param
297 1 src2 float-function-param
299 dst float-function-return ;
301 M:: ppc %unbox-any-c-ptr ( dst src temp -- )
303 { "is-byte-array" "end" "start" } [ define-label ] each
304 ! Address is computed in dst
306 ! Load object into scratch-reg
308 ! We come back here with displaced aliens
309 "start" resolve-label
311 0 scratch-reg \ f tag-number CMPI
314 ! Is the object an alien?
315 0 scratch-reg header-offset LWZ
316 0 0 alien type-number tag-fixnum CMPI
317 "is-byte-array" get BNE
318 ! If so, load the offset
319 0 scratch-reg alien-offset LWZ
320 ! Add it to address being computed
322 ! Now recurse on the underlying alien
323 scratch-reg scratch-reg underlying-alien-offset LWZ
325 "is-byte-array" resolve-label
326 ! Add byte array address to address being computed
327 dst dst scratch-reg ADD
328 ! Add an offset to start of byte array's data area
329 dst dst byte-array-offset ADDI
! Offset of cell n of an alien from a tagged pointer: n cells minus the
! object tag number.
333 : alien@ ( n -- n' ) cells object tag-number - ;
! Allot a 4-cell alien object in dst and fill cells 1..3 from base, f and
! displacement. temp serves first as %allot's nursery-pointer register
! and then holds the f immediate.
335 :: %allot-alien ( dst displacement base temp -- )
336 dst 4 cells alien temp %allot
337 temp \ f tag-number %load-immediate
338 ! Store underlying-alien slot
339 base dst 1 alien@ STW
! Store f into cell 2
341 temp dst 2 alien@ STW
! Store displacement into cell 3
343 displacement dst 3 alien@ STW ;
345 M:: ppc %box-alien ( dst src temp -- )
348 dst \ f tag-number %load-immediate
351 dst src temp temp %allot-alien
! Build a displaced alien in dst from displacement and base, using
! displacement' and base' as working registers.
! NOTE(review): several branch and label lines of this definition are
! not present in the lines visible here.
355 M:: ppc %box-displaced-alien ( dst displacement base displacement' base' -- )
359 "simple-case" define-label
360 ! If displacement is zero, return the base
362 0 displacement 0 CMPI
364 ! Quickly use displacement' before it's needed for real, as allot temporary
365 displacement' :> temp
366 dst 4 cells alien temp %allot
367 ! If base is already a displaced alien, unpack it
368 0 base \ f tag-number CMPI
369 "simple-case" get BEQ
370 temp base header-offset LWZ
371 0 temp alien type-number tag-fixnum CMPI
372 "simple-case" get BNE
373 ! displacement += base.displacement
374 temp base 3 alien@ LWZ
375 displacement' displacement temp ADD
! base' = cell 1 of base (the underlying-alien slot)
377 base' base 1 alien@ LWZ
379 "simple-case" resolve-label
380 displacement' displacement MR
382 "alloc" resolve-label
383 ! Store underlying-alien slot
384 base' dst 1 alien@ STW
! Store displacement' into cell 3
386 displacement' dst 3 alien@ STW
387 ! Store expired slot (it's OK to clobber displacement')
388 temp \ f tag-number %load-immediate
389 temp dst 2 alien@ STW
! Raw memory reads: every load uses displacement 0 from the address
! register.
393 M: ppc %alien-unsigned-1 0 LBZ ;
394 M: ppc %alien-unsigned-2 0 LHZ ;
! Signed byte: LBZ into dst, then EXTSB on dst in place.
396 M: ppc %alien-signed-1 dupd 0 LBZ dup EXTSB ;
397 M: ppc %alien-signed-2 0 LHA ;
399 M: ppc %alien-cell 0 LWZ ;
401 M: ppc %alien-float 0 LFS ;
402 M: ppc %alien-double 0 LFD ;
! Raw memory writes: the two operands are swapped, then a store with
! displacement 0 is emitted.
404 M: ppc %set-alien-integer-1 swap 0 STB ;
405 M: ppc %set-alien-integer-2 swap 0 STH ;
407 M: ppc %set-alien-cell swap 0 STW ;
409 M: ppc %set-alien-float swap 0 STFS ;
410 M: ppc %set-alien-double swap 0 STFD ;
! Load the address of the "nursery" symbol into reg (dll argument f).
412 : load-zone-ptr ( reg -- )
413 "nursery" f %alien-global ;
! Load the nursery address into nursery-ptr, then load allot-ptr from the
! word at offset 4 from nursery-ptr.
415 : load-allot-ptr ( nursery-ptr allot-ptr -- )
416 [ drop load-zone-ptr ] [ swap 4 LWZ ] 2bi ;
! Advance the allocation pointer: scratch-reg = allot-ptr + n rounded up
! to a multiple of 8, stored back at offset 4 from nursery-ptr.
! allot-ptr itself is left unchanged.
418 :: inc-allot-ptr ( nursery-ptr allot-ptr n -- )
419 scratch-reg allot-ptr n 8 align ADDI
420 scratch-reg nursery-ptr 4 STW ;
! Write an object header: the class's type number, tagged as a fixnum, is
! loaded into scratch-reg and stored at offset 0 from dst.
422 :: store-header ( dst class -- )
423 class type-number tag-fixnum scratch-reg LI
424 scratch-reg dst 0 STW ;
! OR the tag number of tag into dst in place (ORI with dst as both
! destination and source).
426 : store-tagged ( dst tag -- )
427 dupd tag-number ORI ;
! Allot size bytes of the given class from the nursery, leaving a tagged
! pointer in dst. nursery-ptr is a working register.
429 M:: ppc %allot ( dst size class nursery-ptr -- )
! dst = current allocation pointer
430 nursery-ptr dst load-allot-ptr
! bump the stored allocation pointer past the new object
431 nursery-ptr dst size inc-allot-ptr
! the header is written while dst is still untagged
432 dst class store-header
433 dst class store-tagged ;
! Load the address of the "cards_offset" symbol into dst, then replace it
! with the word stored at that address.
435 : load-cards-offset ( dst -- )
436 [ "cards_offset" f %alien-global ] [ dup 0 LWZ ] bi ;

! Same as above for the "decks_offset" symbol.
438 : load-decks-offset ( dst -- )
439 [ "decks_offset" f %alien-global ] [ dup 0 LWZ ] bi ;
! Write barrier for the object in src; card# and table are working
! registers.
441 M:: ppc %write-barrier ( src card# table -- )
! scratch-reg = the card-mark value to store
442 card-mark scratch-reg LI
! Mark the card: card# = src shifted right by card-bits, then STBX with
! table and card# as the address pair.
445 table load-cards-offset
446 src card# card-bits SRWI
447 table scratch-reg card# STBX
! Mark the deck the same way, using decks_offset and deck-bits.
450 table load-decks-offset
451 src card# deck-bits SRWI
452 table scratch-reg card# STBX ;
454 M:: ppc %check-nursery ( label temp1 temp2 -- )
457 temp2 temp2 3 cells LWZ
458 ! add ALLOT_BUFFER_ZONE to here
459 temp1 temp1 1024 ADDI
! Store register into its GC root slot at gc-root@ from register 1.
464 M:: ppc %save-gc-root ( gc-root register -- )
465 register 1 gc-root gc-root@ STW ;

! Reload register from its GC root slot at gc-root@ from register 1.
467 M:: ppc %load-gc-root ( gc-root register -- )
468 register 1 gc-root gc-root@ LWZ ;
! Call the "inline_gc" function.
! NOTE(review): gc-root-count is not referenced in the lines visible
! here -- confirm how it is passed.
470 M:: ppc %call-gc ( gc-root-count -- )
471 %prepare-alien-invoke
! register 3 = register 1 + the local@ offset of gc-root-base
472 3 1 gc-root-base local@ ADDI
474 "inline_gc" f %alien-invoke ;
476 M: ppc %prologue ( n -- )
477 0 11 LOAD32 rc-absolute-ppc-2/2 rel-this
480 [ [ 1 1 ] dip neg ADDI ]
481 [ [ 11 1 ] dip xt-save STW ]
483 [ [ 11 1 ] dip next-save STW ]
484 [ [ 0 1 ] dip lr-save + STW ]
487 M: ppc %epilogue ( n -- )
488 #! At the end of each word that calls a subroutine, we store
489 #! the previous link register value in r0 by popping it off
490 #! the stack, set the link register to the contents of r0,
491 #! and jump to the link register.
! r0 = word at offset n + lr-save from register 1
492 [ [ 0 1 ] dip lr-save + LWZ ]
! register 1 = register 1 + n
493 [ [ 1 1 ] dip ADDI ] bi
! Materialize a boolean in dst after a comparison. word is a branch
! assembler word: if its branch is taken, dst keeps f; otherwise
! execution falls through and dst is overwritten with t.
! NOTE(review): temp is not used in the visible lines, and the
! definition of the "end" label is not visible here.
496 :: (%boolean) ( dst temp word -- )
498 dst \ f tag-number %load-immediate
499 "end" get word execute
500 dst \ t %load-reference
501 "end" get resolve-label ; inline
! Select the branch word for (%boolean). The condition code is negated
! first, because (%boolean) leaves f in dst when the branch is taken.
503 :: %boolean ( dst temp cc -- )
504 cc negate-cc order-cc {
505 { cc< [ dst temp \ BLT (%boolean) ] }
506 { cc<= [ dst temp \ BLE (%boolean) ] }
507 { cc> [ dst temp \ BGT (%boolean) ] }
508 { cc>= [ dst temp \ BGE (%boolean) ] }
509 { cc= [ dst temp \ BEQ (%boolean) ] }
510 { cc/= [ dst temp \ BNE (%boolean) ] }
! Comparison emitters. Each inserts a literal 0 among the operands before
! calling the assembler word: beneath src2 for CMP and FCMPU, beneath
! both operands for CMPI.
! NOTE(review): presumably the 0 selects the condition register field;
! the differing position follows each word's operand order -- confirm
! against the assembler.
513 : (%compare) ( src1 src2 -- ) [ 0 ] dip CMP ; inline
514 : (%compare-imm) ( src1 src2 -- ) [ 0 ] 2dip CMPI ; inline
515 : (%compare-float) ( src1 src2 -- ) [ 0 ] dip FCMPU ; inline
! Compare, then materialize the outcome as a boolean via %boolean.
517 M: ppc %compare (%compare) %boolean ;
518 M: ppc %compare-imm (%compare-imm) %boolean ;
519 M: ppc %compare-float (%compare-float) %boolean ;
521 :: %branch ( label cc -- )
523 { cc< [ label BLT ] }
524 { cc<= [ label BLE ] }
525 { cc> [ label BGT ] }
526 { cc>= [ label BGE ] }
527 { cc= [ label BEQ ] }
528 { cc/= [ label BNE ] }
! Compare, then branch on the outcome via %branch.
531 M: ppc %compare-branch (%compare) %branch ;
532 M: ppc %compare-imm-branch (%compare-imm) %branch ;
533 M: ppc %compare-float-branch (%compare-float) %branch ;
535 : load-from-frame ( dst n rep -- )
537 { int-rep [ [ 1 ] dip LWZ ] }
538 { single-float-rep [ [ 1 ] dip LFS ] }
539 { double-float-rep [ [ 1 ] dip LFD ] }
540 { stack-params [ [ 0 1 ] dip LWZ [ 0 1 ] dip param@ STW ] }
! param@ offset of n plus the current stack frame's total-size.
543 : next-param@ ( n -- x ) param@ stack-frame get total-size>> + ;
545 : store-to-frame ( src n rep -- )
547 { int-rep [ [ 1 ] dip STW ] }
548 { single-float-rep [ [ 1 ] dip STFS ] }
549 { double-float-rep [ [ 1 ] dip STFD ] }
550 { stack-params [ [ [ 0 1 ] dip next-param@ LWZ 0 1 ] dip STW ] }
! Spill src to spill slot n: n is converted to a frame offset with
! spill@, then stored per rep by store-to-frame.
553 M: ppc %spill ( src n rep -- )
554 [ spill@ ] dip store-to-frame ;

! Reload dst from spill slot n: n is converted to a frame offset with
! spill@, then loaded per rep by load-from-frame.
556 M: ppc %reload ( dst n rep -- )
557 [ spill@ ] dip load-from-frame ;
! Integer values are returned in register 3.
561 M: int-regs return-reg drop 3 ;
! Integer parameters are passed in registers 3 through 10.
562 M: int-regs param-regs drop { 3 4 5 6 7 8 9 10 } ;
! Float values are returned in float register 1.
563 M: float-regs return-reg drop 1 ;
! Store reg into the frame at the local@ offset of stack, per rep.
565 M:: ppc %save-param-reg ( stack reg rep -- )
566 reg stack local@ rep store-to-frame ;

! Load reg from the frame at the local@ offset of stack, per rep.
568 M:: ppc %load-param-reg ( stack reg rep -- )
569 reg stack local@ rep load-from-frame ;
571 M: ppc %prepare-unbox ( -- )
572 ! First parameter is top of stack
574 ds-reg dup cell SUBI ;
576 M: ppc %unbox ( n rep func -- )
577 ! Value must be in r3
580 ! Store the return value on the C stack
581 over [ [ reg-class-of return-reg ] keep %save-param-reg ] [ 2drop ] if ;
583 M: ppc %unbox-long-long ( n func -- )
584 ! Value must be in r3:r4
587 ! Store the return value on the C stack
589 [ [ 3 1 ] dip local@ STW ]
590 [ [ 4 1 ] dip cell + local@ STW ] bi
593 M: ppc %unbox-large-struct ( n c-type -- )
594 ! Value must be in r3
595 ! Compute destination address and load struct size
596 [ [ 4 1 ] dip local@ ADDI ] [ heap-size 5 LI ] bi*
598 "to_value_struct" f %alien-invoke ;
600 M: ppc %box ( n rep func -- )
601 ! If the source is a stack location, load it into freg #0.
602 ! If the source is f, then we assume the value is already in
604 [ over [ 0 over reg-class-of param-reg swap %load-param-reg ] [ 2drop ] if ] dip
607 M: ppc %box-long-long ( n func -- )
610 [ [ 3 1 ] dip local@ LWZ ]
611 [ [ 4 1 ] dip cell + local@ LWZ ] bi
613 ] dip f %alien-invoke ;
! Frame offset for a struct return area: local@ of n, or, when n is f,
! local@ of the current stack frame's params slot.
615 : struct-return@ ( n -- n )
616 [ stack-frame get params>> ] unless* local@ ;
618 M: ppc %prepare-box-struct ( -- )
619 #! Compute target address for value struct return
620 3 1 f struct-return@ ADDI
623 M: ppc %box-large-struct ( n c-type -- )
624 ! If n = f, then we're boxing a returned struct
625 ! Compute destination address and load struct size
626 [ [ 3 1 ] dip struct-return@ ADDI ] [ heap-size 4 LI ] bi*
628 "box_value_struct" f %alien-invoke ;
630 M: ppc %prepare-alien-invoke
631 #! Save Factor stack pointers in case the C code calls a
632 #! callback which does a GC, which must reliably trace
! scratch-reg = address of the "stack_chain" symbol, then the word
! stored at that address.
634 scratch-reg "stack_chain" f %alien-global
635 scratch-reg scratch-reg 0 LWZ
! Store the data and retain stack pointer registers at offsets 8 and 12
! from scratch-reg.
637 ds-reg scratch-reg 8 STW
638 rs-reg scratch-reg 12 STW ;
! Call a C function: its address is loaded into register 11 with
! %alien-global, moved to the link register (MTLR), and called with BLRL.
640 M: ppc %alien-invoke ( symbol dll -- )
641 [ 11 ] 2dip %alien-global 11 MTLR BLRL ;
! Load a reference to quot into register 3 and call "c_to_factor".
643 M: ppc %alien-callback ( quot -- )
644 3 swap %load-reference "c_to_factor" f %alien-invoke ;
646 M: ppc %prepare-alien-indirect ( -- )
647 "unbox_alien" f %alien-invoke
650 M: ppc %alien-indirect ( -- )
653 M: ppc %callback-value ( ctype -- )
654 ! Save top of data stack
657 ! Restore data/call/retain stacks
658 "unnest_stacks" f %alien-invoke
659 ! Restore top of data stack
661 ! Unbox former top of data stack to return registers
! True when n lies in -32768..32767 inclusive, the signed 16-bit range.
664 M: ppc small-enough? ( n -- ? ) -32768 32767 between? ;
! Answers the return-in-registers? slot of the resolved C type.
666 M: ppc return-struct-in-registers? ( c-type -- ? )
667 c-type return-in-registers?>> ;
669 M: ppc %box-small-struct ( c-type -- )
670 #! Box a <= 16-byte struct returned in r3:r4:r5:r6
672 "box_medium_struct" f %alien-invoke ;
674 : %unbox-struct-1 ( -- )
675 ! Alien must be in r3.
676 "alien_offset" f %alien-invoke
679 : %unbox-struct-2 ( -- )
680 ! Alien must be in r3.
681 "alien_offset" f %alien-invoke
685 : %unbox-struct-4 ( -- )
686 ! Alien must be in r3.
687 "alien_offset" f %alien-invoke
693 M: ppc %unbox-small-struct ( size -- )
694 #! Alien must be in r3.
! Dispatch on the struct size in cells: heap-size rounded up to a whole
! number of cells, divided by the cell size.
695 heap-size cell align cell /i {
696 { 1 [ %unbox-struct-1 ] }
697 { 2 [ %unbox-struct-2 ] }
698 { 4 [ %unbox-struct-4 ] }
701 enable-float-functions
706 { [ os macosx? ] [ "cpu.ppc.macosx" require ] }
707 { [ os linux? ] [ "cpu.ppc.linux" require ] }
710 "complex-double" c-type t >>return-in-registers? drop
714 [ alien-unsigned-4 c-bool> ] >>getter
715 [ [ >c-bool ] 2dip set-alien-unsigned-4 ] >>setter
718 "box_boolean" >>boxer
719 "to_boolean" >>unboxer
720 "bool" define-primitive-type
721 ] with-compilation-unit