! Copyright (C) 2011 Erik Charlebois
! See https://factorcode.org/license.txt for BSD license.
USING: accessors alien alien.accessors alien.c-types alien.complex
alien.data alien.libraries assocs byte-arrays classes.algebra
classes.struct combinators compiler.cfg
compiler.cfg.build-stack-frame compiler.cfg.comparisons
compiler.cfg.instructions compiler.cfg.intrinsics
compiler.cfg.registers compiler.cfg.stack-frame compiler.codegen
compiler.codegen.fixup compiler.constants compiler.units
cpu.architecture cpu.ppc.assembler fry io kernel layouts literals
locals make math math.order ranges memory namespaces prettyprint
sequences system vm words ;
QUALIFIED-WITH: alien.c-types c
FROM: cpu.ppc.assembler => B ;
FROM: math => float ;
IN: cpu.ppc

! PowerPC register assignments:
! r0: reserved for function prolog/epilogues
! r1: call stack register
! r2: toc register / system reserved
! r3-r12: integer vregs
! r13: reserved by OS
! r14: data stack
! r15: retain stack
! r16: VM pointer
! r17-r29: integer vregs
! r30: integer scratch
! r31: frame register
! f0-f29: float vregs
! f30: float scratch
! f31: ?

! ABI parameters that dispatch on the os variable. No methods for
! these hooks appear in this part of the file.
HOOK: lr-save os ( -- n )
HOOK: has-toc os ( -- ? )
HOOK: reserved-area-size os ( -- n )
HOOK: allows-null-dereference os ( -- ? )

! Branch instructions applied to a label: emit the instruction with 0
! in place of the target, then register a label fixup with the
! relocation class listed for that instruction.
M: label B [ 0 B ] dip rc-relative-ppc-3-pc label-fixup ;
M: label BL [ 0 BL ] dip rc-relative-ppc-3-pc label-fixup ;
M: label BC [ 0 BC ] dip rc-relative-ppc-2-pc label-fixup ;

! Fixed register numbers; they mirror the assignment table above.
! The integer and float scratch registers share the number 30.
CONSTANT: scratch-reg 30
CONSTANT: fp-scratch-reg 30
CONSTANT: ds-reg 14
CONSTANT: rs-reg 15
CONSTANT: vm-reg 16

! Registers offered to the register allocator: r3-r12 and r17-r29 for
! integers, f0-f29 for floats. The $[ ... ] forms are evaluated at
! parse time.
M: ppc machine-registers
    {
        { int-regs $[ 3 12 [a..b] 17 29 [a..b] append ] }
        { float-regs $[ 0 29 [a..b] ] }
    } ;

! r31 is the frame register.
M: ppc frame-reg 31 ;

! Per-word-size value of vm-stack-space (16 on ppc.32, 32 on ppc.64).
M: ppc.32 vm-stack-space 16 ;
M: ppc.64 vm-stack-space 32 ;

M: ppc complex-addressing? f ;

! PW1-PW8 parameter save slots
: param-save-size ( -- n ) 8 cells ; foldable
! here be spill slots
! 
xt, size
: factor-area-size ( -- n ) 2 cells ; foldable

! Frame offset of spill slot n: its spill-offset plus the reserved
! area and the parameter save area.
: spill@ ( n -- offset )
    spill-offset reserved-area-size + param-save-size + ;

! Frame offset of parameter offset n: n plus the reserved area.
: param@ ( n -- offset )
    reserved-area-size + ;

! GC root index of a spill slot: its spill@ byte offset divided by the
! cell size.
M: ppc gc-root-offset
    n>> spill@ cell /i ;

! Load a 32-bit constant n into register r in two instructions:
! LIS receives bits 16-31 of n, then ORI ors bits 0-15 into r.
: LOAD32 ( r n -- )
    [ -16 shift 0xffff bitand LIS ]
    [ dupd 0xffff bitand ORI ] 2bi ;

! Load a 64-bit constant n into register r in five instructions.
! dupd supplies ( r r n ) to every step so that r is both destination
! and source of the or/shift instructions:
!   LIS  with bits 48-63 of n
!   ORI  with bits 32-47 of n
!   SLDI by 32
!   ORIS with bits 16-31 of n
!   ORI  with bits 0-15 of n
: LOAD64 ( r n -- )
    dupd {
        [ nip -48 shift 0xffff bitand LIS ]
        [ -32 shift 0xffff bitand ORI ]
        [ drop 32 SLDI ]
        [ -16 shift 0xffff bitand ORIS ]
        [ 0xffff bitand ORI ]
    } 3cleave ;

! The hooks below dispatch on the cpu variable and select the word
! (ppc.32) or doubleword (ppc.64) form of an instruction.

! Clear the low tag-bits bits of src into dst.
HOOK: %clear-tag-bits cpu ( dst src -- )
M: ppc.32 %clear-tag-bits tag-bits get CLRRWI ;
M: ppc.64 %clear-tag-bits tag-bits get CLRRDI ;

! Cell-sized store with an immediate offset.
HOOK: %store-cell cpu ( dst src offset -- )
M: ppc.32 %store-cell STW ;
M: ppc.64 %store-cell STD ;

! Cell-sized store, indexed form.
HOOK: %store-cell-x cpu ( dst src offset -- )
M: ppc.32 %store-cell-x STWX ;
M: ppc.64 %store-cell-x STDX ;

! Cell-sized store, update form.
HOOK: %store-cell-update cpu ( dst src offset -- )
M: ppc.32 %store-cell-update STWU ;
M: ppc.64 %store-cell-update STDU ;

! Cell-sized load with an immediate offset.
HOOK: %load-cell cpu ( dst src offset -- )
M: ppc.32 %load-cell LWZ ;
M: ppc.64 %load-cell LD ;

! When allows-null-dereference is true, emit a trap-if-equal of src
! against 0; otherwise emit nothing.
HOOK: %trap-null cpu ( src -- )
M: ppc.32 %trap-null
    allows-null-dereference [ 0 TWEQI ] [ drop ] if ;
M: ppc.64 %trap-null
    allows-null-dereference [ 0 TDEQI ] [ drop ] if ;

! Cell-sized load, indexed form.
HOOK: %load-cell-x cpu ( dst src offset -- )
M: ppc.32 %load-cell-x LWZX ;
M: ppc.64 %load-cell-x LDX ;

! Load a full cell-sized immediate using the fixed-length LOAD32 /
! LOAD64 sequence.
HOOK: %load-cell-imm cpu ( dst imm -- )
M: ppc.32 %load-cell-imm LOAD32 ;
M: ppc.64 %load-cell-imm LOAD64 ;

! Cell-sized register/register compare.
HOOK: %compare-cell cpu ( cr lhs rhs -- )
M: ppc.32 %compare-cell CMPW ;
M: ppc.64 %compare-cell CMPD ;

! Cell-sized register/immediate compare.
HOOK: %compare-cell-imm cpu ( cr lhs imm -- )
M: ppc.32 %compare-cell-imm CMPWI ;
M: ppc.64 %compare-cell-imm CMPDI ;

! Relocation class paired with the %load-cell-imm sequence of the
! same word size.
HOOK: %load-cell-imm-rc cpu ( -- rel-class )
M: ppc.32 %load-cell-imm-rc rc-absolute-ppc-2/2 ;
M: ppc.64 %load-cell-imm-rc rc-absolute-ppc-2/2/2/2 ;

! Values in the range -0x8000..0x7fff are loaded with a single LI;
! anything else uses the full-width load sequence.
M: ppc.32 %load-immediate
    dup -0x8000 0x7fff between? [ LI ] [ LOAD32 ] if ;

M: ppc.64 %load-immediate
    dup -0x8000 0x7fff between?
[ LI ] [ LOAD64 ] if ;

! Load an object reference into a register. For a non-f object, emit
! a cell-sized immediate load of 0 and register the object as a
! literal using the relocation class that matches that load sequence.
! For f, load the type number of f with a single LI.
M: ppc %load-reference
    [ [ 0 %load-cell-imm ] [ %load-cell-imm-rc rel-literal ] bi* ]
    [ \ f type-number LI ]
    if* ;

! The three literal loads below share one shape: a zero cell-sized
! immediate is loaded into scratch-reg, val is registered through
! rel-binary-literal with the matching relocation class, and dst is
! then loaded through scratch-reg.
M:: ppc %load-float ( dst val -- )
    scratch-reg 0 %load-cell-imm val %load-cell-imm-rc rel-binary-literal
    dst scratch-reg 0 LFS ;

M:: ppc %load-double ( dst val -- )
    scratch-reg 0 %load-cell-imm val %load-cell-imm-rc rel-binary-literal
    dst scratch-reg 0 LFD ;

! The rep input is not used.
M:: ppc %load-vector ( dst val rep -- )
    scratch-reg 0 %load-cell-imm val %load-cell-imm-rc rel-binary-literal
    dst 0 scratch-reg LVX ;

! Map a stack location to the register holding that stack's pointer:
! ds-reg for data stack locations, rs-reg for retain stack locations.
GENERIC: loc-reg ( loc -- reg )
M: ds-loc loc-reg drop ds-reg ;
M: rs-loc loc-reg drop rs-reg ;

! Load value at stack location loc into vreg.
! The offset from the stack pointer is minus n cells.
M: ppc %peek
    [ loc-reg ] [ n>> cells neg ] bi %load-cell ;

! Replace value at stack location loc with value in vreg.
M: ppc %replace
    [ loc-reg ] [ n>> cells neg ] bi %store-cell ;

! Replace value at stack location with an immediate value.
! src is materialized in scratch-reg and then stored:
!   f          -> LI of the type number of f
!   fixnum     -> LI of the tagged fixnum
!   otherwise  -> a relocated literal. This branch emits the full
!                 cell-sized immediate load and registers the literal
!                 with %load-cell-imm-rc, the same pairing that
!                 %load-reference uses, so the relocation class
!                 describes the instructions that were emitted.
M:: ppc %replace-imm ( src loc -- )
    loc loc-reg :> reg
    loc n>> cells neg :> offset
    src {
        { [ dup not ] [ drop scratch-reg \ f type-number LI ] }
        { [ dup fixnum? ] [ [ scratch-reg ] dip tag-fixnum LI ] }
        [ scratch-reg 0 %load-cell-imm %load-cell-imm-rc rel-literal ]
    } cond
    scratch-reg reg offset %store-cell ;

! Overwrite a stack location with the tagged fixnum 297.
M: ppc %clear
    297 swap %replace-imm ;

! Increment stack pointer by n cells.
M: ppc %inc
    [ ds-loc?
[ ds-reg ds-reg ] [ rs-reg rs-reg ] if ] [ n>> ] bi cells ADDI ;

! Total frame size: the generic (stack-frame-size) plus the reserved
! area, the parameter save area and the factor area, rounded up to a
! multiple of 16.
M: ppc stack-frame-size
    (stack-frame-size)
    reserved-area-size +
    param-save-size +
    factor-area-size +
    16 align ;

! Call a word: BL with a zero displacement, relocated through
! rel-word-pic.
M: ppc %call
    0 BL rc-relative-ppc-3-pc rel-word-pic ;

! Byte length of n instructions (4 bytes each).
: instrs ( n -- b ) 4 * ; inline

! Tail-jump to a word: r6 receives a relocated rel-here value with
! offset 1 instrs, followed by a B with a zero displacement relocated
! through rel-word-pic-tail.
M: ppc %jump
    6 0 %load-cell-imm 1 instrs %load-cell-imm-rc rel-here
    0 B rc-relative-ppc-3-pc rel-word-pic-tail ;

! Jump-table dispatch. With the two inputs called x y in stack order:
! y receives a relocated rel-here value with offset 3 instrs, y is
! then reloaded from the cell at y indexed by x, moved to CTR, and
! BCTR branches to it.
M: ppc %dispatch
    [ nip 0 %load-cell-imm 3 instrs %load-cell-imm-rc rel-here ]
    [ swap dupd %load-cell-x ]
    [ nip MTCTR ] 2tri BCTR ;

! Indexed slot load. The top two inputs must both be 0 (assert=
! fails otherwise); the remaining inputs go to %load-cell-x.
M: ppc %slot
    [ 0 assert= ] bi@ %load-cell-x ;

! Slot load with a constant slot: slot-offset is put in scratch-reg
! with LI and used as the index register.
M: ppc %slot-imm
    slot-offset scratch-reg swap LI
    scratch-reg %load-cell-x ;

! Indexed slot store; same operand checks as %slot.
M: ppc %set-slot
    [ 0 assert= ] bi@ %store-cell-x ;

! Slot store with a constant slot, through scratch-reg.
M: ppc %set-slot-imm
    slot-offset [ scratch-reg ] dip LI scratch-reg %store-cell-x ;

! One-instruction operations. Where the instruction differs by word
! size, the ppc.32 method uses the word form and the ppc.64 method
! the doubleword form.
M: ppc %jump-label B ;
M: ppc %return BLR ;
M: ppc %add ADD ;
M: ppc %add-imm ADDI ;
M: ppc %sub SUB ;
M: ppc %sub-imm SUBI ;
M: ppc.32 %mul MULLW ;
M: ppc.64 %mul MULLD ;
M: ppc %mul-imm MULLI ;
M: ppc %and AND ;
M: ppc %and-imm ANDI. ;
M: ppc %or OR ;
M: ppc %or-imm ORI ;
M: ppc %xor XOR ;
M: ppc %xor-imm XORI ;
M: ppc.32 %shl SLW ;
M: ppc.64 %shl SLD ;
M: ppc.32 %shl-imm SLWI ;
M: ppc.64 %shl-imm SLDI ;
M: ppc.32 %shr SRW ;
M: ppc.64 %shr SRD ;
M: ppc.32 %shr-imm SRWI ;
M: ppc.64 %shr-imm SRDI ;
M: ppc.32 %sar SRAW ;
M: ppc.64 %sar SRAD ;
M: ppc.32 %sar-imm SRAWI ;
M: ppc.64 %sar-imm SRADI ;

! Integer min/max: a compare followed by ISEL; %max passes the two
! sources to ISEL in swapped order.
! NOTE(review): here CMPW/CMPD receive the two top inputs followed by
! the literal 0, whereas %compare-cell feeds the same instructions
! ( cr lhs rhs ). Confirm the operand order of the compare.
M: ppc.32 %min [ 0 CMPW ] [ 0 ISEL ] 2bi ;
M: ppc.64 %min [ 0 CMPD ] [ 0 ISEL ] 2bi ;
M: ppc.32 %max [ 0 CMPW ] [ swap 0 ISEL ] 2bi ;
M: ppc.64 %max [ 0 CMPD ] [ swap 0 ISEL ] 2bi ;
M: ppc %not NOT ;
M: ppc %neg NEG ;

! log2 as three instructions on the first input register: count
! leading zeros of the second input, negate, then add 31 (ppc.32) or
! 63 (ppc.64).
M: ppc.32 %log2 [ CNTLZW ] [ drop dup NEG ] [ drop dup 31 ADDI ] 2tri ;
M: ppc.64 %log2 [ CNTLZD ] [ drop dup NEG ] [ drop dup 63 ADDI ] 2tri ;
M: ppc.32 %bit-count POPCNTW ;
M: ppc.64 %bit-count POPCNTD ;

! Register-to-register copy chosen by representation. Nothing is
! emitted when the two register operands are the same object (eq?).
M: ppc %copy
    2over eq?
[ 3drop ] [
    {
        { tagged-rep [ MR ] }
        { int-rep [ MR ] }
        { float-rep [ FMR ] }
        { double-rep [ FMR ] }
        { vector-rep [ dup VOR ] }
        { scalar-rep [ dup VOR ] }
    } case
] if ;

! Shared shape of the overflow-checking fixnum operations:
!   1. load 0 into scratch-reg and move it to XER
!   2. run insn on ( dst src2 src1 )
!   3. branch to label with BSO when cc is cc-o, or with BNS when cc
!      is cc/o
:: overflow-template ( label dst src1 src2 cc insn -- )
    scratch-reg 0 LI
    scratch-reg MTXER
    dst src2 src1 insn call
    cc {
        { cc-o [ 0 label BSO ] }
        { cc/o [ 0 label BNS ] }
    } case ; inline

M: ppc %fixnum-add [ ADDO. ] overflow-template ;
M: ppc %fixnum-sub [ SUBFO. ] overflow-template ;
M: ppc.32 %fixnum-mul [ MULLWO. ] overflow-template ;
M: ppc.64 %fixnum-mul [ MULLDO. ] overflow-template ;

M: ppc %add-float FADD ;
M: ppc %sub-float FSUB ;
M: ppc %mul-float FMUL ;
M: ppc %div-float FDIV ;

! Float min/max: FSUB of the two sources into register 30
! (scratch-reg, the same number as fp-scratch-reg), then FSEL on
! that difference.
! NOTE(review): %min-float and %max-float emit the identical
! sequence, so they cannot both select the intended operand. Confirm
! the FSEL operand order and swap the sources in one of them.
M: ppc %min-float
    2dup [ scratch-reg ] 2dip FSUB
    [ scratch-reg ] 2dip FSEL ;

M: ppc %max-float
    2dup [ scratch-reg ] 2dip FSUB
    [ scratch-reg ] 2dip FSEL ;

M: ppc %sqrt FSQRT ;
M: ppc %single>double-float FMR ;
M: ppc %double>single-float FRSP ;

! The integer/float conversions below go through memory at
! r1 + scratch@, so they require a stack frame.
M: ppc integer-float-needs-stack-frame? t ;

! Frame offset of scratch byte n: n plus the reserved area.
: scratch@ ( n -- offset )
    reserved-area-size + ;

M:: ppc.32 %integer>float ( dst src -- )
    ! Sign extend to a doubleword and store.
    scratch-reg src 31 %sar-imm
    scratch-reg 1 0 scratch@ STW
    src 1 4 scratch@ STW
    ! Load back doubleword into FPR and convert from integer.
    dst 1 0 scratch@ LFD
    dst dst FCFID ;

! Store src as a doubleword, load it back into dst as a float
! register, and convert in place with FCFID.
M:: ppc.64 %integer>float ( dst src -- )
    src 1 0 scratch@ STD
    dst 1 0 scratch@ LFD
    dst dst FCFID ;

! FRIZ then FCTIWZ in fp-scratch-reg, store the result as a
! doubleword, and load the word at scratch offset 4 into dst.
M:: ppc.32 %float>integer ( dst src -- )
    fp-scratch-reg src FRIZ
    fp-scratch-reg fp-scratch-reg FCTIWZ
    fp-scratch-reg 1 0 scratch@ STFD
    dst 1 4 scratch@ LWZ ;

! FRIZ then FCTID in fp-scratch-reg, store the result as a
! doubleword, and load the whole doubleword into dst.
M:: ppc.64 %float>integer ( dst src -- )
    fp-scratch-reg src FRIZ
    fp-scratch-reg fp-scratch-reg FCTID
    fp-scratch-reg 1 0 scratch@ STFD
    dst 1 0 scratch@ LD ;

! Scratch registers by register class.
: scratch-regs ( -- regs )
    {
        { int-regs { 30 } }
        { float-regs { 30 } }
    } ;

! Return values of this class go here
M: ppc return-regs
    {
        { int-regs { 3 4 5 6 } }
        { float-regs { 1 2 3 4 } }
    } ;

! Is this structure small enough to be returned in registers?
M: ppc return-struct-in-registers?
lookup-c-type return-in-registers?>> ;

! If t, the struct return pointer is never passed in a param reg
M: ppc struct-return-on-stack? f ;

! Move a value into physical register reg. An integer src is copied
! with %copy as int-rep; a spill-slot src is loaded from r1 at the
! slot's spill@ offset.
GENERIC: load-param ( reg src -- )
M: integer load-param int-rep %copy ;
M: spill-slot load-param [ 1 ] dip n>> spill@ %load-cell ;

! Move physical register reg into dst. An integer dst is the target
! of a %copy as int-rep; a spill-slot dst is stored to r1 at the
! slot's spill@ offset.
GENERIC: store-param ( reg dst -- )
M: integer store-param swap int-rep %copy ;
M: spill-slot store-param [ 1 ] dip n>> spill@ %store-cell ;

! Call the unboxing function func with src in r3 and the VM pointer
! in r4, then move r3 into dst. No dll and no gc-map are passed; the
! rep input is not used.
M:: ppc %unbox ( dst src func rep -- )
    3 src load-param
    4 vm-reg MR
    func f f %c-invoke
    3 dst store-param ;

! As %unbox, but the result is taken from r3 (dst1) and r4 (dst2).
M:: ppc %unbox-long-long ( dst1 dst2 src func -- )
    3 src load-param
    4 vm-reg MR
    func f f %c-invoke
    3 dst1 store-param
    4 dst2 store-param ;

! dst = r1 + local-allot-offset of offset + reserved area size.
! The size and align inputs are not used.
M:: ppc %local-allot ( dst size align offset -- )
    dst 1 offset local-allot-offset reserved-area-size + ADDI ;

! The n-th cdecl parameter register of the register class of rep.
: param-reg ( n rep -- reg )
    reg-class-of cdecl param-regs at nth ;

! Call the boxing function func with src in r3 and the VM pointer in
! r4, recording gc-map at the call, then move r3 into dst. The rep
! input is not used.
M:: ppc %box ( dst src func rep gc-map -- )
    3 src load-param
    4 vm-reg MR
    func f gc-map %c-invoke
    3 dst store-param ;

! As %box, with the value passed in r3 and r4 and the VM pointer in
! r5.
M:: ppc %box-long-long ( dst src1 src2 func gc-map -- )
    3 src1 load-param
    4 src2 load-param
    5 vm-reg MR
    func f gc-map %c-invoke
    3 dst store-param ;

! Fetch the context into temp1 with %context, then store r1, ds-reg
! and rs-reg into its callstack-top, datastack and retainstack
! fields. temp2 is not used.
M:: ppc %save-context ( temp1 temp2 -- )
    temp1 %context
    1 temp1 "callstack-top" context offset-of %store-cell
    ds-reg temp1 "datastack" context offset-of %store-cell
    rs-reg temp1 "retainstack" context offset-of %store-cell ;

! Call the C symbol name from dll: r11 receives a cell-sized
! immediate relocated through rel-dlsym; when has-toc is true, r2
! receives one relocated through rel-dlsym-toc. r11 is moved to CTR,
! BCTRL performs the call, and gc-map is recorded with gc-map-here.
M:: ppc %c-invoke ( name dll gc-map -- )
    11 0 %load-cell-imm name dll %load-cell-imm-rc rel-dlsym
    has-toc [
        2 0 %load-cell-imm name dll %load-cell-imm-rc rel-dlsym-toc
    ] when
    11 MTCTR
    BCTRL
    gc-map gc-map-here ;

! First return register of the register class of rep.
: return-reg ( rep -- reg )
    reg-class-of return-regs at first ;

! Scratch register of the register class of rep.
: scratch-reg-class ( rep -- reg )
    reg-class-of scratch-regs at first ;

! Pass vreg as an outgoing stack parameter: reload it into the
! scratch register of its class, then store that register at
! r1 + param@ of n with the store instruction for rep. The vector
! and scalar cases put the offset in scratch-reg and use the indexed
! STVX.
:: store-stack-param ( vreg rep n -- )
    rep scratch-reg-class rep vreg %reload
    rep scratch-reg-class n param@ rep {
        { int-rep [ [ 1 ] dip %store-cell ] }
        { tagged-rep [ [ 1 ] dip %store-cell ] }
        { float-rep [ [ 1 ] dip STFS ] }
        { double-rep [ [ 1 ] dip STFD ] }
        { vector-rep [ scratch-reg swap LI 1 scratch-reg STVX ] }
        {
scalar-rep [ scratch-reg swap LI 1 scratch-reg STVX ] } } case ;

! Pass vreg in physical register reg: reload it into reg.
:: store-reg-param ( vreg rep reg -- )
    reg rep vreg %reload ;

! A dead output needs no code; both inputs are dropped.
: discard-reg-param ( rep reg -- )
    2drop ;

! Receive physical register reg into vreg: spill reg to vreg.
:: load-reg-param ( vreg rep reg -- )
    reg rep vreg %spill ;

! Receive an incoming stack parameter into vreg: load it from
! frame-reg + param@ of n into the scratch register of its class
! with the load instruction for rep, then spill that register to
! vreg. The vector and scalar cases put the offset in scratch-reg
! and use the indexed LVX.
:: load-stack-param ( vreg rep n -- )
    rep scratch-reg-class n param@ rep {
        { int-rep [ [ frame-reg ] dip %load-cell ] }
        { tagged-rep [ [ frame-reg ] dip %load-cell ] }
        { float-rep [ [ frame-reg ] dip LFS ] }
        { double-rep [ [ frame-reg ] dip LFD ] }
        { vector-rep [ scratch-reg swap LI frame-reg scratch-reg LVX ] }
        { scalar-rep [ scratch-reg swap LI frame-reg scratch-reg LVX ] }
    } case
    rep scratch-reg-class rep vreg %spill ;

! Common frame of every alien call:
!   1. store the stack inputs
!   2. load the register inputs
!   3. run quot, which emits the call itself
!   4. spill the live register outputs
!   5. discard the dead outputs
! varargs?, cleanup and stack-size are consumed but not used.
:: emit-alien-insn ( varargs? reg-inputs stack-inputs reg-outputs dead-outputs cleanup stack-size quot -- )
    stack-inputs [ first3 store-stack-param ] each
    reg-inputs [ first3 store-reg-param ] each
    quot call
    reg-outputs [ first3 load-reg-param ] each
    dead-outputs [ first2 discard-reg-param ] each ; inline

! Call a named C function: the top three inputs are captured into
! the %c-invoke quotation and the rest go to emit-alien-insn.
M: ppc %alien-invoke
    '[ _ _ _ %c-invoke ] emit-alien-insn ;

! Call through a function pointer held in src.
! emit-alien-insn takes eight inputs beginning with varargs?, so
! varargs? is forwarded along with the other seven; leaving it out
! makes the call unbalanced.
! When has-toc is true, src is treated as the address of a
! descriptor: r2 is loaded from its cell 1 and the call target from
! its cell 0. Otherwise src itself is the call target.
M:: ppc %alien-indirect ( src varargs? reg-inputs stack-inputs reg-outputs dead-outputs cleanup stack-size gc-map -- )
    varargs? reg-inputs stack-inputs reg-outputs dead-outputs cleanup stack-size [
        has-toc [
            11 src load-param
            2 11 1 cells %load-cell
            11 11 0 cells %load-cell
        ] [
            11 src load-param
        ] if
        11 MTCTR
        BCTRL
        gc-map gc-map-here
    ] emit-alien-insn ;

! Inline assembly: the quotation on top of the stack is captured
! and called with effect ( -- ) in place of a call instruction.
M: ppc %alien-assembly
    '[ _ call( -- ) ] emit-alien-insn ;

! Callback entry: receive the register inputs and the stack inputs,
! then call begin_callback with the VM pointer in r3 and 0 in r4.
M: ppc %callback-inputs
    [ [ first3 load-reg-param ] each ]
    [ [ first3 load-stack-param ] each ] bi*
    3 vm-reg MR
    4 0 LI
    "begin_callback" f f %c-invoke ;

! Callback exit: call end_callback with the VM pointer in r3, then
! load the register outputs.
M: ppc %callback-outputs
    3 vm-reg MR
    "end_callback" f f %c-invoke
    [ first3 store-reg-param ] each ;

! Always 0, whatever the three inputs are.
M: ppc stack-cleanup 3drop 0 ;

M: ppc fused-unboxing? f ;

! Load the address of a C global: a zero cell-sized immediate load
! into the destination register, relocated through rel-dlsym.
M: ppc %alien-global
    [ 0 %load-cell-imm ] 2dip %load-cell-imm-rc rel-dlsym ;

! Load / store a cell at an offset from vm-reg.
M: ppc %vm-field [ vm-reg ] dip %load-cell ;
M: ppc %set-vm-field [ vm-reg ] dip %store-cell ;

! Load the cell at alien-offset from the source register, using
! scratch-reg as the index register.
M: ppc %unbox-alien
    scratch-reg alien-offset LI
    scratch-reg %load-cell-x ;

! 
Convert a c-ptr object to a raw C pointer. ! if (src == F_TYPE) ! dst = NULL; ! else if ((src & tag_mask) == ALIEN_TYPE) ! dst = ((alien*)src)->address; ! else // Assume (src & tag_mask) == BYTE_ARRAY_TYPE ! dst = ((byte_array*)src) + 1; M:: ppc %unbox-any-c-ptr ( dst src -- )