! Copyright (C) 2004, 2011 Slava Pestov. ! See http://factorcode.org/license.txt for BSD license. USING: alien alien.strings arrays byte-arrays generic hashtables hashtables.private io io.binary io.files io.encodings.binary io.pathnames kernel kernel.private math namespaces make parser prettyprint sequences combinators.smart strings sbufs vectors words quotations assocs system layouts splitting grouping growable classes classes.private classes.builtin classes.tuple classes.tuple.private vocabs vocabs.loader source-files definitions debugger quotations.private combinators combinators.short-circuit math.order math.private accessors slots.private generic.single.private compiler.units compiler.constants compiler.codegen.relocation fry locals bootstrap.image.syntax parser.notes ; IN: bootstrap.image : arch ( os cpu -- arch ) 2dup [ windows? ] [ ppc? ] bi* or [ [ drop unix ] dip ] unless [ name>> ] [ name>> ] bi* "-" glue ; : my-arch ( -- arch ) os cpu arch ; : boot-image-name ( arch -- string ) "boot." ".image" surround ; : my-boot-image-name ( -- string ) my-arch boot-image-name ; : images ( -- seq ) { "windows-x86.32" "unix-x86.32" "windows-x86.64" "unix-x86.64" } ; eql-wrapper M: eql-wrapper hashcode* obj>> hashcode* ; GENERIC: (eql?) ( obj1 obj2 -- ? ) : eql? ( obj1 obj2 -- ? ) { [ [ class-of ] bi@ = ] [ (eql?) ] } 2&& ; M: fixnum (eql?) eq? ; M: bignum (eql?) = ; M: float (eql?) fp-bitwise= ; M: sequence (eql?) 2dup [ length ] bi@ = [ [ eql? ] 2all? ] [ 2drop f ] if ; M: object (eql?) = ; M: eql-wrapper equal? over eql-wrapper? [ [ obj>> ] bi@ eql? ] [ 2drop f ] if ; TUPLE: eq-wrapper { obj read-only } ; C: eq-wrapper M: eq-wrapper equal? over eq-wrapper? [ [ obj>> ] bi@ eq? ] [ 2drop f ] if ; M: eq-wrapper hashcode* nip obj>> identity-hashcode ; SYMBOL: objects : cache-eql-object ( obj quot -- value ) [ objects get ] dip '[ obj>> @ ] cache ; inline : cache-eq-object ( obj quot -- value ) [ objects get ] dip '[ obj>> @ ] cache ; inline : lookup-object ( obj -- n/f ) objects get at ; : put-object ( n obj -- ) objects get set-at ; ! Constants CONSTANT: image-magic HEX: 0f0e0d0c CONSTANT: image-version 4 CONSTANT: data-base 1024 CONSTANT: special-objects-size 80 CONSTANT: header-size 10 CONSTANT: data-heap-size-offset 3 CONSTANT: t-offset 6 CONSTANT: 0-offset 7 CONSTANT: 1-offset 8 CONSTANT: -1-offset 9 SYMBOL: sub-primitives :: jit-conditional ( test-quot false-quot -- ) [ 0 test-quot call ] B{ } make length :> len building get length extra-offset get + len + [ extra-offset set false-quot call ] B{ } make [ length test-quot call ] [ % ] bi ; inline : make-jit ( quot -- parameters literals code ) #! code is a { relocation insns } pair [ 0 extra-offset set init-relocation call( -- ) parameter-table get >array literal-table get >array relocation-table get >byte-array ] B{ } make 2array ; : make-jit-no-params ( quot -- code ) make-jit 2nip ; : jit-define ( quot name -- ) [ make-jit-no-params ] dip set ; : define-sub-primitive ( quot word -- ) [ make-jit 3array ] dip sub-primitives get set-at ; : define-combinator-primitive ( quot non-tail-quot tail-quot word -- ) [ [ [ make-jit ] [ make-jit-no-params ] [ make-jit-no-params ] tri* ] output>array ] dip sub-primitives get set-at ; ! The image being constructed; a vector of word-size integers SYMBOL: image ! Image output format SYMBOL: big-endian ! Bootstrap architecture name SYMBOL: architecture RESET ! Boot quotation, set in stage1.factor SPECIAL-OBJECT: bootstrap-startup-quot 20 ! Bootstrap global namesapce SPECIAL-OBJECT: bootstrap-global 21 ! JIT parameters SPECIAL-OBJECT: jit-prolog 23 SPECIAL-OBJECT: jit-primitive-word 24 SPECIAL-OBJECT: jit-primitive 25 SPECIAL-OBJECT: jit-word-jump 26 SPECIAL-OBJECT: jit-word-call 27 SPECIAL-OBJECT: jit-if-word 28 SPECIAL-OBJECT: jit-if 29 SPECIAL-OBJECT: jit-safepoint 30 SPECIAL-OBJECT: jit-epilog 31 SPECIAL-OBJECT: jit-return 32 SPECIAL-OBJECT: jit-profiling 33 SPECIAL-OBJECT: jit-push 34 SPECIAL-OBJECT: jit-dip-word 35 SPECIAL-OBJECT: jit-dip 36 SPECIAL-OBJECT: jit-2dip-word 37 SPECIAL-OBJECT: jit-2dip 38 SPECIAL-OBJECT: jit-3dip-word 39 SPECIAL-OBJECT: jit-3dip 40 SPECIAL-OBJECT: jit-execute 41 SPECIAL-OBJECT: jit-declare-word 42 SPECIAL-OBJECT: c-to-factor-word 43 SPECIAL-OBJECT: lazy-jit-compile-word 44 SPECIAL-OBJECT: unwind-native-frames-word 45 SPECIAL-OBJECT: fpu-state-word 46 SPECIAL-OBJECT: set-fpu-state-word 47 SPECIAL-OBJECT: signal-handler-word 48 SPECIAL-OBJECT: leaf-signal-handler-word 49 SPECIAL-OBJECT: ffi-signal-handler-word 50 SPECIAL-OBJECT: ffi-leaf-signal-handler-word 51 SPECIAL-OBJECT: callback-stub 53 ! PIC stubs SPECIAL-OBJECT: pic-load 54 SPECIAL-OBJECT: pic-tag 55 SPECIAL-OBJECT: pic-tuple 56 SPECIAL-OBJECT: pic-check-tag 57 SPECIAL-OBJECT: pic-check-tuple 58 SPECIAL-OBJECT: pic-hit 59 SPECIAL-OBJECT: pic-miss-word 60 SPECIAL-OBJECT: pic-miss-tail-word 61 ! Megamorphic dispatch SPECIAL-OBJECT: mega-lookup 62 SPECIAL-OBJECT: mega-lookup-word 63 SPECIAL-OBJECT: mega-miss-word 64 ! Default definition for undefined words SPECIAL-OBJECT: undefined-quot 65 : special-object-offset ( symbol -- n ) special-objects get at header-size + ; : emit ( cell -- ) image get push ; : emit-64 ( cell -- ) bootstrap-cell 8 = [ emit ] [ d>w/w big-endian get [ swap ] unless emit emit ] if ; : emit-seq ( seq -- ) image get push-all ; : fixup ( value offset -- ) image get set-nth ; : heap-size ( -- size ) image get length header-size - special-objects-size - bootstrap-cells ; : here ( -- size ) heap-size data-base + ; : here-as ( tag -- pointer ) here bitor ; : (align-here) ( alignment -- ) [ here neg ] dip rem [ bootstrap-cell /i [ 0 emit ] times ] unless-zero ; : align-here ( -- ) data-alignment get (align-here) ; : emit-fixnum ( n -- ) tag-fixnum emit ; : emit-header ( n -- ) tag-header emit ; : emit-object ( class quot -- addr ) [ type-number ] dip over here-as [ swap emit-header call align-here ] dip ; inline ! Write an object to the image. GENERIC: ' ( obj -- ptr ) ! Image header : emit-image-header ( -- ) image-magic emit image-version emit data-base emit ! relocation base at end of header 0 emit ! size of data heap set later 0 emit ! reloc base of code heap is 0 0 emit ! size of code heap is 0 0 emit ! pointer to t object 0 emit ! pointer to bignum 0 0 emit ! pointer to bignum 1 0 emit ! pointer to bignum -1 special-objects-size [ f ' emit ] times ; : emit-special-object ( symbol -- ) [ get ' ] [ special-object-offset ] bi fixup ; ! Bignums : bignum-bits ( -- n ) bootstrap-cell-bits 2 - ; : bignum-radix ( -- n ) bignum-bits 2^ 1 - ; : bignum>seq ( n -- seq ) #! n is positive or zero. [ dup 0 > ] [ [ bignum-bits neg shift ] [ bignum-radix bitand ] bi ] produce nip ; : emit-bignum ( n -- ) dup dup 0 < [ neg ] when bignum>seq [ nip length 1 + emit-fixnum ] [ drop 0 < 1 0 ? emit ] [ nip emit-seq ] 2tri ; M: bignum ' [ bignum [ emit-bignum ] emit-object ] cache-eql-object ; ! Fixnums M: fixnum ' #! When generating a 32-bit image on a 64-bit system, #! some fixnums should be bignums. dup bootstrap-most-negative-fixnum bootstrap-most-positive-fixnum between? [ tag-fixnum ] [ >bignum ' ] if ; TUPLE: fake-bignum n ; C: fake-bignum M: fake-bignum ' n>> tag-fixnum ; ! Floats M: float ' [ float [ 8 (align-here) double>bits emit-64 ] emit-object ] cache-eql-object ; ! Special objects ! Padded with fixnums for 8-byte alignment : t, ( -- ) t t-offset fixup ; M: f ' drop \ f type-number ; : 0, ( -- ) 0 >bignum ' 0-offset fixup ; : 1, ( -- ) 1 >bignum ' 1-offset fixup ; : -1, ( -- ) -1 >bignum ' -1-offset fixup ; ! Words : word-sub-primitive ( word -- obj ) [ target-word ] with-global sub-primitives get at ; : emit-word ( word -- ) [ [ subwords [ emit-word ] each ] [ [ { [ hashcode , ] [ name>> , ] [ vocabulary>> , ] [ def>> , ] [ props>> , ] [ pic-def>> , ] [ pic-tail-def>> , ] [ drop 0 , ] ! count [ word-sub-primitive , ] [ drop 0 , ] ! xt [ drop 0 , ] ! code [ drop 0 , ] ! profiling } cleave ] { } make [ ' ] map ] bi \ word [ emit-seq ] emit-object ] keep put-object ; : word-error ( word msg -- * ) [ % dup vocabulary>> % " " % name>> % ] "" make throw ; : transfer-word ( word -- word ) [ target-word ] keep or ; : fixup-word ( word -- offset ) transfer-word dup lookup-object [ ] [ "Not in image: " word-error ] ?if ; : fixup-words ( -- ) image get [ dup word? [ fixup-word ] when ] map! drop ; M: word ' ; ! Wrappers M: wrapper ' [ wrapped>> ' wrapper [ emit ] emit-object ] cache-eql-object ; ! Strings : native> ( object -- object ) big-endian get [ [ be> ] map ] [ [ le> ] map ] if ; : emit-bytes ( seq -- ) bootstrap-cell native> emit-seq ; : pad-bytes ( seq -- newseq ) dup length bootstrap-cell align 0 pad-tail ; : extended-part ( str -- str' ) dup [ 128 < ] all? [ drop f ] [ [ -7 shift 1 bitxor ] { } map-as big-endian get [ [ 2 >be ] { } map-as ] [ [ 2 >le ] { } map-as ] if B{ } join ] if ; : ascii-part ( str -- str' ) [ [ 128 mod ] [ 128 >= ] bi [ 128 bitor ] when ] B{ } map-as ; : emit-string ( string -- ptr ) [ length ] [ extended-part ' ] [ ] tri string [ [ emit-fixnum ] [ emit ] [ f ' emit ascii-part pad-bytes emit-bytes ] tri* ] emit-object ; M: string ' #! We pool strings so that each string is only written once #! to the image [ emit-string ] cache-eql-object ; : assert-empty ( seq -- ) length 0 assert= ; : emit-dummy-array ( obj type -- ptr ) [ assert-empty ] [ [ 0 emit-fixnum ] emit-object ] bi* ; M: byte-array ' [ byte-array [ dup length emit-fixnum bootstrap-cell 4 = [ 0 emit 0 emit ] when pad-bytes emit-bytes ] emit-object ] cache-eq-object ; ! Tuples ERROR: tuple-removed class ; : require-tuple-layout ( word -- layout ) dup tuple-layout [ ] [ tuple-removed ] ?if ; : (emit-tuple) ( tuple -- pointer ) [ tuple-slots ] [ class-of transfer-word require-tuple-layout ] bi prefix [ ' ] map tuple [ emit-seq ] emit-object ; : emit-tuple ( tuple -- pointer ) dup class-of name>> "tombstone" = [ [ (emit-tuple) ] cache-eql-object ] [ [ (emit-tuple) ] cache-eq-object ] if ; M: tuple ' emit-tuple ; M: tombstone ' state>> "((tombstone))" "((empty))" ? "hashtables.private" lookup def>> first [ emit-tuple ] cache-eql-object ; ! Arrays : emit-array ( array -- offset ) [ ' ] map array [ [ length emit-fixnum ] [ emit-seq ] bi ] emit-object ; M: array ' [ emit-array ] cache-eq-object ; ! This is a hack. We need to detect arrays which are tuple ! layout arrays so that they can be internalized, but making ! them a built-in type is not worth it. PREDICATE: tuple-layout-array < array dup length 5 >= [ [ first tuple-class? ] [ second fixnum? ] [ third fixnum? ] tri and and ] [ drop f ] if ; M: tuple-layout-array ' [ [ dup integer? [ ] when ] map emit-array ] cache-eql-object ; ! Quotations M: quotation ' [ array>> ' quotation [ emit ! array f ' emit ! cached-effect f ' emit ! cache-counter 0 emit ! xt 0 emit ! code ] emit-object ] cache-eql-object ; ! End of the image : emit-words ( -- ) all-words [ emit-word ] each ; : emit-global ( -- ) { dictionary source-files builtins update-map implementors-map } [ [ bootstrap-word ] [ get ] bi ] H{ } map>assoc { class<=-cache class-not-cache classes-intersect-cache class-and-cache class-or-cache next-method-quot-cache } [ H{ } clone ] H{ } map>assoc assoc-union bootstrap-global set ; : emit-jit-data ( -- ) \ if jit-if-word set \ do-primitive jit-primitive-word set \ dip jit-dip-word set \ 2dip jit-2dip-word set \ 3dip jit-3dip-word set \ inline-cache-miss pic-miss-word set \ inline-cache-miss-tail pic-miss-tail-word set \ mega-cache-lookup mega-lookup-word set \ mega-cache-miss mega-miss-word set \ declare jit-declare-word set \ c-to-factor c-to-factor-word set \ lazy-jit-compile lazy-jit-compile-word set \ unwind-native-frames unwind-native-frames-word set \ fpu-state fpu-state-word set \ set-fpu-state set-fpu-state-word set \ signal-handler signal-handler-word set \ leaf-signal-handler leaf-signal-handler-word set \ ffi-signal-handler ffi-signal-handler-word set \ ffi-leaf-signal-handler ffi-leaf-signal-handler-word set undefined-def undefined-quot set ; : emit-special-objects ( -- ) special-objects get keys [ emit-special-object ] each ; : fixup-header ( -- ) heap-size data-heap-size-offset fixup ; : build-generics ( -- ) [ all-words [ generic? ] filter [ make-generic ] each ] with-compilation-unit ; : build-image ( -- image ) 800000 image set 20000 objects set emit-image-header t, 0, 1, -1, "Building generic words..." print flush build-generics "Serializing words..." print flush emit-words "Serializing JIT data..." print flush emit-jit-data "Serializing global namespace..." print flush emit-global "Serializing special object table..." print flush emit-special-objects "Performing word fixups..." print flush fixup-words "Performing header fixups..." print flush fixup-header "Image length: " write image get length . "Object cache size: " write objects get assoc-size . \ word global delete-at image get ; ! Image output : (write-image) ( image -- ) bootstrap-cell big-endian get [ '[ _ >be write ] each ] [ '[ _ >le write ] each ] if ; : write-image ( image -- ) "Writing image to " write architecture get boot-image-name resource-path [ write "..." print flush ] [ binary [ (write-image) ] with-file-writer ] bi ; PRIVATE> : make-image ( arch -- ) [ parser-quiet? off auto-use? off architecture set "resource:/core/bootstrap/stage1.factor" run-file build-image write-image ] with-scope ; : make-images ( -- ) images [ make-image ] each ;