1 ! Copyright (C) 2005, 2009 Daniel Ehrenberg, Doug Coleman.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: namespaces math kernel sequences accessors fry circular
4 unicode.case unicode.categories locals combinators.short-circuit
5 make combinators io splitting math.parser ;
! A cursor over a sequence: `sequence` holds the data being parsed and `n`
! is the index the other words in this file read from and advance.
TUPLE: sequence-parser
    sequence
    n ;
! Wrap `sequence` in a new sequence-parser whose cursor starts at index 0.
: <sequence-parser> ( sequence -- sequence-parser )
    ! boa fills the slots in declaration order: sequence first, then n.
    0 sequence-parser boa ;
! Element located `offset` positions away from the cursor. ?nth yields f
! instead of throwing when the resulting index is outside the sequence.
: offset ( sequence-parser offset -- char/f )
    ! bi works on the top of the stack, and both quotations read slots of
    ! the parser, so the parser must be brought above the offset first.
    swap
    [ n>> + ] [ sequence>> ?nth ] bi ; inline
! Element under the cursor (offset 0), or f when there is none.
: current ( sequence-parser -- char/f )
    0 offset ; inline
! Element one position before the cursor (offset -1), or f when there is
! none.
: previous ( sequence-parser -- char/f )
    -1 offset ; inline
! Element one position after the cursor (offset 1), or f when there is
! none. The cursor itself is not moved.
: peek-next ( sequence-parser -- char/f )
    1 offset ; inline
! Move the cursor forward by one element and leave the parser on the stack.
: advance ( sequence-parser -- sequence-parser )
    dup n>> 1 + >>n ; inline
! Move the cursor forward by one element, leaving nothing on the stack.
: advance* ( sequence-parser -- )
    advance drop ; inline
! Return the element under the cursor, then step the cursor past it.
: get+increment ( sequence-parser -- char/f )
    [ current ] keep advance drop ; inline
! Advance the cursor until `quot`, called with the parser, returns true or
! there is no current element left. The cursor stops on the element for
! which `quot` succeeded.
:: skip-until ( sequence-parser quot: ( obj -- ? ) -- )
    ! Keep looping while an element is present and quot rejects it.
    [ sequence-parser current [ sequence-parser quot call not ] [ f ] if ]
    [ sequence-parser advance drop ]
    while ; inline
! True when there is no element under the cursor.
: sequence-parse-end? ( sequence-parser -- ? )
    current not ;
! Collect the elements from the cursor up to, but not including, the first
! position at which `quot` (called with the parser) returns true, and leave
! the cursor on that position. Returns f when the parser is already at its
! end.
: take-until ( sequence-parser quot: ( obj -- ? ) -- sequence/f )
    over sequence-parse-end? [
        2drop f
    ] [
        [ drop n>> ]                        ! start index, read before moving
        [ skip-until ]                      ! move the cursor
        [ drop [ n>> ] [ sequence>> ] bi ]  ! end index and source sequence
        2tri subseq
    ] if ; inline
! Collect elements for as long as `quot` holds: the predicate is negated
! and handed to take-until.
: take-while ( sequence-parser quot: ( obj -- ? ) -- sequence/f )
    '[ @ not ] take-until ; inline
! Build a slice of `seq` covering [from, to). `slice boa` performs no
! validation, so the bounds are checked here first; the result is f when
! from is negative, to exceeds the length of seq, or from exceeds to.
: <safe-slice> ( from to seq -- slice/f )
    3dup {
        [ 2drop 0 < ]                  ! from < 0
        [ [ drop ] 2dip length > ]     ! to > length of seq
        [ drop > ]                     ! from > to
    } 3|| [ 3drop f ] [ slice boa ] if ; inline
! If the elements at the cursor equal `sequence`, move the cursor past
! them and return `sequence`; otherwise return f and leave the cursor
! where it was.
:: take-sequence ( sequence-parser sequence -- obj/f )
    ! Slice [n, n + length of sequence) of the input; f if out of range.
    sequence-parser [ n>> dup sequence length + ] [ sequence>> ] bi
    <safe-slice> sequence sequence= [
        sequence
        sequence-parser [ sequence length + ] change-n drop
    ] [
        f
    ] if ;
! Like take-sequence, but the result is discarded: only the cursor
! movement (if any) remains.
: take-sequence* ( sequence-parser sequence -- )
    take-sequence drop ;
! Collect the elements from the cursor up to the next occurrence of
! `sequence` and leave the cursor on the first element of that occurrence.
! When `sequence` is not found the cursor is restored and f is returned.
:: take-until-sequence ( sequence-parser sequence -- sequence'/f )
    sequence-parser n>> :> saved
    ! Circular buffer sized to `sequence`; fed one element per step below.
    sequence length <growing-circular> :> growing
    sequence-parser
    [
        current growing push-growing-circular
        sequence growing sequence=
    ] take-until :> found
    growing sequence sequence= [
        ! take-until stopped on the last element of the match, so `found`
        ! carries all but that last element of it; trim those off.
        found dup length
        growing length 1 - - head
        ! Step back from the last element of the match to its first.
        sequence-parser [ growing length - 1 + ] change-n drop
        ! sequence-parser advance drop
    ] [
        saved sequence-parser (>>n)
        f
    ] if ;
! Same result as take-until-sequence, but on success the cursor is also
! moved forward by the length of `sequence`.
:: take-until-sequence* ( sequence-parser sequence -- sequence'/f )
    sequence-parser sequence take-until-sequence :> out
    out [
        sequence-parser [ sequence length + ] change-n drop
    ] when
    out ;
! Move the cursor to the next element that is not blank? and return the
! parser. The skipped elements are discarded.
: skip-whitespace ( sequence-parser -- sequence-parser )
    dup [ current blank? not ] take-until drop ;
! Tail slice of the underlying sequence starting at the cursor, or f when
! the cursor index is greater than the sequence length. The cursor is not
! moved.
: take-rest-slice ( sequence-parser -- sequence/f )
    [ sequence>> ] [ n>> ] bi
    over length over < [ 2drop f ] [ tail-slice ] if ; inline
! Result of take-rest-slice converted with `like` to the type of the
! underlying sequence.
: take-rest ( sequence-parser -- sequence )
    [ take-rest-slice ] keep sequence>> like ;
! take-until with the predicate "the current element equals `obj`".
: take-until-object ( sequence-parser obj -- sequence )
    ! After curry the quotation runs as: parser obj [ current ] dip =
    [ [ current ] dip = ] curry take-until ;
! Wrap `sequence` in a fresh sequence-parser and call `quot` with that
! parser on top of the stack.
: parse-sequence ( sequence quot -- )
    swap <sequence-parser> swap call ; inline
! Read a quoted string. The element under the cursor is stepped over
! without being inspected; elements are then collected up to the first
! `quote-char` that is not preceded by `escape-char`. On success the
! closing quote is consumed and the collected elements are returned. If no
! closing quote is found the cursor is restored and f is returned.
:: take-quoted-string ( sequence-parser escape-char quote-char -- string )
    sequence-parser n>> :> start-n
    sequence-parser advance
    [
        {
            ! an escaped quote is part of the string ...
            [ { [ previous escape-char = ] [ current quote-char = ] } 1&& ]
            ! ... and so is anything that is not a quote
            [ current quote-char = not ]
        } 1||
    ] take-while :> string
    sequence-parser current quote-char = [
        sequence-parser advance* string
    ] [
        start-n sequence-parser (>>n) f
    ] if ;
! Skip leading blanks, then collect elements up to the next element that
! is blank? or f.
: (take-token) ( sequence-parser -- string )
    skip-whitespace
    [ current dup blank? [ drop t ] [ f = ] if ] take-until ;
! Skip leading blanks, then read one token: a quoted string when the next
! element is `quote-char`, otherwise a run of non-blank elements. Returns f
! when nothing is left to read.
:: take-token* ( sequence-parser escape-char quote-char -- string/f )
    sequence-parser skip-whitespace
    ! case consumes the inspected element; the parser stays underneath it.
    dup current {
        { quote-char [ escape-char quote-char take-quoted-string ] }
        { f [ drop f ] }
        [ drop (take-token) ]
    } case ;
! take-token* with backslash as the escape character and the double quote
! as the quote character.
: take-token ( sequence-parser -- string/f )
    CHAR: \ CHAR: "
    take-token* ;
! Collect the run of digit? elements at the cursor and convert it with
! string>number.
: take-integer ( sequence-parser -- n/f )
    [ current digit? not ] take-until string>number ;
! Take `n` elements starting at the cursor and move the cursor past them.
! NOTE(review): the integers leading each line (144, 145, 148, 149) look
! like line numbers from a listing. The lines between them are not present
! here -- presumably the branch taken when fewer than `n` elements remain
! and the closing of the conditional -- so that case is left undescribed;
! confirm against the complete source.
144 :: take-n ( sequence-parser n -- seq/f )
! Condition: does cursor index + n exceed the length of the sequence?
145 n sequence-parser [ n>> + ] [ sequence>> length ] bi > [
! Copy the elements in [cursor, cursor + n) out of the underlying sequence ...
148 sequence-parser n>> dup n + sequence-parser sequence>> subseq
! ... then move the cursor forward by n.
149 sequence-parser [ n + ] change-n drop
! Pass the parser's whole underlying sequence to io's `write`, regardless
! of where the cursor is.
: write-full ( sequence-parser -- )
    sequence>> write ;
! Pass the result of take-rest (the input from the cursor onwards) to io's
! `write`.
: write-rest ( sequence-parser -- )
    take-rest write ;