1 ! Copyright (C) 2008, 2009 Doug Coleman, Daniel Ehrenberg.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors kernel math math.order words combinators locals
4 ascii unicode.categories combinators.short-circuit sequences ;
5 QUALIFIED-WITH: multi-methods m
! Singleton classes naming the built-in character classes. Each one is a
! dispatch target for a class-member? method elsewhere in this file.
! No class-member? method for blank-class or word-boundary-class is visible
! in this listing.
! NOTE(review): every line of this listing starts with an integer that looks
! like a rendered line number rather than program text, and the numbering
! skips, so some lines appear to be missing -- confirm against the real file.
8 SINGLETONS: any-char any-char-no-nl
9 letter-class LETTER-class Letter-class digit-class
10 alpha-class non-newline-blank-class
11 ascii-class punctuation-class java-printable-class blank-class
12 control-character-class hex-digit-class java-blank-class c-identifier-class
13 unmatchable-class terminator-class word-boundary-class ;
! Singleton classes for the input anchors: the long names and the one-character
! names ^ and $ are declared as four separate singletons.
15 SINGLETONS: beginning-of-input ^ end-of-input $ ;
! A character range with two slots, from and to. Its class-member? method
! tests a value against these two bounds with between?.
17 TUPLE: range from to ;
! Membership test: is obj a member of the character class `class`?
! Being a single-dispatch GENERIC:, it dispatches on the top stack item, i.e.
! on the class, not on obj.
20 GENERIC: class-member? ( obj class -- ? )
! The class t contains everything: both inputs are discarded and t is returned.
22 M: t class-member? ( obj class -- ? ) 2drop t ;
! An integer used as a class contains exactly itself: obj is a member when it
! is = to that integer.
24 M: integer class-member? ( obj class -- ? ) = ;
! obj is a member of a range when it lies between the range's from and to
! slots. bi unpacks both slots, leaving ( obj from to ) for between?.
26 M: range class-member? ( obj class -- ? )
27 [ from>> ] [ to>> ] bi between? ;
29 M: any-char class-member? ( obj class -- ? )
32 M: any-char-no-nl class-member? ( obj class -- ? )
35 M: letter-class class-member? ( obj class -- ? )
38 M: LETTER-class class-member? ( obj class -- ? )
41 M: Letter-class class-member? ( obj class -- ? )
44 M: ascii-class class-member? ( obj class -- ? )
47 M: digit-class class-member? ( obj class -- ? )
! True when ch satisfies alpha? or is the underscore character.
! 1|| applies each quotation to the single input and stops at the first
! quotation that yields a true value.
50 : c-identifier-char? ( ch -- ? )
51 { [ alpha? ] [ CHAR: _ = ] } 1|| ;
! Membership in c-identifier-class: the singleton itself carries no data, so
! it is dropped and the decision is delegated to c-identifier-char?.
53 M: c-identifier-class class-member? ( obj class -- ? )
54 drop c-identifier-char? ;
56 M: alpha-class class-member? ( obj class -- ? )
60 "!\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~" member? ;
62 M: punctuation-class class-member? ( obj class -- ? )
! True when ch satisfies alpha? or punct?; 1|| short-circuits on the first
! test that succeeds.
! NOTE(review): the definition header of punct? is not visible in this
! listing -- confirm it is defined before this word.
65 : java-printable? ( ch -- ? )
66 { [ alpha? ] [ punct? ] } 1|| ;
! Membership in java-printable-class: drops the singleton and delegates to
! java-printable?.
68 M: java-printable-class class-member? ( obj class -- ? )
69 drop java-printable? ;
! Membership in non-newline-blank-class: obj must satisfy blank? and must not
! be the newline character. 1&& applies both tests to the same input and
! stops at the first one that fails.
71 M: non-newline-blank-class class-member? ( obj class -- ? )
72 drop { [ blank? ] [ CHAR: \n = not ] } 1&& ;
74 M: control-character-class class-member? ( obj class -- ? )
77 : hex-digit? ( ch -- ? )
79 [ CHAR: A CHAR: F between? ]
80 [ CHAR: a CHAR: f between? ]
81 [ CHAR: 0 CHAR: 9 between? ]
84 M: hex-digit-class class-member? ( obj class -- ? )
87 : java-blank? ( ch -- ? )
89 CHAR: \s CHAR: \t CHAR: \n
90 HEX: b HEX: 7 CHAR: \r
93 M: java-blank-class class-member? ( obj class -- ? )
96 M: unmatchable-class class-member? ( obj class -- ? )
! Membership in terminator-class: obj must be one of the characters in the
! literal string below -- carriage return, newline, U+0085, U+2029 or U+2028.
99 M: terminator-class class-member? ( obj class -- ? )
100 drop "\r\n\u000085\u002029\u002028" member? ;
102 M: ^ class-member? ( obj class -- ? )
105 M: $ class-member? ( obj class -- ? )
! The class f contains nothing: both inputs are discarded and f is returned.
108 M: f class-member? 2drop f ;
! Tuple types for composite classes.
! primitive-class wraps a single class in its `class` slot; C: defines
! <primitive-class> as its by-order-of-arguments constructor.
110 TUPLE: primitive-class class ;
111 C: <primitive-class> primitive-class
! or-class holds a sequence of alternatives; membership is tested with any?.
113 TUPLE: or-class seq ;
! not-class holds the class being negated.
115 TUPLE: not-class class ;
! and-class holds a sequence of classes; membership is tested with all?.
117 TUPLE: and-class seq ;
! Multi-method generic (multi-methods vocabulary, qualified as m) that tries to
! merge two classes that are being ANDed together.
! Outputs the merged class and a flag; try-combine reads the flag as "a
! combination was produced" and retries with the arguments swapped when it is f.
119 m:GENERIC: combine-and ( class1 class2 -- combined ? )
121 : replace-if-= ( object object -- object ? )
! Fallback for any pair of objects: delegates to replace-if-=.
! NOTE(review): the body of replace-if-= is not visible in this listing.
124 m:METHOD: combine-and { object object } replace-if-= ;
! Two integers ANDed together: equal integers collapse to that integer;
! different integers collapse to f (the class with no members). Either way the
! flag is t, because a combined result was produced.
126 m:METHOD: combine-and { integer integer }
127 2dup = [ drop t ] [ 2drop f t ] if ;
129 m:METHOD: combine-and { t object }
132 m:METHOD: combine-and { f object }
! A not-class ANDed with another object: when the negated class is = to the
! other object the pair collapses to f with flag t; otherwise no
! combination is reported ( f f ).
135 m:METHOD: combine-and { not-class object }
136 [ class>> ] dip = [ f t ] [ f f ] if ;
! An integer ANDed with another class: if the integer is a member of that
! class the result is the integer alone (the class is dropped); otherwise the
! result is f. The flag is t in both cases.
138 m:METHOD: combine-and { integer object }
139 2dup class-member? [ drop t ] [ 2drop f t ] if ;
! Multi-method generic (multi-methods vocabulary, qualified as m) that tries to
! merge two classes that are being ORed together.
! Outputs the merged class and a flag; try-combine reads the flag as "a
! combination was produced" and retries with the arguments swapped when it is f.
141 m:GENERIC: combine-or ( class1 class2 -- combined ? )
! Fallback for any pair of objects: delegates to replace-if-=.
! NOTE(review): the body of replace-if-= is not visible in this listing.
143 m:METHOD: combine-or { object object } replace-if-= ;
! Two integers ORed together: equal integers collapse to that integer with
! flag t; different integers cannot be merged, so ( f f ) is returned.
145 m:METHOD: combine-or { integer integer }
146 2dup = [ drop t ] [ 2drop f f ] if ;
148 m:METHOD: combine-or { t object }
151 m:METHOD: combine-or { f object }
! A not-class ORed with another object: when the negated class is = to the
! other object the pair collapses to t (the class containing everything) with
! flag t; otherwise no combination is reported ( f f ).
154 m:METHOD: combine-or { not-class object }
155 [ class>> ] dip = [ t t ] [ f f ] if ;
! An integer ORed with another class: if the integer is already a member of
! that class the result is the class alone (nip discards the integer) with
! flag t; otherwise no combination is reported ( f f ).
157 m:METHOD: combine-or { integer object }
158 2dup class-member? [ nip t ] [ 2drop f f ] if ;
! Tries quot on ( elt1 elt2 ) and, if that fails, on ( elt2 elt1 ).
! 3dup keeps a copy of all three inputs for the retry. When the first call's
! flag is true, the copies are discarded from under the result and
! ( combined t ) is returned. When it is false, the failed result is dropped,
! swapd exchanges the two elements beneath quot, and the second call's
! outputs are returned unchanged.
160 : try-combine ( elt1 elt2 quot -- combined/f ? )
161 3dup call [ [ 3drop ] dip t ] [ drop swapd call ] if ; inline
163 :: prefix-combining ( seq elt quot: ( elt1 elt2 -- combined/f ? ) -- newseq )
165 seq [ elt quot try-combine swap combined! ] find drop
166 [ seq remove-nth combined prefix ]
167 [ seq elt prefix ] if* ; inline
169 :: combine ( seq quot: ( elt1 elt2 -- combined/f ? ) empty class -- newseq )
170 seq { } [ quot prefix-combining ] reduce
174 [ drop class new swap >>seq ]
! Builds the conjunction of the classes in seq by calling combine with
! combine-and as the pairwise merging quotation, t as combine's `empty`
! argument and and-class as its `class` argument.
! NOTE(review): parts of combine's body are missing from this listing.
177 : <and-class> ( seq -- class )
178 [ combine-and ] t and-class combine ;
! obj is a member of an and-class when it is a member of every class in the
! seq slot. `with` fixes obj as the first input of class-member? for each
! element.
180 M: and-class class-member?
181 seq>> [ class-member? ] with all? ;
! Builds the disjunction of the classes in seq by calling combine with
! combine-or as the pairwise merging quotation, f as combine's `empty`
! argument and or-class as its `class` argument.
! NOTE(review): parts of combine's body are missing from this listing.
183 : <or-class> ( seq -- class )
184 [ combine-or ] f or-class combine ;
! obj is a member of an or-class when it is a member of at least one class in
! the seq slot. `with` fixes obj as the first input of class-member? for each
! element.
186 M: or-class class-member?
187 seq>> [ class-member? ] with any? ;
189 : <not-class> ( class -- inverse )
193 [ dup not-class? [ class>> ] [ not-class boa ] if ]
! obj is a member of a not-class exactly when it is not a member of the
! wrapped class.
196 M: not-class class-member?
197 class>> class-member? not ;
! A primitive-class is a plain wrapper: membership is delegated to the class
! stored in its `class` slot.
199 M: primitive-class class-member?
200 class>> class-member? ;
! Union type covering the tuple-based class representations primitive-class,
! not-class, or-class and range.
! NOTE(review): and-class is not listed as a member -- confirm that is
! intentional.
202 UNION: class primitive-class not-class or-class range ;