1 ! Copyright (C) 2007, 2009 Slava Pestov.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors xmode.tokens xmode.rules xmode.keyword-map
4 xml.data xml.traversal xml assocs kernel combinators sequences
5 math.parser namespaces make parser lexer xmode.utilities
6 regexp io.files splitting arrays xml.syntax xml.syntax.private ;
7 IN: xmode.loader.syntax
9 ! Rule tag parsing utilities
! Creates a fresh instance of `class`, passes it to init-from-tag together
! with `tag` and `specs`, and hands whatever init-from-tag leaves behind to
! add-rule along with `rule-set`.
: (parse-rule-tag) ( rule-set tag specs class -- )
    swap [ new ] dip        ! rule-set tag instance specs
    init-from-tag
    swap add-rule ; inline
! NOTE(review): the header line that opens this definition is not visible
! in this listing; what follows is its body up to `; parsing`.
! Reads one raw token (scan) and two words (scan-word). While the last word
! is set aside by dip, the parsed definition is run under `{ } make` to
! collect an array, and that array plus the first scanned word are curried
! onto (parse-rule-tag). The token, the set-aside word and the resulting
! quotation are then passed to define-tag.
14 scan scan-word scan-word [
15 parse-definition { } make
16 swap [ (parse-rule-tag) ] 2curry
17 ] dip swap define-tag ; parsing
! Converts an attribute string to a boolean: t only when the input equals
! "TRUE" exactly; any other value, including f, gives f.
: string>boolean ( string -- ? )
    { "TRUE" } member? ;
! NOTE(review): only the signature of this word appears in this listing;
! its body and closing `;` are not shown, so its behaviour cannot be
! described from here.
22 : string>match-type ( string -- obj )
! Supplies the default rule set name: a non-f input is returned unchanged,
! while f is replaced by "MAIN".
: string>rule-set-name ( string -- name )
    [ "MAIN" ] unless* ;
! Reads the NAME and VALUE attributes of a tag and leaves them on the stack
! in that order.
: parse-prop-tag ( tag -- key value )
    [ "NAME" attr ] keep
    "VALUE" attr ;
! Runs parse-prop-tag on every element of the input sequence and stores
! each resulting key/value pair in a new assoc created from the H{ }
! exemplar.
! NOTE(review): the embedded listing numbers jump from 35 to 37, so a line
! between the signature and the body may be missing here - confirm against
! the original file.
35 : parse-props-tag ( tag -- assoc )
37 [ parse-prop-tag ] H{ } map>assoc ;
! Looks up the AT_LINE_START, AT_WHITESPACE_END and AT_WORD_START
! attributes of the tag, converts each one with string>boolean, and leaves
! the three results on the stack in that order.
! NOTE(review): the embedded listing numbers skip 40; a line may be missing
! from this view - confirm against the original file.
39 : position-attrs ( tag -- at-line-start? at-whitespace-end? at-word-start? )
41 { "AT_LINE_START" "AT_WHITESPACE_END" "AT_WORD_START" }
! `with` keeps the tag available while mapping over the attribute names.
42 [ attr string>boolean ] with map first3 ;
! Builds a matcher for a tag: <string-matcher> is called with the
! ignore-case? slot of the value held in the rule-set variable on top of
! the stack, and its result is combined by <matcher> with the tag's
! position-attrs flags.
! NOTE(review): the embedded listing numbers skip 45, so a line that
! prepares the stack before this body may be missing - confirm against the
! original file.
44 : parse-literal-matcher ( tag -- matcher )
46 rule-set get ignore-case?>> <string-matcher>
47 swap position-attrs <matcher> ;
! Builds a matcher for a tag: <?insensitive-regexp> is called with the
! ignore-case? slot of the value held in the rule-set variable on top of
! the stack, and its result is combined by <matcher> with the tag's
! position-attrs flags.
! NOTE(review): the embedded listing numbers skip 50, so a line that
! prepares the stack before this body may be missing - confirm against the
! original file.
49 : parse-regexp-matcher ( tag -- matcher )
51 rule-set get ignore-case?>> <?insensitive-regexp>
52 swap position-attrs <matcher> ;
! Appends one attribute spec to the sequence being built by the enclosing
! `make`: the attribute name "TYPE", the word string>token and the word
! (>>body-token).
: shared-tag-attrs ( -- )
    {
        "TYPE"
        string>token
        (>>body-token)
    } , ; inline
! Splits a delegate name at the first "::". When split1 yields a second
! half, the pair is { before after }. Otherwise the pair is the value of the
! rule-set variable followed by the whole string.
: parse-delegate ( string -- pair )
    "::" split1
    [ 2array ]
    [ rule-set get swap 2array ]
    if* ;
! Appends one attribute spec to the sequence being built by the enclosing
! `make`: the attribute name "DELEGATE", f in the middle position, and the
! word (>>delegate).
: delegate-attr ( -- )
    {
        "DELEGATE"
        f
        (>>delegate)
    } , ;
! NOTE(review): the header line of this definition is not visible in this
! listing; only its body is shown.
! Appends a spec array holding "HASH_CHAR", f and the word (>>chars) to the
! sequence being built by the enclosing `make`.
64 { "HASH_CHAR" f (>>chars) } , ;
! Appends one attribute spec to the sequence being built by the enclosing
! `make`: the attribute name "MATCH_TYPE", the word string>match-type and
! the word (>>match-token).
: match-type-attr ( -- )
    {
        "MATCH_TYPE"
        string>match-type
        (>>match-token)
    } , ;
! NOTE(review): the header line of this definition is not visible in this
! listing; only its body is shown.
! Appends three spec arrays to the sequence being built by the enclosing
! `make`, one each for NO_LINE_BREAK, NO_WORD_BREAK and NO_ESCAPE. Every
! spec names string>boolean and the setter word for the matching slot.
70 { "NO_LINE_BREAK" string>boolean (>>no-line-break?) } ,
71 { "NO_WORD_BREAK" string>boolean (>>no-word-break?) } ,
72 { "NO_ESCAPE" string>boolean (>>no-escape?) } , ;
! Appends a quotation to the sequence being built by the enclosing `make`.
! When called, the quotation runs parse-literal-matcher, stores the result
! in the `start` slot of the object beneath it, and drops that object.
: literal-start ( -- )
    [
        parse-literal-matcher
        >>start
        drop
    ] , ;
! NOTE(review): the header line of this definition is not visible in this
! listing; only its body is shown.
! Appends a quotation to the sequence being built by the enclosing `make`.
! When called, the quotation runs parse-regexp-matcher, stores the result in
! the `start` slot of the object beneath it, and drops that object.
78 [ parse-regexp-matcher >>start drop ] , ;
! NOTE(review): the header line of this definition is not visible in this
! listing; only its body is shown.
! Appends a quotation to the sequence being built by the enclosing `make`.
! When called, the quotation runs parse-literal-matcher, stores the result
! in the `end` slot of the object beneath it, and drops that object.
81 [ parse-literal-matcher >>end drop ] , ;
! Declares parse-begin/end-tag as a tag-dispatched word taking a rule and a
! tag; its cases are supplied by the TAG: definitions for this word.
84 TAGS: parse-begin/end-tag ( rule tag -- )
! BEGIN case of parse-begin/end-tag: builds a literal matcher from the tag,
! stores it in the rule's `start` slot, then drops the rule.
! NOTE(review): the embedded listing numbers skip 87; a line may be missing
! from this view - confirm against the original file.
86 TAG: BEGIN parse-begin/end-tag
88 parse-literal-matcher >>start drop ;
! END case of parse-begin/end-tag: builds a literal matcher from the tag,
! stores it in the rule's `end` slot, then drops the rule.
! NOTE(review): the embedded listing numbers skip 91; a line may be missing
! from this view - confirm against the original file.
90 TAG: END parse-begin/end-tag
92 parse-literal-matcher >>end drop ;
! NOTE(review): this definition is incomplete in this listing. The embedded
! numbers skip 95, and nothing after line 97 closes the word (no `;` is
! visible), so the surrounding structure must be confirmed against the
! original file.
94 : parse-begin/end-tags ( -- )
96 ! XXX: handle position attrs on span tag itself
! Calls parse-begin/end-tag once per child tag; `with` holds the value
! beneath the tag fixed as the first argument of every call.
97 children-tags [ parse-begin/end-tag ] with each
! Appends a quotation to the sequence being built by the enclosing `make`.
! When called, the quotation discards the top stack item and then runs
! init-span.
: init-span-tag ( -- )
    [
        drop
        init-span
    ] , ;
! Appends a quotation to the sequence being built by the enclosing `make`.
! When called, the quotation discards the top stack item and then runs
! init-eol-span.
: init-eol-span-tag ( -- )
    [
        drop
        init-eol-span
    ] , ;
! Records one keyword in keyword-map. The key is the tag's children>string
! text; the value is string>token applied to the tag's main>> slot.
: parse-keyword-tag ( tag keyword-map -- )
    [
        [ main>> string>token ]
        [ children>string ]
        bi
    ] dip
    set-at ;