Merge branch 'master' into regexp

author Daniel Ehrenberg <littledan@Macintosh-103.local>
Mon, 16 Feb 2009 02:42:45 +0000 (20:42 -0600)
committer Daniel Ehrenberg <littledan@Macintosh-103.local>
Mon, 16 Feb 2009 02:42:45 +0000 (20:42 -0600)
diff --git a/basis/ascii/ascii.factor b/basis/ascii/ascii.factor

index 193e847d2714ee868e2e195373a067557bcf6b89..bd1b86b2793347fcf56dfa1923b9b87a4184a508 100644 (file)
--- a/basis/ascii/ascii.factor
+++ b/basis/ascii/ascii.factor
@@ -10,7 +10,7 @@ IN: ascii
  : LETTER? ( ch -- ? ) CHAR: A CHAR: Z between? ; inline\r
  : digit? ( ch -- ? ) CHAR: 0 CHAR: 9 between? ; inline\r
  : printable? ( ch -- ? ) CHAR: \s CHAR: ~ between? ; inline\r
-: control? ( ch -- ? ) "\0\e\r\n\t\u000008\u00007f" member? ; inline\r
+: control? ( ch -- ? ) { [ 0 HEX: 1F between? ] [ HEX: 7F = ] } 1|| ; inline\r
  : quotable? ( ch -- ? ) { [ printable? ] [ "\"\\" member? not ] } 1&& ; inline\r
  : Letter? ( ch -- ? ) { [ letter? ] [ LETTER? ] } 1|| ; inline\r
  : alpha? ( ch -- ? ) { [ Letter? ] [ digit? ] } 1|| ; inline\r
@@ -20,4 +20,4 @@ IN: ascii
  : >upper ( str -- upper ) [ ch>upper ] map ;\r
  \r
  HINTS: >lower string ;\r
-HINTS: >upper string ;
-\ No newline at end of file
+HINTS: >upper string ;\r
diff --git a/basis/regexp/classes/classes.factor b/basis/regexp/classes/classes.factor

index 4a807fa51bbc0f815282c086e77d136517707b69..94d1b78d5954c4a3f1cc463efe31ec3987f1c0aa 100644 (file)
--- a/basis/regexp/classes/classes.factor
+++ b/basis/regexp/classes/classes.factor
@@ -1,7 +1,7 @@
  ! Copyright (C) 2008 Doug Coleman.
  ! See http://factorcode.org/license.txt for BSD license.
  USING: accessors kernel math math.order words regexp.utils
-unicode.categories combinators.short-circuit ;
+ascii unicode.categories combinators.short-circuit ;
  IN: regexp.classes
  
  SINGLETONS: any-char any-char-no-nl
@@ -64,7 +64,7 @@ M: non-newline-blank-class class-member? ( obj class -- ? )
      drop { [ blank? ] [ CHAR: \n = not ] } 1&& ;
  
  M: control-character-class class-member? ( obj class -- ? )
-    drop control-char? ;
+    drop control? ;
  
  M: hex-digit-class class-member? ( obj class -- ? )
      drop hex-digit? ;
diff --git a/basis/regexp/nfa/nfa.factor b/basis/regexp/nfa/nfa.factor

index 537c85c2d3b20acfd305a3903bab4b27a3a08667..44481454fcf885143ef6a2a429ef4ade95ddc6fe 100644 (file)
--- a/basis/regexp/nfa/nfa.factor
+++ b/basis/regexp/nfa/nfa.factor
@@ -183,15 +183,8 @@ M: character-class-range nfa-node ( node -- )
      ] if ;
  
  M: capture-group nfa-node ( node -- )
-    "capture-groups" feature-is-broken
-    eps literal-transition add-simple-entry
-    capture-group-on add-traversal-flag
-    term>> nfa-node
-    eps literal-transition add-simple-entry
-    capture-group-off add-traversal-flag
-    2 [ concatenate-nodes ] times ;
+    term>> nfa-node ;
  
-! xyzzy
  M: non-capture-group nfa-node ( node -- )
      term>> nfa-node ;
  
diff --git a/basis/regexp/regexp-tests.factor b/basis/regexp/regexp-tests.factor

index 1cd9a2392efc87e1646eb52b17ec24fda88b67e1..cc9b2cccf1b56be2cd6a6c8e1394e488b8de44f8 100644 (file)
--- a/basis/regexp/regexp-tests.factor
+++ b/basis/regexp/regexp-tests.factor
@@ -44,9 +44,9 @@ IN: regexp-tests
  ! Dotall mode -- when on, . matches newlines.
  ! Off by default.
  [ f ] [ "\n" "." <regexp> matches? ] unit-test
-[ t ] [ "\n" "(?s)." <regexp> matches? ] unit-test
+! [ t ] [ "\n" "(?s)." <regexp> matches? ] unit-test
  [ t ] [ "\n" R/ ./s matches? ] unit-test
-[ f ] [ "\n\n" "(?s).(?-s)." <regexp> matches? ] unit-test
+! [ f ] [ "\n\n" "(?s).(?-s)." <regexp> matches? ] unit-test
  
  [ f ] [ "" ".+" <regexp> matches? ] unit-test
  [ t ] [ "a" ".+" <regexp> matches? ] unit-test
@@ -76,8 +76,6 @@ IN: regexp-tests
  [ t ] [ "bar" "foo|bar" <regexp> matches? ] unit-test
  [ f ] [ "foobar" "foo|bar" <regexp> matches? ] unit-test
  
-/*
-! FIXME
  [ f ] [ "" "(a)" <regexp> matches? ] unit-test
  [ t ] [ "a" "(a)" <regexp> matches? ] unit-test
  [ f ] [ "aa" "(a)" <regexp> matches? ] unit-test
@@ -85,7 +83,6 @@ IN: regexp-tests
  
  [ f ] [ "aababaaabbac" "(a|b)+" <regexp> matches? ] unit-test
  [ t ] [ "ababaaabba" "(a|b)+" <regexp> matches? ] unit-test
-*/
  
  [ f ] [ "" "a{1}" <regexp> matches? ] unit-test
  [ t ] [ "a" "a{1}" <regexp> matches? ] unit-test
@@ -168,12 +165,9 @@ IN: regexp-tests
  [ f ] [ "0" "[^\\d]" <regexp> matches? ] unit-test
  [ t ] [ "a" "[^\\d]" <regexp> matches? ] unit-test
  
-/*
-! FIXME
  [ t ] [ "a" "[a-z]{1,}|[A-Z]{2,4}|b*|c|(f|g)*" <regexp> matches? ] unit-test
  [ t ] [ "a" "[a-z]{1,2}|[A-Z]{3,3}|b*|c|(f|g)*" <regexp> matches? ] unit-test
  [ t ] [ "a" "[a-z]{1,2}|[A-Z]{3,3}" <regexp> matches? ] unit-test
-*/
  
  [ t ] [ "1000" "\\d{4,6}" <regexp> matches? ] unit-test
  [ t ] [ "1000" "[0-9]{4,6}" <regexp> matches? ] unit-test
@@ -226,6 +220,7 @@ IN: regexp-tests
  [ t ] [ "c" R/ [A-Z]/i matches? ] unit-test
  [ f ] [ "3" R/ [A-Z]/i matches? ] unit-test
  
+/*
  [ t ] [ "a" "(?i)a" <regexp> matches? ] unit-test
  [ t ] [ "a" "(?i)a" <regexp> matches? ] unit-test
  [ t ] [ "A" "(?i)a" <regexp> matches? ] unit-test
@@ -235,6 +230,7 @@ IN: regexp-tests
  [ t ] [ "a" R/ (?-i)a/i matches? ] unit-test
  [ f ] [ "A" R/ (?-i)a/i matches? ] unit-test
  [ f ] [ "A" R/ (?-i)a/i matches? ] unit-test
+*/
  
  [ f ] [ "A" "[a-z]" <regexp> matches? ] unit-test
  [ t ] [ "A" R/ [a-z]/i matches? ] unit-test
@@ -253,8 +249,6 @@ IN: regexp-tests
  [ t ] [ "abc*" "[^\\*]*\\*" <regexp> matches? ] unit-test
  [ t ] [ "bca" "[^a]*a" <regexp> matches? ] unit-test
  
-/*
-! FIXME
  [ ] [
      "(0[lL]?|[1-9]\\d{0,9}(\\d{0,9}[lL])?|0[xX]\\p{XDigit}{1,8}(\\p{XDigit}{0,8}[lL])?|0[0-7]{1,11}([0-7]{0,11}[lL])?|([0-9]+\\.[0-9]*|\\.[0-9]+)([eE][+-]?[0-9]+)?[fFdD]?|[0-9]+([eE][+-]?[0-9]+[fFdD]?|([eE][+-]?[0-9]+)?[fFdD]))"
      <regexp> drop
@@ -278,7 +272,6 @@ IN: regexp-tests
  [ "abc" ] [ "abc" "(ab|a)(bc)?" <regexp> first-match >string ] unit-test
  
  [ "b" ] [ "aaaaaaaaaaaaaaaaaaaaaaab" "((a*)*b)*b" <regexp> first-match >string ] unit-test
-*/
  
  ! [ t ] [ "a:b" ".+:?" <regexp> matches? ] unit-test
  
@@ -309,7 +302,6 @@ IN: regexp-tests
  [ "-- title --" ] [ "== title ==" R/ =/ "-" re-replace ] unit-test
  
  /*
-! FIXME
  [ f ] [ "ab" "a(?!b)" <regexp> first-match ] unit-test
  [ "a" ] [ "ac" "a(?!b)" <regexp> first-match >string ] unit-test
  [ t ] [ "fxxbar" "(?!foo).{3}bar" <regexp> matches? ] unit-test
diff --git a/basis/regexp/transition-tables/transition-tables.factor b/basis/regexp/transition-tables/transition-tables.factor

index e5c31a54e0e40f4260e439030410069e36b99bc2..64d5cdb2449467a5207ca00870e82582bd44475f 100644 (file)
--- a/basis/regexp/transition-tables/transition-tables.factor
+++ b/basis/regexp/transition-tables/transition-tables.factor
@@ -41,8 +41,8 @@ TUPLE: transition-table transitions start-state final-states ;
      #! set the state as a key
      2dup [ to>> ] dip maybe-initialize-key
      [ [ to>> ] [ obj>> ] [ from>> ] tri ] dip
-    2dup at* [ 2nip insert-at ]
-    [ drop [ H{ } clone [ insert-at ] keep ] 2dip set-at ] if ;
+    2dup at* [ 2nip push-at ]
+    [ drop [ H{ } clone [ push-at ] keep ] 2dip set-at ] if ;
  
  : add-transition ( transition transition-table -- )
      transitions>> set-transition ;
diff --git a/basis/regexp/traversal/traversal.factor b/basis/regexp/traversal/traversal.factor

index 104a6c2ce1c2159445e2ba8175d55520e5e295b1..d0a76a6ddcaf015c1bd751296af6350f3a1736f9 100644 (file)
--- a/basis/regexp/traversal/traversal.factor
+++ b/basis/regexp/traversal/traversal.factor
@@ -7,34 +7,20 @@ IN: regexp.traversal
  
  TUPLE: dfa-traverser
      dfa-table
-    traversal-flags
-    traverse-forward
-    lookahead-counters
-    lookbehind-counters
-    capture-counters
-    captured-groups
-    capture-group-index
-    last-state current-state
+    current-state
      text
      match-failed?
      start-index current-index
      matches ;
  
  : <dfa-traverser> ( text regexp -- match )
-    [ dfa-table>> ] [ dfa-traversal-flags>> ] bi
+    dfa-table>>
      dfa-traverser new
-        swap >>traversal-flags
          swap [ start-state>> >>current-state ] [ >>dfa-table ] bi
          swap >>text
-        t >>traverse-forward
          0 >>start-index
          0 >>current-index
-        0 >>capture-group-index
-        V{ } clone >>matches
-        V{ } clone >>capture-counters
-        V{ } clone >>lookbehind-counters
-        V{ } clone >>lookahead-counters
-        H{ } clone >>captured-groups ;
+        V{ } clone >>matches ;
  
  : final-state? ( dfa-traverser -- ? )
      [ current-state>> ]
@@ -61,111 +47,28 @@ TUPLE: dfa-traverser
          dup save-final-state
      ] when text-finished? ;
  
+: text-character ( dfa-traverser n -- ch )
+    [ text>> ] swap '[ current-index>> _ + ] bi nth ;
+
  : previous-text-character ( dfa-traverser -- ch )
-    [ text>> ] [ current-index>> 1- ] bi nth ;
+    -1 text-character ;
  
  : current-text-character ( dfa-traverser -- ch )
-    [ text>> ] [ current-index>> ] bi nth ;
+    0 text-character ;
  
  : next-text-character ( dfa-traverser -- ch )
-    [ text>> ] [ current-index>> 1+ ] bi nth ;
-
-GENERIC: flag-action ( dfa-traverser flag -- )
-
-
-M: beginning-of-input flag-action ( dfa-traverser flag -- )
-    drop
-    dup beginning-of-text? [ t >>match-failed? ] unless drop ;
-
-M: end-of-input flag-action ( dfa-traverser flag -- )
-    drop
-    dup end-of-text? [ t >>match-failed? ] unless drop ;
-
-
-M: beginning-of-line flag-action ( dfa-traverser flag -- )
-    drop
-    dup {
-        [ beginning-of-text? ]
-        [ previous-text-character terminator-class class-member? ]
-    } 1|| [ t >>match-failed? ] unless drop ;
-
-M: end-of-line flag-action ( dfa-traverser flag -- )
-    drop
-    dup {
-        [ end-of-text? ]
-        [ next-text-character terminator-class class-member? ]
-    } 1|| [ t >>match-failed? ] unless drop ;
-
-
-M: word-boundary flag-action ( dfa-traverser flag -- )
-    drop
-    dup {
-        [ end-of-text? ]
-        [ current-text-character terminator-class class-member? ]
-    } 1|| [ t >>match-failed? ] unless drop ;
-
-
-M: lookahead-on flag-action ( dfa-traverser flag -- )
-    drop
-    lookahead-counters>> 0 swap push ;
-
-M: lookahead-off flag-action ( dfa-traverser flag -- )
-    drop
-    dup lookahead-counters>>
-    [ drop ] [ pop '[ _ - ] change-current-index drop ] if-empty ;
-
-M: lookbehind-on flag-action ( dfa-traverser flag -- )
-    drop
-    f >>traverse-forward
-    [ 2 - ] change-current-index
-    lookbehind-counters>> 0 swap push ;
-
-M: lookbehind-off flag-action ( dfa-traverser flag -- )
-    drop
-    t >>traverse-forward
-    dup lookbehind-counters>>
-    [ drop ] [ pop '[ _ + 2 + ] change-current-index drop ] if-empty ;
-
-M: capture-group-on flag-action ( dfa-traverser flag -- )
-    drop
-    [ current-index>> 0 2array ]
-    [ capture-counters>> ] bi push ;
-
-M: capture-group-off flag-action ( dfa-traverser flag -- )
-    drop
-    dup capture-counters>> empty? [
-        drop
-    ] [
-        {
-            [ capture-counters>> pop first2 dupd + ]
-            [ text>> <slice> ]
-            [ [ 1+ ] change-capture-group-index capture-group-index>> ]
-            [ captured-groups>> set-at ]
-        } cleave
-    ] if ;
-
-: process-flags ( dfa-traverser -- )
-    [ [ 1+ ] map ] change-lookahead-counters
-    [ [ 1+ ] map ] change-lookbehind-counters
-    [ [ first2 1+ 2array ] map ] change-capture-counters
-    ! dup current-state>> .
-    dup [ current-state>> ] [ traversal-flags>> ] bi
-    at [ flag-action ] with each ;
+    1 text-character ;
  
  : increment-state ( dfa-traverser state -- dfa-traverser )
-    [
-        dup traverse-forward>>
-        [ [ 1+ ] change-current-index ]
-        [ [ 1- ] change-current-index ] if
-        dup current-state>> >>last-state
-    ] [ first ] bi* >>current-state ;
+    [ [ 1 + ] change-current-index ]
+    [ first ] bi* >>current-state ;
  
  : match-literal ( transition from-state table -- to-state/f )
      transitions>> at at ;
  
  : match-class ( transition from-state table -- to-state/f )
      transitions>> at* [
-        [ drop class-member? ] assoc-with assoc-find [ nip ] [ drop ] if
+        '[ drop _ swap class-member? ] assoc-find [ nip ] [ drop ] if
      ] [ drop ] if ;
  
  : match-default ( transition from-state table -- to-state/f )
@@ -180,7 +83,6 @@ M: capture-group-off flag-action ( dfa-traverser flag -- )
      [ dfa-table>> ] tri ;
  
  : do-match ( dfa-traverser -- dfa-traverser )
-    dup process-flags
      dup match-done? [
          dup setup-match match-transition
          [ increment-state do-match ] when*
diff --git a/basis/regexp/utils/utils.factor b/basis/regexp/utils/utils.factor

index af1b2fa1fb0eb25dd1bbec644f07a48680853f60..d1266a6d98a54fdc4154b604775db87a13c2e957 100644 (file)
--- a/basis/regexp/utils/utils.factor
+++ b/basis/regexp/utils/utils.factor
@@ -12,47 +12,25 @@ IN: regexp.utils
  : while-changes ( obj quot pred -- obj' )
      pick over call (while-changes) ; inline
  
-: assoc-with ( param assoc quot -- assoc curry )
-    swapd [ [ -rot ] dip call ] 2curry ; inline
-
-: insert-at ( value key hash -- )
-    2dup at* [
-        2nip push
-    ] [
-        drop
-        [ dup vector? [ 1vector ] unless ] 2dip set-at
-    ] if ;
-
-: ?insert-at ( value key hash/f -- hash )
-    [ H{ } clone ] unless* [ insert-at ] keep ;
-
  ERROR: bad-octal number ;
  ERROR: bad-hex number ;
  : check-octal ( octal -- octal ) dup 255 > [ bad-octal ] when ;
  : check-hex ( hex -- hex ) dup number? [ bad-hex ] unless ;
  
-: ascii? ( n -- ? ) 0 HEX: 7f between? ;
-: octal-digit? ( n -- ? ) CHAR: 0 CHAR: 7 between? ;
  : decimal-digit? ( n -- ? ) CHAR: 0 CHAR: 9 between? ;
  
  : hex-digit? ( n -- ? )
-    [
+    {
          [ decimal-digit? ]
          [ CHAR: a CHAR: f between? ]
          [ CHAR: A CHAR: F between? ]
-    ] 1|| ;
-
-: control-char? ( n -- ? )
-    [
-        [ 0 HEX: 1f between? ]
-        [ HEX: 7f = ]
-    ] 1|| ;
+    } 1|| ;
  
  : punct? ( n -- ? )
      "!\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~" member? ;
  
  : c-identifier-char? ( ch -- ? )
-    [ [ alpha? ] [ CHAR: _ = ] ] 1|| ;
+    { [ alpha? ] [ CHAR: _ = ] } 1|| ;
  
  : java-blank? ( n -- ? )
      {
diff --git a/basis/xmode/catalog/catalog.factor b/basis/xmode/catalog/catalog.factor

index 4e3af0af5613998deb548a265993a7f86881521c..b08e47ddc56e96b6e138c2bc1b547fe20dfb9aa9 100644 (file)
--- a/basis/xmode/catalog/catalog.factor
+++ b/basis/xmode/catalog/catalog.factor
@@ -1,13 +1,14 @@
  USING: xmode.loader xmode.utilities xmode.rules namespaces
  strings splitting assocs sequences kernel io.files xml memoize
-words globs combinators io.encodings.utf8 sorting accessors xml.data ;
+words globs combinators io.encodings.utf8 sorting accessors xml.data
+xml.traversal xml.syntax ;
  IN: xmode.catalog
  
  TUPLE: mode file file-name-glob first-line-glob ;
  
-<TAGS: parse-mode-tag ( modes tag -- )
+TAGS: parse-mode-tag ( modes tag -- )
  
-TAG: MODE
+TAG: MODE parse-mode-tag
      dup "NAME" attr [
          mode new {
              { "FILE" f (>>file) }
@@ -17,11 +18,9 @@ TAG: MODE
      ] dip
      rot set-at ;
  
-TAGS>
-
  : parse-modes-tag ( tag -- modes )
      H{ } clone [
-        swap child-tags [ parse-mode-tag ] with each
+        swap children-tags [ parse-mode-tag ] with each
      ] keep ;
  
  MEMO: modes ( -- modes )
@@ -98,8 +97,8 @@ ERROR: mutually-recursive-rulesets ruleset ;
      ] if ;
  
  : finalize-mode ( rulesets -- )
-    rule-sets [
-        dup [ nip finalize-rule-set ] assoc-each
+    dup rule-sets [
+        [ nip finalize-rule-set ] assoc-each
      ] with-variable ;
  
  : load-mode ( name -- rule-sets )
diff --git a/basis/xmode/loader/loader.factor b/basis/xmode/loader/loader.factor

index 70466913a09b8213eba7ba9a09c000b8df5801c9..d6f3943e145627c452ceb76a16e459ce0d033ee4 100644 (file)
--- a/basis/xmode/loader/loader.factor
+++ b/basis/xmode/loader/loader.factor
@@ -1,56 +1,54 @@
  USING: xmode.loader.syntax xmode.tokens xmode.rules
  xmode.keyword-map xml.data xml.traversal xml assocs kernel
  combinators sequences math.parser namespaces parser
-xmode.utilities parser-combinators.regexp io.files accessors ;
+xmode.utilities regexp io.files accessors xml.syntax ;
  IN: xmode.loader
  
  ! Based on org.gjt.sp.jedit.XModeHandler
  
  ! RULES and its children
-<TAGS: parse-rule-tag ( rule-set tag -- )
+TAGS: parse-rule-tag ( rule-set tag -- )
  
-TAG: PROPS
+TAG: PROPS parse-rule-tag
      parse-props-tag >>props drop ;
  
-TAG: IMPORT
+TAG: IMPORT parse-rule-tag
      "DELEGATE" attr swap import-rule-set ;
  
-TAG: TERMINATE
+TAG: TERMINATE parse-rule-tag
      "AT_CHAR" attr string>number >>terminate-char drop ;
  
-RULE: SEQ seq-rule
+RULE: SEQ seq-rule parse-rule-tag
      shared-tag-attrs delegate-attr literal-start ;
  
-RULE: SEQ_REGEXP seq-rule
+RULE: SEQ_REGEXP seq-rule parse-rule-tag
      shared-tag-attrs delegate-attr regexp-attr regexp-start ;
  
-RULE: SPAN span-rule
+RULE: SPAN span-rule parse-rule-tag
      shared-tag-attrs delegate-attr match-type-attr span-attrs parse-begin/end-tags init-span-tag ;
  
-RULE: SPAN_REGEXP span-rule
+RULE: SPAN_REGEXP span-rule parse-rule-tag
      shared-tag-attrs delegate-attr match-type-attr span-attrs regexp-attr parse-begin/end-tags init-span-tag ;
  
-RULE: EOL_SPAN eol-span-rule
+RULE: EOL_SPAN eol-span-rule parse-rule-tag
      shared-tag-attrs delegate-attr match-type-attr literal-start init-eol-span-tag ;
  
-RULE: EOL_SPAN_REGEXP eol-span-rule
+RULE: EOL_SPAN_REGEXP eol-span-rule parse-rule-tag
      shared-tag-attrs delegate-attr match-type-attr regexp-attr regexp-start init-eol-span-tag ;
  
-RULE: MARK_FOLLOWING mark-following-rule
+RULE: MARK_FOLLOWING mark-following-rule parse-rule-tag
      shared-tag-attrs match-type-attr literal-start ;
  
-RULE: MARK_PREVIOUS mark-previous-rule
+RULE: MARK_PREVIOUS mark-previous-rule parse-rule-tag
      shared-tag-attrs match-type-attr literal-start ;
  
-TAG: KEYWORDS ( rule-set tag -- key value )
+TAG: KEYWORDS parse-rule-tag
      rule-set get ignore-case?>> <keyword-map>
-    swap child-tags [ over parse-keyword-tag ] each
+    swap children-tags [ over parse-keyword-tag ] each
      swap (>>keywords) ;
  
-TAGS>
-
  : ?<regexp> ( string/f -- regexp/f )
-    dup [ rule-set get ignore-case?>> <regexp> ] when ;
+    dup [ rule-set get ignore-case?>> <?insensitive-regexp> ] when ;
  
  : (parse-rules-tag) ( tag -- rule-set )
      <rule-set> dup rule-set set
@@ -66,7 +64,7 @@ TAGS>
  
  : parse-rules-tag ( tag -- rule-set )
      [
-        [ (parse-rules-tag) ] [ child-tags ] bi
+        [ (parse-rules-tag) ] [ children-tags ] bi
          [ parse-rule-tag ] with each
          rule-set get
      ] with-scope ;
diff --git a/basis/xmode/loader/syntax/syntax.factor b/basis/xmode/loader/syntax/syntax.factor

index 0e7293da976f54d16fe4222a658580a736cbe570..60318e669e7fea9cffb97649a07d07c21a2236d7 100644 (file)
--- a/basis/xmode/loader/syntax/syntax.factor
+++ b/basis/xmode/loader/syntax/syntax.factor
@@ -3,7 +3,7 @@
  USING: accessors xmode.tokens xmode.rules xmode.keyword-map
  xml.data xml.traversal xml assocs kernel combinators sequences
  math.parser namespaces make parser lexer xmode.utilities
-parser-combinators.regexp io.files splitting arrays ;
+regexp io.files splitting arrays xml.syntax xml.syntax.private ;
  IN: xmode.loader.syntax
  
  ! Rule tag parsing utilities
@@ -11,9 +11,10 @@ IN: xmode.loader.syntax
      new swap init-from-tag swap add-rule ; inline
  
  : RULE:
-    scan scan-word
-    parse-definition { } make
-    swap [ (parse-rule-tag) ] 2curry (TAG:) ; parsing
+    scan scan-word scan-word [
+        parse-definition { } make
+        swap [ (parse-rule-tag) ] 2curry
+    ] dip swap define-tag ; parsing
  
  ! Attribute utilities
  : string>boolean ( string -- ? ) "TRUE" = ;
@@ -32,7 +33,7 @@ IN: xmode.loader.syntax
      [ "NAME" attr ] [ "VALUE" attr ] bi ;
  
  : parse-props-tag ( tag -- assoc )
-    child-tags
+    children-tags
      [ parse-prop-tag ] H{ } map>assoc ;
  
  : position-attrs ( tag -- at-line-start? at-whitespace-end? at-word-start? )
@@ -46,7 +47,8 @@ IN: xmode.loader.syntax
      swap position-attrs <matcher> ;
  
  : parse-regexp-matcher ( tag -- matcher )
-    dup children>string rule-set get ignore-case?>> <regexp>
+    dup children>string
+    rule-set get ignore-case?>> <?insensitive-regexp>
      swap position-attrs <matcher> ;
  
  : shared-tag-attrs ( -- )
@@ -79,22 +81,20 @@ IN: xmode.loader.syntax
      [ parse-literal-matcher >>end drop ] , ;
  
  ! SPAN's children
-<TAGS: parse-begin/end-tag ( rule tag -- )
+TAGS: parse-begin/end-tag ( rule tag -- )
  
-TAG: BEGIN
+TAG: BEGIN parse-begin/end-tag
      ! XXX
      parse-literal-matcher >>start drop ;
  
-TAG: END
+TAG: END parse-begin/end-tag
      ! XXX
      parse-literal-matcher >>end drop ;
  
-TAGS>
-
  : parse-begin/end-tags ( -- )
      [
          ! XXX: handle position attrs on span tag itself
-        child-tags [ parse-begin/end-tag ] with each
+        children-tags [ parse-begin/end-tag ] with each
      ] , ;
  
  : init-span-tag ( -- ) [ drop init-span ] , ;
diff --git a/basis/xmode/marker/marker.factor b/basis/xmode/marker/marker.factor

index cff0af2a981ed41c7cff5f2a8e6d8dc8585c5cb3..e106af79526eb2209de8a46fe9cbeb419df22c04 100755 (executable)
--- a/basis/xmode/marker/marker.factor
+++ b/basis/xmode/marker/marker.factor
@@ -4,8 +4,24 @@ IN: xmode.marker
  USING: kernel namespaces make xmode.rules xmode.tokens
  xmode.marker.state xmode.marker.context xmode.utilities
  xmode.catalog sequences math assocs combinators strings
-parser-combinators.regexp splitting parser-combinators ascii
+regexp splitting ascii regexp.backend unicode.case
  ascii combinators.short-circuit accessors ;
+! regexp.backend is for the regexp class
+
+! Next two words copied from parser-combinators
+! Just like head?, but they optionally ignore case
+
+: string= ( str1 str2 ignore-case -- ? )
+    [ [ >upper ] bi@ ] when sequence= ;
+
+: string-head? ( str1 str2 ignore-case -- ? )
+    2over shorter?
+    [ 3drop f ] [
+        [
+            [ nip ]
+            [ length head-slice ] 2bi
+        ] dip string=
+    ] if ;
  
  ! Based on org.gjt.sp.jedit.syntax.TokenMarker
  
@@ -150,7 +166,7 @@ M: escape-rule handle-rule-start
      process-escape? get [
          escaped? [ not ] change
          position [ + ] change
-    ] [ 2drop ] if ;
+    ] [ drop ] if ;
  
  M: seq-rule handle-rule-start
      ?end-rule
diff --git a/basis/xmode/rules/rules.factor b/basis/xmode/rules/rules.factor

index adc43d7bb6b6364521eb220c564af61dfbcd6436..99364fe7cd605808e74a0815b10149c2870db86e 100644 (file)
--- a/basis/xmode/rules/rules.factor
+++ b/basis/xmode/rules/rules.factor
@@ -1,6 +1,6 @@
  USING: accessors xmode.tokens xmode.keyword-map kernel
  sequences vectors assocs strings memoize unicode.case
-parser-combinators.regexp ;
+regexp regexp.backend ; ! regexp.backend has the regexp class
  IN: xmode.rules
  
  TUPLE: string-matcher string ignore-case? ;
diff --git a/basis/xmode/utilities/utilities-tests.factor b/basis/xmode/utilities/utilities-tests.factor

index 45238ca2b18bcf1e0688b52f21c88f9b1211873a..0ef221f23732e44d69fde9a44ddd316f5c9d1015 100644 (file)
--- a/basis/xmode/utilities/utilities-tests.factor
+++ b/basis/xmode/utilities/utilities-tests.factor
@@ -1,7 +1,6 @@
+USING: assocs xmode.utilities tools.test ;
  IN: xmode.utilities.tests
-USING: accessors xmode.utilities tools.test xml xml.data kernel
-strings vectors sequences io.files prettyprint assocs
-unicode.case ;
+
  [ "hi" 3 ] [
      { 1 2 3 4 5 6 7 8 } [ H{ { 3 "hi" } } at ] map-find
  ] unit-test
@@ -9,44 +8,3 @@ unicode.case ;
  [ f f ] [
      { 1 2 3 4 5 6 7 8 } [ H{ { 11 "hi" } } at ] map-find
  ] unit-test
-
-TUPLE: company employees type ;
-
-: <company> V{ } clone f company boa ;
-
-: add-employee employees>> push ;
-
-<TAGS: parse-employee-tag
-
-TUPLE: employee name description ;
-
-TAG: employee
-    employee new
-    { { "name" f (>>name) } { f (>>description) } }
-    init-from-tag swap add-employee ;
-
-TAGS>
-
-\ parse-employee-tag see
-
-: parse-company-tag
-    [
-        <company>
-        { { "type" >upper (>>type) } }
-        init-from-tag dup
-    ] keep
-    children>> [ tag? ] filter
-    [ parse-employee-tag ] with each ;
-
-[
-    T{ company f
-        V{
-            T{ employee f "Joe" "VP Sales" }
-            T{ employee f "Jane" "CFO" }
-        }
-        "PUBLIC"
-    }
-] [
-    "resource:basis/xmode/utilities/test.xml"
-    file>xml parse-company-tag
-] unit-test
diff --git a/basis/xmode/utilities/utilities.factor b/basis/xmode/utilities/utilities.factor

index 2423fb0d861cbff37d0e8041a4436157747b8600..1b2b4a352ffede5c44296ae15e3f370b1f3bd4c7 100644 (file)
--- a/basis/xmode/utilities/utilities.factor
+++ b/basis/xmode/utilities/utilities.factor
@@ -1,11 +1,10 @@
  USING: accessors sequences assocs kernel quotations namespaces
-xml.data xml.traversal combinators macros parser lexer words fry ;
+xml.data xml.traversal combinators macros parser lexer words fry
+regexp ;
  IN: xmode.utilities
  
  : implies ( x y -- z ) [ not ] dip or ; inline
  
-: child-tags ( tag -- seq ) children>> [ tag? ] filter ;
-
  : map-find ( seq quot -- result elt )
      [ f ] 2dip
      '[ nip @ dup ] find
@@ -38,20 +37,5 @@ MACRO: (init-from-tag) ( specs -- )
  : init-from-tag ( tag tuple specs -- tuple )
      over [ (init-from-tag) ] dip ; inline
  
-SYMBOL: tag-handlers
-SYMBOL: tag-handler-word
-
-: <TAGS:
-    CREATE tag-handler-word set
-    H{ } clone tag-handlers set ; parsing
-
-: (TAG:) ( name quot -- ) swap tag-handlers get set-at ;
-
-: TAG:
-    scan parse-definition
-    (TAG:) ; parsing
-
-: TAGS>
-    tag-handler-word get
-    tag-handlers get >alist [ [ dup main>> ] dip case ] curry
-    define ; parsing
+: <?insensitive-regexp> ( string ? -- regexp )
+    "i" "" ? <optioned-regexp> ;
author	Daniel Ehrenberg <littledan@Macintosh-103.local>
	Mon, 16 Feb 2009 02:42:45 +0000 (20:42 -0600)
committer	Daniel Ehrenberg <littledan@Macintosh-103.local>
	Mon, 16 Feb 2009 02:42:45 +0000 (20:42 -0600)
basis/ascii/ascii.factor		patch | blob | history
basis/regexp/classes/classes.factor		patch | blob | history
basis/regexp/nfa/nfa.factor		patch | blob | history
basis/regexp/regexp-tests.factor		patch | blob | history
basis/regexp/transition-tables/transition-tables.factor		patch | blob | history
basis/regexp/traversal/traversal.factor		patch | blob | history
basis/regexp/utils/utils.factor		patch | blob | history
basis/xmode/catalog/catalog.factor		patch | blob | history
basis/xmode/loader/loader.factor		patch | blob | history
basis/xmode/loader/syntax/syntax.factor		patch | blob | history
basis/xmode/marker/marker.factor		patch | blob | history
basis/xmode/rules/rules.factor		patch | blob | history
basis/xmode/utilities/utilities-tests.factor		patch | blob | history
basis/xmode/utilities/utilities.factor		patch | blob | history