Fixing HTML dependency on state-parser

author Daniel Ehrenberg <littledan@Macintosh-103.local>

Thu, 22 Jan 2009 03:57:44 +0000 (21:57 -0600)

committer Daniel Ehrenberg <littledan@Macintosh-103.local>

Thu, 22 Jan 2009 03:57:44 +0000 (21:57 -0600)
author Daniel Ehrenberg <littledan@Macintosh-103.local>
Thu, 22 Jan 2009 03:57:44 +0000 (21:57 -0600)
committer Daniel Ehrenberg <littledan@Macintosh-103.local>
Thu, 22 Jan 2009 03:57:44 +0000 (21:57 -0600)
diff --git a/extra/html/parser/parser.factor b/extra/html/parser/parser.factor

index 836693026a41da1152f6851da2b6f79ca5c9376d..c445b708c5859bf73e2ad6bf6f317f7f2ca3608f 100644 (file)
--- a/extra/html/parser/parser.factor
+++ b/extra/html/parser/parser.factor
@@ -2,7 +2,7 @@
  ! See http://factorcode.org/license.txt for BSD license.
  USING: accessors arrays html.parser.utils hashtables io kernel
  namespaces make prettyprint quotations sequences splitting
-state-parser strings unicode.categories unicode.case ;
+html.parser.state strings unicode.categories unicode.case ;
  IN: html.parser
  
  TUPLE: tag name attributes text closing? ;
@@ -59,8 +59,8 @@ SYMBOL: tagstack
      [ get-char CHAR: " = ] take-until ;
  
  : read-quote ( -- string )
-    get-char next* CHAR: ' =
-    [ read-single-quote ] [ read-double-quote ] if next* ;
+    get-char next CHAR: ' =
+    [ read-single-quote ] [ read-double-quote ] if next ;
  
  : read-key ( -- string )
      read-whitespace*
@@ -68,7 +68,7 @@ SYMBOL: tagstack
  
  : read-= ( -- )
      read-whitespace*
-    [ get-char CHAR: = = ] take-until drop next* ;
+    [ get-char CHAR: = = ] take-until drop next ;
  
  : read-value ( -- string )
      read-whitespace*
@@ -76,14 +76,14 @@ SYMBOL: tagstack
      [ blank? ] trim ;
  
  : read-comment ( -- )
-    "-->" take-string* make-comment-tag push-tag ;
+    "-->" take-string make-comment-tag push-tag ;
  
  : read-dtd ( -- )
-    ">" take-string* make-dtd-tag push-tag ;
+    ">" take-string make-dtd-tag push-tag ;
  
  : read-bang ( -- )
-    next* get-char CHAR: - = get-next CHAR: - = and [
-        next* next*
+    next get-char CHAR: - = get-next CHAR: - = and [
+        next next
          read-comment
      ] [
          read-dtd
@@ -91,10 +91,10 @@ SYMBOL: tagstack
  
  : read-tag ( -- string )
      [ get-char CHAR: > = get-char CHAR: < = or ] take-until
-    get-char CHAR: < = [ next* ] unless ;
+    get-char CHAR: < = [ next ] unless ;
  
  : read-< ( -- string )
-    next* get-char CHAR: ! = [
+    next get-char CHAR: ! = [
          read-bang f
      ] [
          read-tag
diff --git a/extra/html/parser/state/state-tests.factor b/extra/html/parser/state/state-tests.factor

new file mode 100644 (file)

index 0000000..a9be38c
--- /dev/null
+++ b/extra/html/parser/state/state-tests.factor
@@ -0,0 +1,13 @@
+USING: tools.test html.parser.state ascii kernel ;
+IN: html.parser.state.tests
+
+: take-rest ( -- string )
+    [ f ] take-until ;
+
+: take-char ( ch -- string ) ! consume input up to, but not including, ch
+    [ get-char = ] curry take-until ;
+
+[ "hello" ] [ "hello" [ take-rest ] string-parse ] unit-test
+[ "hi" " how are you?" ] [ "hi how are you?" [ [ get-char blank? ] take-until take-rest ] string-parse ] unit-test
+[ "foo" ";bar" ] [ "foo;bar" [ CHAR: ; take-char take-rest ] string-parse ] unit-test
+! [ "foo " " bar" ] [ "foo and bar" [ "and" take-string take-rest ] string-parse ] unit-test
diff --git a/extra/html/parser/state/state.factor b/extra/html/parser/state/state.factor

new file mode 100644 (file)

index 0000000..4b1027d
--- /dev/null
+++ b/extra/html/parser/state/state.factor
@@ -0,0 +1,41 @@
+! Copyright (C) 2005, 2009 Daniel Ehrenberg
+! See http://factorcode.org/license.txt for BSD license.
+USING: namespaces math kernel sequences accessors fry circular ;
+IN: html.parser.state
+
+TUPLE: state string i ;
+
+: get-i ( -- i ) state get i>> ;
+
+: get-char ( -- char )
+    state get [ i>> ] [ string>> ] bi ?nth ;
+
+: get-next ( -- char )
+    state get [ i>> 1+ ] [ string>> ] bi ?nth ;
+
+: next ( -- )
+    state get [ 1+ ] change-i drop ;
+
+: string-parse ( string quot -- )
+    [ 0 state boa state ] dip with-variable ;
+
+: short* ( n seq -- n' seq )
+    over [ nip dup length swap ] unless ;
+
+: skip-until ( quot: ( -- ? ) -- )
+    get-char [
+        [ call ] keep swap
+        [ drop ] [ next skip-until ] if
+    ] [ drop ] if ; inline recursive
+
+: take-until ( quot: ( -- ? ) -- string )
+    [ get-i ] dip skip-until get-i ! start index, advance while quot is false, end index
+    state get string>> subseq ; ! the text consumed between those two indices
+
+: string-matches? ( string circular -- ? )
+    get-char over push-circular sequence= ;
+
+: take-string ( match -- string )
+    dup length <circular-string>
+    [ 2dup string-matches? ] take-until nip
+    dup length rot length 1- - head next ;
diff --git a/extra/html/parser/utils/utils-tests.factor b/extra/html/parser/utils/utils-tests.factor

index 4b25db16fd860a3e1c578d099f32e8fb3239af76..6d8e3bc05f07128f9c288fd3247ecd74ef30d905 100644 (file)
--- a/extra/html/parser/utils/utils-tests.factor
+++ b/extra/html/parser/utils/utils-tests.factor
@@ -1,7 +1,7 @@
  USING: assocs combinators continuations hashtables
  hashtables.private io kernel math
  namespaces prettyprint quotations sequences splitting
-state-parser strings tools.test ;
+strings tools.test ;
  USING: html.parser.utils ;
  IN: html.parser.utils.tests
  
diff --git a/extra/html/parser/utils/utils.factor b/extra/html/parser/utils/utils.factor

index c2a9d73af89de917a2335c59807d6354ee8069d3..c913b9d306cebd77db6e8785706300fb7063b73e 100644 (file)
--- a/extra/html/parser/utils/utils.factor
+++ b/extra/html/parser/utils/utils.factor
@@ -2,17 +2,12 @@
  ! See http://factorcode.org/license.txt for BSD license.
  USING: assocs circular combinators continuations hashtables
  hashtables.private io kernel math namespaces prettyprint
-quotations sequences splitting state-parser strings
+quotations sequences splitting html.parser.state strings
  combinators.short-circuit ;
  IN: html.parser.utils
  
  : string-parse-end? ( -- ? ) get-next not ;
  
-: take-string* ( match -- string )
-    dup length <circular-string>
-    [ 2dup string-matches? ] take-until nip
-    dup length rot length 1- - head next* ;
-
  : trim1 ( seq ch -- newseq )
      [ [ ?head-slice drop ] [ ?tail-slice drop ] bi ] 2keep drop like ;
author	Daniel Ehrenberg <littledan@Macintosh-103.local>
	Thu, 22 Jan 2009 03:57:44 +0000 (21:57 -0600)
committer	Daniel Ehrenberg <littledan@Macintosh-103.local>
	Thu, 22 Jan 2009 03:57:44 +0000 (21:57 -0600)
extra/html/parser/parser.factor		patch \| blob \| history
extra/html/parser/state/state-tests.factor	[new file with mode: 0644]	patch \| blob
extra/html/parser/state/state.factor	[new file with mode: 0644]	patch \| blob
extra/html/parser/utils/utils-tests.factor		patch \| blob \| history
extra/html/parser/utils/utils.factor		patch \| blob \| history