(parse-c-type) dup valid-c-type? [ no-c-type ] unless ;
: scan-c-type ( -- c-type )
- scan {
+ scan-token {
{ [ dup "{" = ] [ drop \ } parse-until >array ] }
{ [ dup "pointer:" = ] [ drop scan-c-type <pointer> ] }
[ parse-c-type ]
(FUNCTION:) make-function define-declared ;
SYNTAX: FUNCTION-ALIAS:
- scan create-function
+ scan-token create-function
(FUNCTION:) (make-function) define-declared ;
SYNTAX: CALLBACK:
scan scan-c-type \ } parse-until <struct-slot-spec> ;
: parse-struct-slots ( slots -- slots' more? )
- scan {
+ scan-token {
{ ";" [ f ] }
{ "{" [ parse-struct-slot suffix! t ] }
- { f [ unexpected-eof ] }
[ invalid-struct-slot ]
} case ;
dup search dup lexical? [ nip ] [ drop ] if ;
: scan-string-param ( -- name/param )
- scan >string-param ;
+ scan-token >string-param ;
: scan-c-type-param ( -- c-type/param )
scan dup "{" = [ drop \ } parse-until >array ] [ >string-param ] if ;
H{ } clone (parse-lambda) ;
: parse-binding ( end -- pair/f )
- scan {
- { [ dup not ] [ unexpected-eof ] }
+ scan-token {
{ [ 2dup = ] [ 2drop f ] }
[ nip scan-object 2array ]
} cond ;
[ scan , \ } parse-until % ] { } make ;
: parse-slot-name-delim ( end-delim string/f -- ? )
- #! This isn't meant to enforce any kind of policy, just
- #! to check for mistakes of this form:
- #!
- #! TUPLE: blahblah foo bing
- #!
- #! : ...
+ ! Check for mistakes of this form:
+ !
+ ! TUPLE: blahblah foo bing
+ !
+ ! : ...
{
- { [ dup not ] [ unexpected-eof ] }
{ [ dup { ":" "(" "<" "\"" "!" } member? ] [ invalid-slot-name ] }
{ [ 2dup = ] [ drop f ] }
[ dup "{" = [ drop parse-long-slot-name ] when , t ]
} cond nip ;
: parse-tuple-slots-delim ( end-delim -- )
- dup scan parse-slot-name-delim [ parse-tuple-slots-delim ] [ drop ] if ;
+ dup scan-token parse-slot-name-delim [ parse-tuple-slots-delim ] [ drop ] if ;
! Parse a single tuple slot name terminated by ";".
! Delegates to parse-slot-name-delim with ";" as the end token;
! outputs f once ";" is reached, t while more slots remain.
: parse-slot-name ( string/f -- ? )
    [ ";" ] dip parse-slot-name-delim ;
2dup swap slot-named* nip [ 2nip ] [ nip bad-slot-name ] if ;
: parse-slot-value ( class slots -- )
- scan check-slot-name scan-object 2array , scan {
- { f [ \ } unexpected-eof ] }
+ scan check-slot-name scan-object 2array , scan-token {
{ "}" [ ] }
[ bad-literal-tuple ]
} case ;
: (parse-slot-values) ( class slots -- )
2dup parse-slot-value
- scan {
- { f [ 2drop \ } unexpected-eof ] }
+ scan-token {
{ "{" [ (parse-slot-values) ] }
{ "}" [ 2drop ] }
[ 2nip bad-literal-tuple ]
assoc-union! seq>> boa>object ;
: parse-tuple-literal-slots ( class slots -- tuple )
- scan {
- { f [ unexpected-eof ] }
+ scan-token {
{ "f" [ drop \ } parse-until boa>object ] }
{ "{" [ 2dup parse-slot-values assoc>object ] }
{ "}" [ drop new ] }
: parse-effect-value ( token -- value )
":" ?tail [
- scan {
+ scan-token {
{ [ dup "(" = ] [ drop ")" parse-effect ] }
- { [ dup f = ] [ ")" unexpected-eof ] }
[ parse-word dup class? [ bad-effect ] unless ]
} cond 2array
] when ;
HELP: scan
{ $values { "str/f" { $maybe string } } }
-{ $description "Reads the next token from the lexer. See " { $link parse-token } " for details." }
+{ $description "Reads the next token from the lexer. Tokens are delimited by whitespace, with the exception that " { $snippet "\"" } " is treated like a single token even when not followed by whitespace. This word outputs " { $link f } " on end of input. To throw an error on end of input, use " { $link scan-token } " instead." }
+$parsing-note ;
+
+HELP: scan-token
+{ $values { "str" string } }
+{ $description "Reads the next token from the lexer. Tokens are delimited by whitespace, with the exception that " { $snippet "\"" } " is treated like a single token even when not followed by whitespace. This word throws " { $link unexpected-eof } " on end of input. To output " { $link f } " on end of input, use " { $link scan } " instead." }
$parsing-note ;
HELP: still-parsing?
-! Copyright (C) 2008, 2009 Slava Pestov.
+! Copyright (C) 2008, 2010 Slava Pestov, Joe Groff.
! See http://factorcode.org/license.txt for BSD license.
USING: kernel sequences accessors namespaces math words strings
io vectors arrays math.parser combinators continuations
: push-parsing-word ( word -- )
lexer-parsing-word new
- swap >>word
- lexer get [
- [ line>> >>line ]
- [ line-text>> >>line-text ]
- [ column>> >>column ] tri
- ] [ parsing-words>> push ] bi ;
+ swap >>word
+ lexer get [
+ [ line>> >>line ]
+ [ line-text>> >>line-text ]
+ [ column>> >>column ] tri
+ ] [ parsing-words>> push ] bi ;
! Remove the most recently pushed entry from the current
! lexer's parsing-words stack, discarding it.
: pop-parsing-word ( -- )
lexer get parsing-words>> pop drop ;
[ line-text>> ]
} cleave subseq ;
-: parse-token ( lexer -- str/f )
+: parse-token ( lexer -- str/f )
dup still-parsing? [
dup skip-blank
dup still-parsing-line?
! Throw an unexpected-token error with f in place of the token,
! signalling that input ended while the given word was expected.
: unexpected-eof ( word -- * ) f unexpected ;
+: scan-token ( -- str ) scan [ "token" unexpected-eof ] unless* ;
+
: expect ( token -- )
- scan
- [ 2dup = [ 2drop ] [ unexpected ] if ]
- [ unexpected-eof ]
- if* ;
+ scan-token 2dup = [ 2drop ] [ unexpected ] if ;
: each-token ( ... end quot: ( ... token -- ... ) -- ... )
- [ scan ] 2dip {
- { [ 2over = ] [ 3drop ] }
- { [ pick not ] [ drop unexpected-eof ] }
- [ [ nip call ] [ each-token ] 2bi ]
- } cond ; inline recursive
+ [ scan-token ] 2dip 2over =
+ [ 3drop ] [ [ nip call ] [ each-token ] 2bi ] if ; inline recursive
! Apply quot to each token up to (and consuming) the end token,
! collecting the quotation's outputs into a new sequence via
! a collector around each-token.
: map-tokens ( ... end quot: ( ... token -- ... elt ) -- ... seq )
collector [ each-token ] dip { } like ; inline
: <lexer-error> ( msg -- error )
\ lexer-error new
- lexer get [
- [ line>> >>line ]
- [ column>> >>column ] bi
- ] [
- [ line-text>> >>line-text ]
- [ parsing-words>> clone >>parsing-words ] bi
- ] bi
- swap >>error ;
+ lexer get [
+ [ line>> >>line ]
+ [ column>> >>column ] bi
+ ] [
+ [ line-text>> >>line-text ]
+ [ parsing-words>> clone >>parsing-words ] bi
+ ] bi
+ swap >>error ;
: simple-lexer-dump ( error -- )
[ line>> number>string ": " append ]
[ (parsing-word-lexer-dump) ] if ;
: lexer-dump ( error -- )
- dup parsing-words>> [ simple-lexer-dump ] [ last parsing-word-lexer-dump ] if-empty ;
+ dup parsing-words>>
+ [ simple-lexer-dump ]
+ [ last parsing-word-lexer-dump ] if-empty ;
! Run quot with the given lexer bound to the lexer dynamic
! variable; any error raised inside is wrapped in a
! <lexer-error> (capturing line/column context) and rethrown.
: with-lexer ( lexer quot -- newquot )
[ lexer set ] dip [ <lexer-error> rethrow ] recover ; inline
ARTICLE: "reading-ahead" "Reading ahead"
"Parsing words can consume input:"
+{ $subsections
+ scan-token
+ scan-object
+}
+"Lower-level words:"
{ $subsections
scan
scan-word
HELP: auto-use?
{ $var-description "If set to a true value, the behavior of the parser when encountering an unknown word name is changed. If only one loaded vocabulary has a word with this name, instead of throwing an error, the parser adds the vocabulary to the search path and prints a parse note. Off by default." }
{ $notes "This feature is intended to help during development. To generate a " { $link POSTPONE: USING: } " form automatically, enable " { $link auto-use? } ", load the source file, and copy and paste the " { $link POSTPONE: USING: } " form printed by the parser back into the file, then disable " { $link auto-use? } ". See " { $link "word-search-errors" } "." } ;
+
+HELP: scan-object
+{ $values { "object" object } }
+{ $description "Parses a literal representation of an object." }
+$parsing-note ;
"#!" [ POSTPONE: ! ] define-core-syntax
- "IN:" [ scan set-current-vocab ] define-core-syntax
+ "IN:" [ scan-token set-current-vocab ] define-core-syntax
"<PRIVATE" [ begin-private ] define-core-syntax
"PRIVATE>" [ end-private ] define-core-syntax
- "USE:" [ scan use-vocab ] define-core-syntax
+ "USE:" [ scan-token use-vocab ] define-core-syntax
- "UNUSE:" [ scan unuse-vocab ] define-core-syntax
+ "UNUSE:" [ scan-token unuse-vocab ] define-core-syntax
"USING:" [ ";" [ use-vocab ] each-token ] define-core-syntax
- "QUALIFIED:" [ scan dup add-qualified ] define-core-syntax
+ "QUALIFIED:" [ scan-token dup add-qualified ] define-core-syntax
- "QUALIFIED-WITH:" [ scan scan add-qualified ] define-core-syntax
+ "QUALIFIED-WITH:" [ scan-token scan-token add-qualified ] define-core-syntax
"FROM:" [
- scan "=>" expect ";" parse-tokens add-words-from
+ scan-token "=>" expect ";" parse-tokens add-words-from
] define-core-syntax
"EXCLUDE:" [
- scan "=>" expect ";" parse-tokens add-words-excluding
+ scan-token "=>" expect ";" parse-tokens add-words-excluding
] define-core-syntax
"RENAME:" [
- scan scan "=>" expect scan add-renamed-word
+ scan-token scan-token "=>" expect scan-token add-renamed-word
] define-core-syntax
"HEX:" [ 16 parse-base ] define-core-syntax
"t" "syntax" lookup define-singleton-class
"CHAR:" [
- scan {
+ scan-token {
{ [ dup length 1 = ] [ first ] }
{ [ "\\" ?head ] [ next-escape >string "" assert= ] }
[ name>char-hook get call( name -- char ) ]
] define-core-syntax
"DEFER:" [
- scan current-vocab create
+ scan-token current-vocab create
[ fake-definition ] [ set-word ] [ undefined-def define ] tri
] define-core-syntax
"PREDICATE:" [
CREATE-CLASS
- scan "<" assert=
+ "<" expect
scan-word
parse-definition define-predicate-class
] define-core-syntax
] define-core-syntax
"SLOT:" [
- scan define-protocol-slot
+ scan-token define-protocol-slot
] define-core-syntax
"C:" [