use radix literals

[factor.git] / basis / xml / autoencoding / autoencoding.factor
diff --git a/basis/xml/autoencoding/autoencoding.factor b/basis/xml/autoencoding/autoencoding.factor

index 20a661cfa79e98f3a9f2082161d07255ff42e970..ed9b341c52dbdedacb0e43e3dd2fae24d3a40bb3 100644 (file)
--- a/basis/xml/autoencoding/autoencoding.factor
+++ b/basis/xml/autoencoding/autoencoding.factor
@@ -3,44 +3,50 @@
  USING: kernel namespaces xml.name io.encodings.utf8 xml.elements
  io.encodings.utf16 xml.tokenize xml.state math ascii sequences
  io.encodings.string io.encodings combinators accessors
-xml.data io.encodings.iana ;
+xml.data io.encodings.iana xml.errors ;
  IN: xml.autoencoding
  
+: decode-stream ( encoding -- )
+    spot get [ swap re-decode ] change-stream drop ;
+
  : continue-make-tag ( str -- tag )
      parse-name-starting middle-tag end-tag ;
  
  : start-utf16le ( -- tag )
-    utf16le decode-input
+    utf16le decode-stream
      "?\0" expect
      check instruct ;
  
  : 10xxxxxx? ( ch -- ? )
      -6 shift 3 bitand 2 = ;
-          
+
  : start<name ( ch -- tag )
      ! This is unfortunate, and exists for the corner case
      ! that the first letter of the document is < and second is
      ! not ASCII
      ascii?
-    [ utf8 decode-input next make-tag ] [
+    [ utf8 decode-stream next make-tag ] [
          next
-        [ get-next 10xxxxxx? not ] take-until
+        [ drop get-next 10xxxxxx? not ] take-until
          get-char suffix utf8 decode
-        utf8 decode-input next
+        utf8 decode-stream next
          continue-make-tag
      ] if ;
  
  : prolog-encoding ( prolog -- )
      encoding>> dup "UTF-16" =
-    [ drop ] [ name>encoding [ decode-input ] when* ] if ;
+    [ drop ] [
+        dup name>encoding
+        [ decode-stream ] [ bad-encoding ] ?if
+    ] if ;
  
  : instruct-encoding ( instruct/prolog -- )
      dup prolog?
      [ prolog-encoding ]
-    [ drop utf8 decode-input ] if ;
+    [ drop utf8 decode-stream ] if ;
  
  : go-utf8 ( -- )
-    check utf8 decode-input next next ;
+    check utf8 decode-stream next next ;
  
  : start< ( -- tag )
      ! What if first letter of processing instruction is non-ASCII?
@@ -52,11 +58,11 @@ IN: xml.autoencoding
      } case ;
  
  : skip-utf8-bom ( -- tag )
-    "\u0000bb\u0000bf" expect utf8 decode-input
+    "\u0000bb\u0000bf" expect utf8 decode-stream
      "<" expect check make-tag ;
  
  : decode-expecting ( encoding string -- tag )
-    [ decode-input next ] [ expect ] bi* check make-tag ;
+    [ decode-stream next ] [ expect ] bi* check make-tag ;
  
  : start-utf16be ( -- tag )
      utf16be "<" decode-expecting ;
@@ -71,9 +77,9 @@ IN: xml.autoencoding
      get-char {
          { CHAR: < [ start< ] }
          { 0 [ start-utf16be ] }
-        { HEX: EF [ skip-utf8-bom ] }
-        { HEX: FF [ skip-utf16le-bom ] }
-        { HEX: FE [ skip-utf16be-bom ] }
-        [ drop utf8 decode-input check f ]
+        { 0xEF [ skip-utf8-bom ] }
+        { 0xFF [ skip-utf16le-bom ] }
+        { 0xFE [ skip-utf16be-bom ] }
+        [ drop utf8 decode-stream check f ]
      } case ;