use reject instead of [ ... not ] filter.

[factor.git] / basis / unicode / breaks / breaks-tests.factor
diff --git a/basis/unicode/breaks/breaks-tests.factor b/basis/unicode/breaks/breaks-tests.factor

index 77ba0e82fa702f4bf85997ba2bb2a0e11b690613..a3acaf3c4ff06b5e36eaa6d187747244a0b62af4 100644 (file)
--- a/basis/unicode/breaks/breaks-tests.factor
+++ b/basis/unicode/breaks/breaks-tests.factor
@@ -1,7 +1,54 @@
-USING: tools.test unicode.breaks sequences math kernel ;
+USING: tools.test unicode.breaks sequences math kernel splitting
+unicode.categories io.pathnames io.encodings.utf8 io.files
+strings quotations math.parser locals ;
+IN: unicode.breaks.tests
  
  [ "\u001112\u001161\u0011abA\u000300a\r\r\n" ]
  [ "\r\n\raA\u000300\u001112\u001161\u0011ab" string-reverse ] unit-test
  [ "dcba" ] [ "abcd" string-reverse ] unit-test
  [ 3 ] [ "\u001112\u001161\u0011abA\u000300a"
          dup last-grapheme head last-grapheme ] unit-test
+
+[ 3 ] [ 2 "hello" first-grapheme-from ] unit-test
+[ 1 ] [ 2 "hello" last-grapheme-from ] unit-test
+
+[ 4 ] [ 2 "what am I saying" first-word-from ] unit-test
+[ 0 ] [ 2 "what am I saying" last-word-from ] unit-test
+[ 16 ] [ 11 "what am I saying" first-word-from ] unit-test
+[ 10 ] [ 11 "what am I saying" last-word-from ] unit-test
+
+: grapheme-break-test ( -- filename )
+    "vocab:unicode/breaks/GraphemeBreakTest.txt" ;
+
+: word-break-test ( -- filename )
+    "vocab:unicode/breaks/WordBreakTest.txt" ;
+
+: parse-test-file ( file-name -- tests )
+    utf8 file-lines
+    [ "#" split1 drop ] map harvest [
+        "÷" split
+        [
+            "×" split
+            [ [ blank? ] trim hex> ] map
+            [ { f 0 } member? ] reject
+            >string
+        ] map
+        harvest
+    ] map ;
+
+:: test ( tests quot -- )
+    tests [
+        [ 1quotation ]
+        [ concat [ quot call [ "" like ] map ] curry ] bi unit-test
+    ] each ;
+
+: grapheme-test ( tests -- )
+    [
+        [ 1quotation ]
+        [ concat [ >graphemes [ "" like ] map ] curry ] bi unit-test
+    ] each ;
+
+grapheme-break-test parse-test-file [ >graphemes ] test
+word-break-test parse-test-file [ >words ] test
+
+[ { t f t t f t } ] [ 6 iota [ "as df" word-break-at? ] map ] unit-test