basis/unicode/normalize/normalize-tests.factor

   1 USING: unicode.normalize kernel tools.test sequences
   2 unicode.data io.encodings.utf8 io.files splitting math.parser
   3 locals math quotations assocs combinators ;
   4 IN: unicode.normalize.tests
   5
   6 [ "ab\u000323\u000302cd" ] [ "ab\u000302" "\u000323cd" string-append ] unit-test ! the two combining marks meeting at the join come out swapped (U+0323 before U+0302)
   7 ! Reordering and decomposition: expected stack contents come first, code under test second.
   8 [ "ab\u00064b\u000347\u00034e\u00034d\u000346" ] [ "ab\u000346\u000347\u00064b\u00034e\u00034d" dup reorder ] unit-test ! presumably reorder mutates the dup'd string in place - confirm
   9 [ "hello" "hello" ] [ "hello" [ nfd ] keep nfkd ] unit-test ! plain ASCII is unchanged by both nfd and nfkd
  10 [ "\u00FB012\u002075\u00017F\u000323\u000307" "fi25s\u000323\u000307" ] ! first value is the nfd result, second the nfkd result
  11 [ "\u00FB012\u002075\u001E9B\u000323" [ nfd ] keep nfkd ] unit-test ! escapes are six hex digits, so "\u00FB01" is U+FB01 followed by a literal "2"
  12 ! Composition (nfc) checked next to decomposition (nfd) of the same input.
  13 [ "\u001E69" "s\u000323\u000307" ] [ "\u001E69" [ nfc ] keep nfd ] unit-test
  14 [ "\u001E0D\u000307" ] [ "\u001E0B\u000323" nfc ] unit-test
  15 ! Hangul syllable <-> jamo: 54620 is 0xD55C; 4370 4449 4523 are 0x1112 0x1161 0x11AB.
  16 [ 54620 ] [ 4370 4449 4523 jamo>hangul ] unit-test
  17 [ 4370 4449 4523 ] [ 54620 hangul>jamo first3 ] unit-test
  18 [ t ] [ 54620 hangul? ] unit-test
  19 [ f ] [ 0 hangul? ] unit-test
  20 [ "\u001112\u001161\u0011ab" ] [ "\u00d55c" nfd ] unit-test ! same syllable/jamo triple as above, this time through nfd
  21 [ "\u00d55c" ] [ "\u001112\u001161\u0011ab" nfc ] unit-test ! and back again through nfc
  22
  23 : parse-test ( -- tests ) ! Loads NormalizationTest.txt and returns a sequence of test rows, each row being 5 strings
  24     "resource:basis/unicode/normalize/NormalizationTest.txt"
  25     utf8 file-lines filter-comments ! read the file as UTF-8 lines; filter-comments is defined outside this file - presumably it drops comment and blank lines, confirm
  26     [ ";" split 5 head [ " " split [ hex> ] "" map-as ] map ] map ; ! per line: split on ";", keep the first 5 fields, turn each field's space-separated hex code points into a string. NOTE(review): 5 head needs at least 5 fields - verify filter-comments also removes "@Part" header lines
  27
  28 :: assert= ( test spec quot -- ) ! For every { expected-column source-columns } entry of spec, runs one unit-test per source column: quot applied to that column of test must equal the expected column
  29     spec [ ! assoc-each supplies key = expected column number, value = sequence of source column numbers
  30         [
  31             [ 1- test nth ] bi@ ! column numbers are 1-based; turn both into the corresponding strings of test
  32             [ 1quotation ] [ quot curry ] bi* unit-test ! expected string becomes [ expected ]; source string is curried onto quot to form the code under test
  33         ] with each ! with keeps the key fixed while each walks the source column numbers
  34     ] assoc-each ;
  35
  36 : run-line ( test -- ) ! Checks one parsed row (columns numbered 1-5) against all four normalization words via assert=
  37     { ! cleave applies each quotation below to the same test row
  38         [ { { 2 { 1 2 3 } } { 4 { 4 5 } } } [ nfc ] assert= ] ! column 2 = nfc of columns 1-3; column 4 = nfc of columns 4-5
  39         [ { { 3 { 1 2 3 } } { 5 { 4 5 } } } [ nfd ] assert= ] ! column 3 = nfd of columns 1-3; column 5 = nfd of columns 4-5
  40         [ { { 4 { 1 2 3 4 5 } } } [ nfkc ] assert= ] ! column 4 = nfkc of every column
  41         [ { { 5 { 1 2 3 4 5 } } } [ nfkd ] assert= ] ! column 5 = nfkd of every column
  42     } cleave ;
  43
  44 ! parse-test [ run-line ] each