1 USING: accessors assocs combinators html.parser
2 html.parser.utils io io.streams.string kernel math math.order
3 namespaces sequences strings unicode.categories ;
4 IN: html.parser.printer
! html-printer subclass that html-text. binds to the html-printer variable
! while it prints a tag vector.
7 TUPLE: text-printer < html-printer ;
! html-printer subclass that html-src. binds to the html-printer variable
! while it prints a tag vector.
8 TUPLE: src-printer < html-printer ;
! html-printer subclass that prettyprint-html stores in the html-printer
! variable.
9 TUPLE: html-prettyprinter < html-printer ;
! Printing hooks. Each one takes a single tag ( tag -- ) and dispatches on
! the current value of the html-printer variable; print-tag decides which of
! them to call for a given tag.
11 HOOK: print-text-tag html-printer ( tag -- )
12 HOOK: print-comment-tag html-printer ( tag -- )
13 HOOK: print-dtd-tag html-printer ( tag -- )
14 HOOK: print-opening-tag html-printer ( tag -- )
15 HOOK: print-closing-tag html-printer ( tag -- )
! Error class with a single slot, tag. Nothing visible in this chunk throws
! it; presumably print-tag's fallthrough case does -- TODO confirm.
17 ERROR: unknown-tag-error tag ;
19 : print-tag ( tag -- )
21 { [ dup name>> text = ] [ print-text-tag ] }
22 { [ dup name>> comment = ] [ print-comment-tag ] }
23 { [ dup name>> dtd = ] [ print-dtd-tag ] }
24 { [ dup name>> string? ]
27 [ print-closing-tag ] [ print-opening-tag ] if
: print-tags ( vector -- )
    ! Run print-tag on every element of the sequence, in order.
    [ print-tag ] each ;
: html-text. ( vector -- )
    ! Print the tags with a text-printer bound to the html-printer variable;
    ! the binding lives in a fresh scope and is gone when the word returns.
    [ T{ text-printer } html-printer set print-tags ] with-scope ;
: html-text ( vector -- string )
    ! Collect into a string everything that is written while the tags are
    ! printed with a text-printer bound to the html-printer variable.
    [ T{ text-printer } html-printer [ print-tags ] with-variable ]
    with-string-writer ;
: html-src. ( vector -- )
    ! Print the tags with a src-printer bound to the html-printer variable;
    ! the binding lives in a fresh scope and is gone when the word returns.
    [ T{ src-printer } html-printer set print-tags ] with-scope ;
: html-src ( vector -- string )
    ! Collect into a string everything that is written while the tags are
    ! printed with a src-printer bound to the html-printer variable.
    [ T{ src-printer } html-printer [ print-tags ] with-variable ]
    with-string-writer ;
47 M: text-printer print-opening-tag
52 { "li" [ " * " write ] }
56 M: text-printer print-closing-tag
59 { "p" "blockquote" "h1" "h2" "h3" "h4" "h5" }
60 member? [ nl nl ] when
63 { "ul" "ol" "li" "tr" } member? [ nl ] when
65 [ "td" = [ bl ] when ] tri ;
M: text-printer print-comment-tag ( tag -- )
    ! The text-printer writes nothing for a comment tag; just discard it.
    drop ;
69 M: html-printer print-text-tag ( tag -- )
M: html-printer print-comment-tag ( tag -- )
    ! Write the tag's text slot between the comment delimiters.
    "<!--" write
    text>> write
    "-->" write ;
M: html-printer print-dtd-tag ( tag -- )
    ! Write the tag's text slot between "<!" and ">".
    "<!" write
    text>> write
    ">" write ;
: print-attributes ( hashtable -- )
    ! For every entry write a space, the key, "=", and then the value after
    ! it has been passed through ?quote.
    [
        [ bl write "=" write ] dip
        ?quote write
    ] assoc-each ;
81 M: src-printer print-opening-tag ( tag -- )
84 [ attributes>> dup assoc-empty? [ drop ] [ print-attributes ] if ] bi
87 M: src-printer print-closing-tag ( tag -- )
96 : prettyprint-html ( vector -- )
98 T{ html-prettyprinter } html-printer set
99 V{ } clone tagstack set
106 tab-width get #indentations get 0 max * CHAR: \s <repetition> ;
108 M: html-prettyprinter print-opening-tag ( tag -- )
110 [ tabs write "<" write write ">\n" write ]
111 ! These tags usually don't have any closing tag associated with them.
112 [ { "br" "img" } member? [ #indentations inc ] unless ] bi ;
M: html-prettyprinter print-closing-tag ( tag -- )
    ! Write "</name>" followed by a newline, prefixed with the current
    ! indentation. The indentation level is lowered before writing so the
    ! closing tag is printed one level shallower than the tag's contents.
    !
    ! "br" and "img" usually don't have any closing tag associated with
    ! them, so they must leave the level untouched. The check has to be made
    ! on the tag's name: the tag itself is a tuple and never equals a string,
    ! so testing it directly against { "br" "img" } always decremented.
    name>>
    [ { "br" "img" } member? [ #indentations dec ] unless ]
    [ tabs write "</" write write ">\n" write ] bi ;
M: html-prettyprinter print-text-tag ( tag -- )
    ! Strip blank characters from both ends of the tag's text. If nothing is
    ! left, print nothing; otherwise write the indentation, the text and a
    ! newline.
    text>> [ blank? ] trim
    dup empty?
    [ drop ]
    [ tabs write write "\n" write ] if ;