1 ! Copyright (C) 2008 Slava Pestov.
\r
2 ! See http://factorcode.org/license.txt for BSD license.
\r
3 USING: accessors assocs math kernel shuffle generalizations
\r
4 words quotations arrays combinators sequences math.vectors
\r
5 io.styles prettyprint vocabs sorting io generic
\r
6 math.statistics math.order locals.types
\r
10 : badness ( word -- n )
\r
! vsum: element-wise sum of a sequence of two-element numeric pairs.
! Starts from { 0 0 }, so an empty sequence yields { 0 0 }.
: vsum ( pairs -- pair )
    { 0 0 } swap [ v+ ] each ;
\r
! noise: maps an object to a two-element pair. A single word yields
! { badness 1 }, and containers add their elements' pairs together, so the
! first slot accumulates badness and the second accumulates a count.
GENERIC: noise ( obj -- pair )

! Fallback: objects with no more specific method contribute nothing.
M: object noise
    drop { 0 0 } ;

! A word contributes its badness score and counts once.
M: word noise
    badness 1 2array ;

! A wrapper is scored as whatever it wraps.
M: wrapper noise
    wrapped>> noise ;

! lambda and let forms are scored through their body slot.
M: lambda noise
    body>> noise ;

M: let noise
    body>> noise ;

! An array is the element-wise sum of its elements' pairs.
M: array noise
    { 0 0 } [ noise v+ ] reduce ;

! A quotation sums its elements like an array, then adds a fixed
! { 1/4 1/2 } on top.
M: quotation noise
    { 0 0 } [ noise v+ ] reduce { 1/4 1/2 } v+ ;
\r
! noise-factor: expresses x as a percentage of y, converted to an integer
! with >integer.
: noise-factor ( x y -- z )
    /           ! ratio x/y
    100 *       ! scale to percent
    >integer ;
\r
! quot-noise-factor: turns a quotation into an integer noise factor. The
! visible clauses rescale the value under the top of the stack (tested with
! "over") according to itself and to the top value (tested with "dup"), and
! the pair is then handed to noise-factor.
! NOTE(review): the embedded line numbering skips 95, 98-100 and 108, so the
! code that puts the two values on the stack and that opens/closes the cond
! arrays is not visible in this listing; those gaps are left exactly as found.
92 : quot-noise-factor ( quot -- n )
\r
93 #! For very short words, noise doesn't count so much
\r
94 #! (so dup foo swap bar isn't penalized as badly).
\r
96 { [ over 4 <= ] [ [ drop 0 ] dip ] }
\r
97 { [ over 15 >= ] [ [ 2 * ] dip ] }
\r
101 ! short words are easier to read
\r
! cond runs the first clause whose test succeeds, so the tighter bound (5)
! must be tested before the looser one (10); in the opposite order the
! "divide by 3" clause could never fire.
102 { [ dup 5 <= ] [ [ 3 / ] dip ] }
\r
103 { [ dup 10 <= ] [ [ 2 / ] dip ] }
\r
104 ! long words are penalized even more
\r
105 { [ dup 25 >= ] [ [ 2 * ] dip 20 max ] }
\r
106 { [ dup 20 >= ] [ [ 5/3 * ] dip ] }
\r
107 { [ dup 15 >= ] [ [ 3/2 * ] dip ] }
\r
109 } cond noise-factor ;
\r
! word-noise-factor: noise factor of a single word; the method chosen
! decides where the code to be scored is fetched from.
GENERIC: word-noise-factor ( word -- factor )

! lambda-words are scored from the value stored under their "lambda" property.
M: lambda-word word-noise-factor "lambda" word-prop quot-noise-factor ;

! Any other word is scored from its def slot.
M: word word-noise-factor def>> quot-noise-factor ;
\r
! flatten-generics: going by the one visible body line, a generic word is
! replaced by the values of its "methods" word property, while any other
! word is wrapped in a one-element array.
! NOTE(review): the embedded numbering jumps 119 -> 121 -> 124, so whatever
! applies this per-word step to the input sequence, and the closing ";",
! are not visible in this listing -- confirm against the full file.
119 : flatten-generics ( words -- words' )
\r
121 dup generic? [ "methods" word-prop values ] [ 1array ] if
\r
! noisy-words: pairs every word returned by all-words (after
! flatten-generics) with its word-noise-factor, sorts the pairs by factor
! and reverses the result so the largest factors come first.
: noisy-words ( -- alist )
    all-words flatten-generics
    [ [ word-noise-factor ] keep swap ] { } map>assoc
    sort-values reverse ;
\r
! noise.: outputs an alist under standard-table-style; the visible row
! quotation emits both halves of an entry with pprint-cell inside with-row.
! NOTE(review): the embedded numbering jumps 130 -> 132 -> 136, so the
! combinator that walks the alist and the closing brackets / ";" are not
! visible in this listing -- confirm against the full file.
129 : noise. ( alist -- )
\r
130 standard-table-style [
\r
132 [ [ pprint-cell ] [ pprint-cell ] bi* ] with-row
\r
! vocab-noise-factor: combines the noise factors of a vocabulary's words
! (generics expanded by flatten-generics) into one number.
! NOTE(review): the embedded numbering jumps 138 -> 140 -> 145, so how the
! quotation on the last visible line is invoked, and the closing ";", are
! not visible in this listing -- confirm against the full file.
136 : vocab-noise-factor ( vocab -- factor )
\r
137 words flatten-generics
\r
! Per-word factors below 20 are replaced by 0.
138 [ word-noise-factor dup 20 < [ drop 0 ] when ] map
\r
! Integer-divides the sum by the element count, using 5 as the minimum
! divisor.
140 [ [ sum ] [ length 5 max ] bi /i ]
\r
! noisy-vocabs: pairs every entry returned by vocabs with its
! vocab-noise-factor, sorts the pairs by factor and reverses the result so
! the largest factors come first.
: noisy-vocabs ( -- alist )
    vocabs
    [ [ vocab-noise-factor ] keep swap ] { } map>assoc
    sort-values reverse ;
\r
! noise-report: prints two titled tables, the first (up to) 80 entries of
! noisy-words followed by the first (up to) 80 entries of noisy-vocabs.
! "short" clamps the requested count to the sequence length first, because
! a bare "head" throws when asked for more elements than the sequence holds.
: noise-report ( -- )
    "NOISY WORDS:" print
    noisy-words 80 short head noise.
    "NOISY VOCABS:" print
    noisy-vocabs 80 short head noise. ;
\r