| 
									
										
										
										
											2008-08-27 17:24:04 -04:00
										 |  |  | ! Copyright (C) 2008 Slava Pestov. | 
					
						
							|  |  |  | ! See http://factorcode.org/license.txt for BSD license. | 
					
						
							| 
									
										
										
										
											2008-07-07 20:36:33 -04:00
										 |  |  | USING: accessors assocs math kernel shuffle generalizations | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | words quotations arrays combinators sequences math.vectors | 
					
						
							| 
									
										
										
										
											2008-12-08 21:13:04 -05:00
										 |  |  | io.styles prettyprint vocabs sorting io generic | 
					
						
							| 
									
										
										
										
											2008-12-17 20:52:47 -05:00
										 |  |  | math.statistics math.order locals.types | 
					
						
							| 
									
										
										
										
											2008-12-08 21:13:04 -05:00
										 |  |  | locals.definitions ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | IN: reports.noise | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : badness ( word -- n )
 | 
					
						
							|  |  |  |     H{ | 
					
						
							|  |  |  |         { -nrot 5 } | 
					
						
							|  |  |  |         { -roll 4 } | 
					
						
							|  |  |  |         { -rot 3 } | 
					
						
							| 
									
										
										
										
											2008-03-29 21:36:58 -04:00
										 |  |  |         { bi@ 1 } | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  |         { 2curry 1 } | 
					
						
							|  |  |  |         { 2drop 1 } | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |         { 2dup 1 } | 
					
						
							|  |  |  |         { 2keep 1 } | 
					
						
							|  |  |  |         { 2nip 2 } | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  |         { 2over 4 } | 
					
						
							|  |  |  |         { 2slip 2 } | 
					
						
							|  |  |  |         { 2swap 3 } | 
					
						
							|  |  |  |         { 3curry 2 } | 
					
						
							|  |  |  |         { 3drop 1 } | 
					
						
							|  |  |  |         { 3dup 2 } | 
					
						
							|  |  |  |         { 3keep 3 } | 
					
						
							|  |  |  |         { 3slip 3 } | 
					
						
							|  |  |  |         { 4drop 2 } | 
					
						
							|  |  |  |         { 4dup 3 } | 
					
						
							|  |  |  |         { compose 1/2 } | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |         { curry 1/3 } | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  |         { dip 1 } | 
					
						
							| 
									
										
										
										
											2008-05-23 23:48:58 -04:00
										 |  |  |         { 2dip 2 } | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |         { drop 1/3 } | 
					
						
							|  |  |  |         { dup 1/3 } | 
					
						
							|  |  |  |         { if 1/3 } | 
					
						
							|  |  |  |         { when 1/4 } | 
					
						
							|  |  |  |         { unless 1/4 } | 
					
						
							|  |  |  |         { when* 1/3 } | 
					
						
							|  |  |  |         { unless* 1/3 } | 
					
						
							|  |  |  |         { ?if 1/2 } | 
					
						
							|  |  |  |         { cond 1/2 } | 
					
						
							|  |  |  |         { case 1/2 } | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  |         { keep 1 } | 
					
						
							|  |  |  |         { napply 2 } | 
					
						
							|  |  |  |         { ncurry 3 } | 
					
						
							|  |  |  |         { ndip 5 } | 
					
						
							|  |  |  |         { ndrop 2 } | 
					
						
							|  |  |  |         { ndup 3 } | 
					
						
							|  |  |  |         { nip 2 } | 
					
						
							|  |  |  |         { nkeep 5 } | 
					
						
							|  |  |  |         { npick 6 } | 
					
						
							|  |  |  |         { nrot 5 } | 
					
						
							|  |  |  |         { nslip 5 } | 
					
						
							|  |  |  |         { ntuck 6 } | 
					
						
							|  |  |  |         { nwith 4 } | 
					
						
							|  |  |  |         { over 2 } | 
					
						
							|  |  |  |         { pick 4 } | 
					
						
							|  |  |  |         { roll 4 } | 
					
						
							|  |  |  |         { rot 3 } | 
					
						
							|  |  |  |         { slip 1 } | 
					
						
							|  |  |  |         { spin 3 } | 
					
						
							|  |  |  |         { swap 1 } | 
					
						
							|  |  |  |         { swapd 3 } | 
					
						
							|  |  |  |         { tuck 2 } | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |         { with 1/2 } | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  |         { bi 1/2 } | 
					
						
							|  |  |  |         { tri 1 } | 
					
						
							|  |  |  |         { bi* 1/2 } | 
					
						
							|  |  |  |         { tri* 1 } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         { cleave 2 } | 
					
						
							|  |  |  |         { spread 2 } | 
					
						
							|  |  |  |     } at 0 or ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-06-09 03:14:14 -04:00
										 |  |  | : vsum ( pairs -- pair ) { 0 0 } [ v+ ] reduce ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | GENERIC: noise ( obj -- pair )
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | M: word noise badness 1 2array ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-06-30 17:06:14 -04:00
										 |  |  | M: wrapper noise wrapped>> noise ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-08-27 17:24:04 -04:00
										 |  |  | M: let noise body>> noise ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-08-27 17:24:04 -04:00
										 |  |  | M: wlet noise body>> noise ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-08-27 17:24:04 -04:00
										 |  |  | M: lambda noise body>> noise ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | M: object noise drop { 0 0 } ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  | M: quotation noise [ noise ] map vsum { 1/4 1/2 } v+ ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  | M: array noise [ noise ] map vsum ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-06-09 03:14:14 -04:00
										 |  |  | : noise-factor ( x y -- z ) / 100 * >integer ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | : quot-noise-factor ( quot -- n )
 | 
					
						
							|  |  |  |     #! For very short words, noise doesn't count so much | 
					
						
							|  |  |  |     #! (so dup foo swap bar isn't penalized as badly). | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |     noise first2 { | 
					
						
							| 
									
										
										
										
											2008-12-17 20:52:47 -05:00
										 |  |  |         { [ over 4 <= ] [ [ drop 0 ] dip ] } | 
					
						
							|  |  |  |         { [ over 15 >= ] [ [ 2 * ] dip ] } | 
					
						
							| 
									
										
										
										
											2008-04-11 13:57:43 -04:00
										 |  |  |         [ ] | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |     } cond
 | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         ! short words are easier to read | 
					
						
							| 
									
										
										
										
											2008-12-17 20:52:47 -05:00
										 |  |  |         { [ dup 10 <= ] [ [ 2 / ] dip ] } | 
					
						
							|  |  |  |         { [ dup 5 <= ] [ [ 3 / ] dip ] } | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |         ! long words are penalized even more | 
					
						
							| 
									
										
										
										
											2008-12-17 20:52:47 -05:00
										 |  |  |         { [ dup 25 >= ] [ [ 2 * ] dip 20 max ] } | 
					
						
							|  |  |  |         { [ dup 20 >= ] [ [ 5/3 * ] dip ] } | 
					
						
							|  |  |  |         { [ dup 15 >= ] [ [ 3/2 * ] dip ] } | 
					
						
							| 
									
										
										
										
											2008-04-11 13:57:43 -04:00
										 |  |  |         [ ] | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |     } cond noise-factor ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | GENERIC: word-noise-factor ( word -- factor )
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | M: word word-noise-factor | 
					
						
							| 
									
										
										
										
											2008-06-28 03:36:20 -04:00
										 |  |  |     def>> quot-noise-factor ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | M: lambda-word word-noise-factor | 
					
						
							|  |  |  |     "lambda" word-prop quot-noise-factor ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  | : flatten-generics ( words -- words' )
 | 
					
						
							|  |  |  |     [ | 
					
						
							| 
									
										
										
										
											2008-04-03 07:11:18 -04:00
										 |  |  |         dup generic? [ "methods" word-prop values ] [ 1array ] if
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |     ] map concat ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | : noisy-words ( -- alist )
 | 
					
						
							|  |  |  |     all-words flatten-generics | 
					
						
							|  |  |  |     [ dup word-noise-factor ] { } map>assoc
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  |     sort-values reverse ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  | : noise. ( alist -- )
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  |     standard-table-style [ | 
					
						
							|  |  |  |         [ | 
					
						
							|  |  |  |             [ [ pprint-cell ] [ pprint-cell ] bi* ] with-row | 
					
						
							|  |  |  |         ] assoc-each
 | 
					
						
							|  |  |  |     ] tabular-output ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  | : vocab-noise-factor ( vocab -- factor )
 | 
					
						
							|  |  |  |     words flatten-generics | 
					
						
							|  |  |  |     [ word-noise-factor dup 20 < [ drop 0 ] when ] map
 | 
					
						
							| 
									
										
										
										
											2008-09-06 18:15:25 -04:00
										 |  |  |     [ 0 ] [ | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |         [ [ sum ] [ length 5 max ] bi /i ] | 
					
						
							|  |  |  |         [ supremum ] | 
					
						
							|  |  |  |         bi +
 | 
					
						
							| 
									
										
										
										
											2008-09-06 18:15:25 -04:00
										 |  |  |     ] if-empty ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | : noisy-vocabs ( -- alist )
 | 
					
						
							|  |  |  |     vocabs [ dup vocab-noise-factor ] { } map>assoc
 | 
					
						
							|  |  |  |     sort-values reverse ;
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | : noise-report ( -- )
 | 
					
						
							| 
									
										
										
										
											2008-03-17 05:31:13 -04:00
										 |  |  |     "NOISY WORDS:" print
 | 
					
						
							|  |  |  |     noisy-words 80 head noise. | 
					
						
							|  |  |  |     nl
 | 
					
						
							|  |  |  |     "NOISY VOCABS:" print
 | 
					
						
							|  |  |  |     noisy-vocabs 80 head noise. ;
 | 
					
						
							| 
									
										
										
										
											2008-03-17 00:42:21 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  | MAIN: noise-report |