math.statistics: make collect-by row polymorphic, simplify words.

author John Benediktsson <mrjbq7@gmail.com>

Mon, 22 Apr 2013 13:25:50 +0000 (06:25 -0700)

committer John Benediktsson <mrjbq7@gmail.com>

Mon, 22 Apr 2013 13:25:50 +0000 (06:25 -0700)
author John Benediktsson <mrjbq7@gmail.com>
Mon, 22 Apr 2013 13:25:50 +0000 (06:25 -0700)
committer John Benediktsson <mrjbq7@gmail.com>
Mon, 22 Apr 2013 13:25:50 +0000 (06:25 -0700)
diff --git a/basis/math/statistics/statistics-docs.factor b/basis/math/statistics/statistics-docs.factor

index f3d20b50a077473e6735984dc3332257c806a7bb..7397b9f4f1361e627259c3b00ea0630a3e831626 100644 (file)
--- a/basis/math/statistics/statistics-docs.factor
+++ b/basis/math/statistics/statistics-docs.factor
@@ -238,7 +238,7 @@ HELP: rescale
  
  HELP: collect-by
  { $values
-    { "seq" sequence } { "quot" { $quotation "( obj -- ? )" } }
+    { "seq" sequence } { "quot" { $quotation "( ... obj -- ... key )" } }
      { "hashtable" hashtable }
  }
  { $description "Applies a quotation to each element in the input sequence and returns a " { $snippet "hashtable" } " of like elements. The keys of this " { $snippet "hashtable" } " are the output of " { $snippet "quot" } " and the values at each key are the elements that transformed to that key." }
@@ -254,7 +254,7 @@ HELP: collect-by
  
  HELP: collect-index-by
  { $values
-    { "seq" sequence } { "quot" { $quotation "( obj -- ? )" } }
+    { "seq" sequence } { "quot" { $quotation "( ... obj -- ... key )" } }
      { "hashtable" hashtable }
  }
  { $description "Applies a quotation to each element in the input sequence and returns a " { $snippet "hashtable" } " of like elements. The keys of this " { $snippet "hashtable" } " are the output of " { $snippet "quot" } " and the values at each key are the indices for the elements that transformed to that key." }
diff --git a/basis/math/statistics/statistics.factor b/basis/math/statistics/statistics.factor

index 713ff46494825a65527d4c21c41f596123fdb192..30fbce55edc8120e6ca35dfc545602cf8ee7a946 100644 (file)
--- a/basis/math/statistics/statistics.factor
+++ b/basis/math/statistics/statistics.factor
@@ -247,18 +247,17 @@ PRIVATE>
  : normalized-histogram ( seq -- alist )
      [ histogram ] [ length ] bi '[ _ / ] assoc-map ;
  
-: collect-index-by ( seq quot -- hashtable )
-    [ swap ] prepose [ push-at ] sequence-index>hashtable ; inline
+: collect-index-by ( ... seq quot: ( ... obj -- ... key ) -- ... hashtable )
+    [ dip swap ] curry [ push-at ] sequence-index>hashtable ; inline
  
-: collect-by ( seq quot -- hashtable )
-    [ dup ] prepose [ push-at ] sequence>hashtable ; inline
+: collect-by ( ... seq quot: ( ... obj -- ... key ) -- ... hashtable )
+    [ keep swap ] curry [ push-at ] sequence>hashtable ; inline
  
  : equal-probabilities ( n -- array )
      dup recip <array> ; inline
  
  : mode ( seq -- x )
-    histogram >alist
-    [ ] [ [ [ second ] bi@ > ] most ] map-reduce first ;
+    histogram >alist [ second ] supremum-by first ;
  
  : minmax ( seq -- min max )
      [ first dup ] keep [ [ min ] [ max ] bi-curry bi* ] each ;
@@ -380,18 +379,16 @@ ALIAS: std sample-std
      flip [ standardize ] map flip ;
  
  : differences ( u -- v )
-    [ 1 tail-slice ] keep v- ;
+    [ rest-slice ] keep v- ;
  
  : rescale ( u -- v )
      dup minmax over - [ v-n ] [ v/n ] bi* ;
  
+: rankings ( histogram -- assoc )
+    sort-keys 0 swap [ rot [ + ] keep swapd ] H{ } assoc-map-as nip ;
+
  : rank-values ( seq -- seq' )
-    [
-        [ ] [ length iota ] bi zip sort-keys
-        [ [ first ] bi@ = ] monotonic-split
-        [ values ] map [ 0 [ length + ] accumulate nip ] [ ] bi zip
-    ] [ length f <array> ] bi
-    [ '[ first2 [ _ set-nth ] with each ] each ] keep ;
+    dup histogram rankings '[ _ at ] map ;
  
  : z-score ( seq -- n )
      [ demean ] [ sample-std ] bi v/n ;
author	John Benediktsson <mrjbq7@gmail.com>
	Mon, 22 Apr 2013 13:25:50 +0000 (06:25 -0700)
committer	John Benediktsson <mrjbq7@gmail.com>
	Mon, 22 Apr 2013 13:25:50 +0000 (06:25 -0700)
basis/math/statistics/statistics-docs.factor		patch \| blob \| history
basis/math/statistics/statistics.factor		patch \| blob \| history