[Map list automatic filtering] adding doc.

e5419936 · Alexandre Delanoë · 541b5a3b · e5419936
Commit e5419936 authored Jun 09, 2018 by Alexandre Delanoë
Hide whitespace changes
Inline Side-by-side

Showing with 11 additions and 10 deletions

Metrics.hs src/Gargantext/Text/Metrics.hs +11 -10

No files found.
--- a/src/Gargantext/Text/Metrics.hs
+++ b/src/Gargantext/Text/Metrics.hs
@@ -60,20 +60,21 @@ import GHC.Real (round)
 -- . fromIndex fi $ filterMat $ cooc2mat ti m
-type ListSize  = Int
+type MapListSize  = Int
-type BinSize = Double
+type SampleBins = Double
+type Clusters = Int
-- Map list creation
+-- | Map list creation
-- Kmean split into 2 main clusters with Inclusion/Exclusion (relevance score)
+-- Kmeans split into (Clusters::Int) main clusters with Inclusion/Exclusion (relevance score)
-- Sample the main cluster ordered by specificity/genericity in s parts
+-- Sample the main cluster ordered by specificity/genericity in (SampleBins::Double) parts
 -- each part is then ordered by Inclusion/Exclusion
-- take n scored terms in each parts where n * s = l
+-- take n scored terms in each part where n * SampleBins = MapListSize.
-takeSome :: Ord t => ListSize -> BinSize -> [Scored t] -> [Scored t]
+takeSome :: Ord t => MapListSize -> SampleBins -> Clusters -> [Scored t] -> [Scored t]
-takeSome l s scores = L.take l
+takeSome l s k scores = L.take l
                    $ takeSample n m
-                    $ splitKmeans 2 scores
+                    $ splitKmeans k scores
  where
-    -- (TODO: benchmark with accelerate-example kmeans version)
+    -- TODO: benchmark with accelerate-example kmeans version
    splitKmeans x xs = elements
                     $ V.head
                     $ kmeans (\i -> VU.fromList ([(_scored_incExc i :: Double)]))