Commit a52e3832 authored by Quentin Lobbé's avatar Quentin Lobbé

Merge branch 'dev-phylo' of https://gitlab.iscpif.fr/gargantext/haskell-gargantext into dev-phylo

parents d341c4b2 3f46358d
Pipeline #351 canceled with stage
......@@ -241,6 +241,30 @@ executables:
- unordered-containers
- full-text-search
# Executable stanza for the `gargantext-phylo` binary: entry point Main.hs,
# looked up under bin/gargantext-phylo.
# NOTE(review): this looks like an hpack package.yaml `executables:` entry
# whose nesting indentation was lost in this view — confirm against the file.
gargantext-phylo:
main: Main.hs
source-dirs: bin/gargantext-phylo
ghc-options:
# Link the threaded runtime, allow RTS flags on the command line, and bake in
# `-N` as a default RTS option.
- -threaded
- -rtsopts
- -with-rtsopts=-N
- -O2
# Warn about top-level bindings that have no type signature.
- -Wmissing-signatures
# Packages this executable is built against; `gargantext` is the project's own
# library.
dependencies:
- aeson
- async
- base
- bytestring
- containers
- gargantext
- vector
- parallel
- cassava
- ini
- optparse-generic
- split
- unordered-containers
gargantext-import:
main: Main.hs
source-dirs: bin/gargantext-import
......
......@@ -18,7 +18,7 @@ commentary with @some markup@.
module Gargantext.Text.Terms.WithList where
import qualified Data.Algorithms.KMP as KMP
import Data.Text (Text)
import Data.Text (Text, concat)
import qualified Data.IntMap.Strict as IntMap
import Gargantext.Text.Context
......@@ -75,3 +75,12 @@ buildPatterns = sortWith (Down . _pat_length) . concatMap buildPattern
-- | Split the input with 'monoTextsBySentence' and run 'replaceTerms' with
-- the given patterns over every element of the result, keeping the nested
-- structure that 'replaceTerms' returns.
extractTermsWithList :: Patterns -> Text -> Corpus [Text]
extractTermsWithList pats txt =
  [ replaceTerms pats sentence | sentence <- monoTextsBySentence txt ]
-- | Extract terms, producing one flat 'Text' per element returned by
-- 'monoTextsBySentence'.
--
-- Each element is passed through 'replaceTerms' with the given patterns; the
-- nested result is then collapsed into a single 'Text' with "Data.Text"'s
-- 'concat', applied first to every inner group and then to the groups
-- themselves (no separator is inserted at either level).
--
-- >>> let termList = [(["chat blanc"], [["chat","blanc"]])] :: TermList
-- >>> extractTermsWithList' (buildPatterns termList) "Le chat blanc"
-- ["chat blanc"]
extractTermsWithList' :: Patterns -> Text -> [Text]
extractTermsWithList' pats txt =
  [ flatten (replaceTerms pats sentence) | sentence <- monoTextsBySentence txt ]
  where
    -- Two-level flattening: inner groups first, then the list of groups.
    flatten groups = concat (map concat groups)
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment