Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
haskell-gargantext
Project
Project
Details
Activity
Releases
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Grégoire Locqueville
haskell-gargantext
Commits
e72fb3c7
Commit
e72fb3c7
authored
Jan 20, 2020
by
Alexandre Delanoë
Browse files
Options
Browse Files
Download
Plain Diff
Merge branch 'dev' into dev-db-schema
parents
4da8baa0
253a938c
Changes
5
Show whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
56 additions
and
77 deletions
+56
-77
package.yaml
package.yaml
+1
-0
API.hs
src/Gargantext/API.hs
+2
-2
New.hs
src/Gargantext/API/Corpus/New.hs
+46
-74
CSV.hs
src/Gargantext/Text/Corpus/Parsers/CSV.hs
+4
-0
stack.yaml
stack.yaml
+3
-1
No files found.
package.yaml
View file @
e72fb3c7
...
...
@@ -186,6 +186,7 @@ library:
-
servant-auth-swagger
-
servant-blaze
-
servant-client
-
servant-flatten
-
servant-job
-
servant-mock
-
servant-multipart
...
...
src/Gargantext/API.hs
View file @
e72fb3c7
...
...
@@ -395,9 +395,9 @@ addWithFile cid i f =
JobFunction
(
\
_i
log
->
New
.
addToCorpusWithFile
cid
i
f
(
liftIO
.
log
))
addWithForm
::
GargServer
New
.
AddWithForm
addWithForm
cid
f
=
addWithForm
cid
=
serveJobsAPI
$
JobFunction
(
\
_i
log
->
New
.
addToCorpusWithForm
cid
f
(
liftIO
.
log
))
JobFunction
(
\
i
log
->
New
.
addToCorpusWithForm
cid
i
(
liftIO
.
log
))
serverStatic
::
Server
(
Get
'[
H
TML
]
Html
)
serverStatic
=
$
(
do
...
...
src/Gargantext/API/Corpus/New.hs
View file @
e72fb3c7
...
...
@@ -24,33 +24,37 @@ New corpus means either:
module
Gargantext.API.Corpus.New
where
import
Web.FormUrlEncoded
(
FromForm
)
import
Data.Either
--import Gargantext.Text.Corpus.Parsers (parseFile, FileFormat(..)
)
import
Control.Lens
hiding
(
elements
)
import
Control.Monad.IO.Class
(
liftIO
)
import
Data.Aeson.TH
(
deriveJSON
)
import
Data.Aeson
import
Servant.Job.Utils
(
jsonOptions
)
import
Control.Lens
hiding
(
elements
)
import
Servant.Multipart
import
Data.Aeson.TH
(
deriveJSON
)
import
Data.Either
import
Data.Swagger
import
Data.Text
(
Text
)
import
GHC.Generics
(
Generic
)
import
Servant.Job.Types
import
Gargantext.API.Corpus.New.File
import
Gargantext.API.Orchestrator.Types
import
Gargantext.Core
(
Lang
(
..
))
import
Gargantext.Core.Utils.Prefix
(
unPrefix
,
unPrefixSwagger
)
import
Gargantext.Database.Flow
(
FlowCmdM
,
flowCorpus
)
import
Gargantext.Database.Flow
(
flowCorpusSearchInDatabase
)
import
Gargantext.Database.Types.Node
(
CorpusId
)
import
Gargantext.Text.Terms
(
TermType
(
..
))
import
Gargantext.Database.Types.Node
(
ToHyperdataDocument
(
..
))
import
Gargantext.Database.Types.Node
(
UserId
)
import
Gargantext.Prelude
import
Gargantext.API.Orchestrator.Types
import
Gargantext.Text.Corpus.Parsers.CSV
(
parseHal'
)
import
Gargantext.Text.Terms
(
TermType
(
..
))
import
Servant
-- import Servant.Job.Server
import
Servant.API.Flatten
(
Flat
)
import
Servant.Job.Core
import
Servant.Job.Types
import
Servant.Job.Utils
(
jsonOptions
)
import
Servant.Multipart
import
Test.QuickCheck
(
elements
)
import
Test.QuickCheck.Arbitrary
import
Gargantext.Core
(
Lang
(
..
))
import
Gargantext.Database.Flow
(
FlowCmdM
,
flowCorpus
)
import
Web.FormUrlEncoded
(
FromForm
)
import
qualified
Gargantext.Text.Corpus.API
as
API
import
Gargantext.Database.Types.Node
(
UserId
)
import
Gargantext.API.Corpus.New.File
data
Query
=
Query
{
query_query
::
Text
,
query_corpus_id
::
Int
...
...
@@ -104,41 +108,6 @@ instance ToSchema ApiInfo
info
::
FlowCmdM
env
err
m
=>
UserId
->
m
ApiInfo
info
_u
=
pure
$
ApiInfo
API
.
externalAPIs
{-
-- Proposal to replace the Query type which seems to generically named.
data ScraperInput = ScraperInput
{ _scin_query :: !Text
, _scin_corpus_id :: !Int
, _scin_databases :: [API.ExternalAPIs]
}
deriving (Eq, Show, Generic)
makeLenses ''ScraperInput
deriveJSON (unPrefix "_scin_") 'ScraperInput
data ScraperEvent = ScraperEvent
{ _scev_message :: !(Maybe Text)
, _scev_level :: !(Maybe Text)
, _scev_date :: !(Maybe Text)
}
deriving Generic
deriveJSON (unPrefix "_scev_") 'ScraperEvent
data ScraperStatus = ScraperStatus
{ _scst_succeeded :: !(Maybe Int)
, _scst_failed :: !(Maybe Int)
, _scst_remaining :: !(Maybe Int)
, _scst_events :: !(Maybe [ScraperEvent])
}
deriving Generic
deriveJSON (unPrefix "_scst_") 'ScraperStatus
-}
------------------------------------------------------------------------
------------------------------------------------------------------------
data
WithQuery
=
WithQuery
...
...
@@ -148,11 +117,11 @@ data WithQuery = WithQuery
deriving
Generic
makeLenses
''
W
ithQuery
instance
FromJSON
WithQuery
where
parseJSON
=
genericParseJSON
$
jsonOptions
"_wq_"
instance
ToSchema
WithQuery
where
declareNamedSchema
=
genericDeclareNamedSchema
(
unPrefixSwagger
"_wq_"
)
instance
ToSchema
WithQuery
-------------------------------------------------------
data
WithForm
=
WithForm
{
_wf_filetype
::
!
FileType
...
...
@@ -160,27 +129,25 @@ data WithForm = WithForm
}
deriving
(
Eq
,
Show
,
Generic
)
makeLenses
''
W
ithForm
instance
FromForm
WithForm
instance
FromJSON
WithForm
where
parseJSON
=
genericParseJSON
$
jsonOptions
"_wf_"
instance
ToSchema
WithForm
instance
FromForm
WithForm
instance
ToSchema
WithForm
where
declareNamedSchema
=
genericDeclareNamedSchema
(
unPrefixSwagger
"_wf_"
)
------------------------------------------------------------------------
type
AddAPI
withInput
=
AsyncJobsAPI
ScraperStatus
withInput
ScraperStatus
type
AsyncJobs
event
ctI
input
output
=
Flat
(
AsyncJobsAPI'
'U
n
safe
'S
a
fe
ctI
'[
J
SON
]
Maybe
event
input
output
)
------------------------------------------------------------------------
type
AddWithQuery
=
Summary
"Add to corpus endpoint"
type
AddWithQuery
=
Summary
"Add with Query to corpus endpoint"
:>
"corpus"
:>
Capture
"corpus_id"
CorpusId
:>
"add"
:>
"query"
:>
"async"
:>
A
ddAPI
WithQuery
:>
A
syncJobsAPI
ScraperStatus
WithQuery
ScraperStatus
type
AddWithFile
=
Summary
"Add to corpus endpoint"
type
AddWithFile
=
Summary
"Add
with MultipartData
to corpus endpoint"
:>
"corpus"
:>
Capture
"corpus_id"
CorpusId
:>
"add"
...
...
@@ -188,16 +155,15 @@ type AddWithFile = Summary "Add to corpus endpoint"
:>
MultipartForm
Mem
(
MultipartData
Mem
)
:>
QueryParam
"fileType"
FileType
:>
"async"
:>
A
ddAPI
()
:>
A
syncJobs
ScraperStatus
'[
J
SON
]
()
ScraperStatus
type
AddWithForm
=
Summary
"Add to corpus endpoint"
type
AddWithForm
=
Summary
"Add
with FormUrlEncoded
to corpus endpoint"
:>
"corpus"
:>
Capture
"corpus_id"
CorpusId
:>
"add"
:>
"form"
:>
ReqBody
'[
F
ormUrlEncoded
]
WithForm
:>
"async"
:>
A
ddAPI
()
:>
A
syncJobs
ScraperStatus
'[
F
ormUrlEncoded
]
WithForm
ScraperStatus
------------------------------------------------------------------------
-- TODO WithQuery also has a corpus id
...
...
@@ -206,7 +172,7 @@ addToCorpusJobFunction :: FlowCmdM env err m
->
WithQuery
->
(
ScraperStatus
->
m
()
)
->
m
ScraperStatus
addToCorpusJobFunction
_cid
_input
logStatus
=
do
addToCorpusJobFunction
_cid
(
WithQuery
_q
_dbs
)
logStatus
=
do
-- TODO ...
logStatus
ScraperStatus
{
_scst_succeeded
=
Just
10
,
_scst_failed
=
Just
2
...
...
@@ -246,17 +212,23 @@ addToCorpusWithForm :: FlowCmdM env err m
->
WithForm
->
(
ScraperStatus
->
m
()
)
->
m
ScraperStatus
addToCorpusWithForm
_cid
(
WithForm
ft
d
)
logStatus
=
do
logStatus
ScraperStatus
{
_scst_succeeded
=
Just
10
,
_scst_failed
=
Just
2
,
_scst_remaining
=
Just
138
addToCorpusWithForm
cid
(
WithForm
_ft
d
)
logStatus
=
do
let
docs
=
splitEvery
500
$
take
10000
$
parseHal'
(
cs
d
)
logStatus
ScraperStatus
{
_scst_succeeded
=
Just
1
,
_scst_failed
=
Just
0
,
_scst_remaining
=
Just
1
,
_scst_events
=
Just
[]
}
_
<-
putStrLn
$
show
ft
_
<-
putStrLn
$
show
d
pure
ScraperStatus
{
_scst_succeeded
=
Just
137
,
_scst_failed
=
Just
13
cid'
<-
flowCorpus
"user1"
(
Right
[
cid
])
(
Multi
EN
)
(
map
(
map
toHyperdataDocument
)
docs
)
printDebug
"cid'"
cid'
pure
ScraperStatus
{
_scst_succeeded
=
Just
2
,
_scst_failed
=
Just
0
,
_scst_remaining
=
Just
0
,
_scst_events
=
Just
[]
}
...
...
src/Gargantext/Text/Corpus/Parsers/CSV.hs
View file @
e72fb3c7
...
...
@@ -387,6 +387,10 @@ csv2doc (CsvDoc title source
------------------------------------------------------------------------
parseHal
::
FilePath
->
IO
[
HyperdataDocument
]
parseHal
fp
=
V
.
toList
<$>
V
.
map
csvHal2doc
<$>
snd
<$>
readCsvHal
fp
parseHal'
::
BL
.
ByteString
->
[
HyperdataDocument
]
parseHal'
=
V
.
toList
.
V
.
map
csvHal2doc
.
snd
.
readCsvHalLazyBS
------------------------------------------------------------------------
parseCsv
::
FilePath
->
IO
[
HyperdataDocument
]
...
...
stack.yaml
View file @
e72fb3c7
...
...
@@ -3,6 +3,7 @@ flags: {}
extra-package-dbs
:
[]
packages
:
-
.
#- 'deps/servant-job'
docker
:
enable
:
false
...
...
@@ -35,7 +36,8 @@ extra-deps:
#
-
git
:
https://gitlab.iscpif.fr/gargantext/patches-class
commit
:
746b4ce0af8f9e600d555ad7e5b2973a940cdad9
#- git: https://github.com/delanoe/servant-job.git
#- git: https://github.com/delanoe/servant-job.git
#commit: 7a7b7100e6d132adb4c11b25b2128e6309690ac0
-
git
:
https://github.com/np/servant-job.git
commit
:
4016c76398a56e1a352a45b3ee9d698dd0dd2597
-
git
:
https://gitlab.iscpif.fr/gargantext/clustering-louvain.git
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment