2 Module : Gargantext.Database.Flow.Utils
3 Description : Database Flow
4 Copyright : (c) CNRS, 2017-Present
5 License : AGPL + CECILL v3
6 Maintainer : team@gargantext.org
7 Stability : experimental
12 {-# LANGUAGE FlexibleContexts #-}
13 {-# LANGUAGE NoImplicitPrelude #-}
14 {-# LANGUAGE OverloadedStrings #-}
15 {-# LANGUAGE RankNTypes #-}
17 module Gargantext.Database.Flow.Utils
21 import qualified Data.Map as DM
22 import Gargantext.Prelude
23 import Gargantext.Database.Schema.Ngrams
24 import Gargantext.Database.Types.Node (NodeId, Node, NodePoly(..), Hyperdata)
25 import Gargantext.Database.Utils (Cmd)
26 import Gargantext.Database.Schema.NodeNodeNgrams
27 import Gargantext.Database.Types.Node
30 => (a -> Map (NgramsT Ngrams) Int)
32 -> Map (NgramsT Ngrams) (Map NodeId Int)
33 toMaps fun ns = mapNodeIdNgrams $ documentIdWithNgrams fun ns'
35 ns' = map (\(Node nId _ _ _ _ _ json) -> DocumentWithId nId json) ns
37 mapNodeIdNgrams :: Hyperdata a
38 => [DocumentIdWithNgrams a]
39 -> Map (NgramsT Ngrams) (Map NodeId Int)
40 mapNodeIdNgrams ds = DM.map (DM.fromListWith (+)) $ DM.fromListWith (<>) xs
42 xs = [(ng, [(nId, i)]) | (nId, n2i') <- n2i ds, (ng, i) <- DM.toList n2i']
43 n2i = map (\d -> ((documentId . documentWithId) d, document_ngrams d))
46 documentIdWithNgrams :: Hyperdata a
47 => (a -> Map (NgramsT Ngrams) Int)
49 -> [DocumentIdWithNgrams a]
50 documentIdWithNgrams f = map (\d -> DocumentIdWithNgrams d ((f . documentData) d))
53 data DocumentWithId a =
54 DocumentWithId { documentId :: NodeId
59 data DocumentIdWithNgrams a =
61 { documentWithId :: DocumentWithId a
62 , document_ngrams :: Map (NgramsT Ngrams) Int
66 docNgrams2nodeNodeNgrams :: CorpusId
69 docNgrams2nodeNodeNgrams cId (DocNgrams d n nt w) =
70 NodeNodeNgrams cId d n nt w
72 data DocNgrams = DocNgrams { dn_doc_id :: DocId
74 , dn_ngrams_type :: NgramsTypeId
78 insertDocNgramsOn :: CorpusId
81 insertDocNgramsOn cId dn =
83 $ (map (docNgrams2nodeNodeNgrams cId) dn)
85 insertDocNgrams :: CorpusId
86 -> Map NgramsIndexed (Map NgramsType (Map NodeId Int))
88 insertDocNgrams cId m =
89 insertDocNgramsOn cId [ DocNgrams n (_ngramsId ng) (ngramsTypeId t) (fromIntegral i)
90 | (ng, t2n2i) <- DM.toList m
91 , (t, n2i) <- DM.toList t2n2i
92 , (n, i) <- DM.toList n2i