The main type is Phylo which is synonym of Phylomemy (only difference is
the number of chars).
-References:
+References:
Chavalarias, D., Cointet, J.-P., 2013. Phylomemetic patterns
in science evolution — the rise and fall of scientific fields. PloS
one 8, e54847.
-}
-{-# LANGUAGE DeriveGeneric #-}
+{-# LANGUAGE DeriveGeneric, DeriveAnyClass #-}
{-# LANGUAGE NoImplicitPrelude #-}
{-# LANGUAGE TemplateHaskell #-}
{-# LANGUAGE MultiParamTypeClasses #-}
module Gargantext.Viz.Phylo where
+import Prelude (Bounded)
import Control.Lens (makeLenses)
-import Data.Aeson.TH (deriveJSON)
+import Data.Aeson.TH (deriveJSON,defaultOptions)
import Data.Maybe (Maybe)
import Data.Text (Text)
import Data.Set (Set)
import Data.Map (Map)
import Data.Vector (Vector)
-import Data.Time.Clock.POSIX (POSIXTime)
+import Data.Swagger
+--import Data.Time.Clock.POSIX (POSIXTime)
import GHC.Generics (Generic)
-import Gargantext.Database.Schema.Ngrams (NgramsId)
-import Gargantext.Core.Utils.Prefix (unPrefix)
+--import Gargantext.Database.Schema.Ngrams (NgramsId)
+import Gargantext.Core.Utils.Prefix (unPrefix, unPrefixSwagger)
+import Gargantext.Text.Context (TermList)
import Gargantext.Prelude
-------------------------------------------------------------------------
-data PhyloExport =
- PhyloExport { _phyloExport_param :: PhyloParam
- , _phyloExport_data :: Phylo
- } deriving (Generic)
+import Control.DeepSeq
--- | .phylo parameters
-data PhyloParam =
- PhyloParam { _phyloParam_version :: Text -- Double ?
- , _phyloParam_software :: Software
- , _phyloParam_params :: Hash
- } deriving (Generic)
+--------------------
+-- | PhyloParam | --
+--------------------
-type Hash = Text
--- | Software
--- TODO move somewhere since it is generic
+-- | Global parameters of a Phylo
+data PhyloParam =
+ PhyloParam { _phyloParam_version :: Text -- Double ?
+ , _phyloParam_software :: Software
+ , _phyloParam_query :: PhyloQueryBuild
+ } deriving (Generic, Show, Eq)
+
+
+-- | Software parameters
data Software =
Software { _software_name :: Text
, _software_version :: Text
- } deriving (Generic)
+ } deriving (Generic, Show, Eq)
+
-------------------------------------------------------------------------
+---------------
+-- | Phylo | --
+---------------
--- | Phylo datatype descriptor of a phylomemy
--- Duration : time Segment of the whole phylomemy (start,end)
--- Ngrams : list of all (possible) terms contained in the phylomemy (with their id)
--- Steps : list of all steps to build the phylomemy
+
+-- | Phylo datatype of a phylomemy
+-- Duration : time Segment of the whole Phylo
+-- Foundations : vector of all the Ngrams contained in a Phylo (build from a list of actants)
+-- Periods : list of all the periods of a Phylo
data Phylo =
- Phylo { _phylo_duration :: (Start, End)
- , _phylo_ngrams :: PhyloNgrams
- , _phylo_periods :: [PhyloPeriod]
- , _phylo_branches :: [PhyloBranch]
+ Phylo { _phylo_duration :: (Start, End)
+ , _phylo_foundations :: PhyloFoundations
+ , _phylo_periods :: [PhyloPeriod]
+ , _phylo_docsByYears :: Map Date Double
+ , _phylo_cooc :: !(Map Date (Map (Int,Int) Double))
+ , _phylo_fis :: !(Map (Date,Date) [PhyloFis])
+ , _phylo_param :: PhyloParam
}
- deriving (Generic, Show)
+ deriving (Generic, Show, Eq)
+
+
+-- | The foundations of a phylomemy created from a given TermList
+data PhyloFoundations =
+ PhyloFoundations { _phylo_foundationsRoots :: Vector Ngrams
+ , _phylo_foundationsTermsList :: TermList
+ } deriving (Generic, Show, Eq)
-- | Date : a simple Integer
type Start = Date
type End = Date
+
+---------------------
+-- | PhyloPeriod | --
+---------------------
+
+
-- | PhyloStep : steps of phylomemy on temporal axis
-- Period: tuple (start date, end date) of the step of the phylomemy
-- Levels: levels of granularity
data PhyloPeriod =
PhyloPeriod { _phylo_periodId :: PhyloPeriodId
, _phylo_periodLevels :: [PhyloLevel]
- }
- deriving (Generic, Show)
+ }
+ deriving (Generic, Show, Eq)
+
+
+--------------------
+-- | PhyloLevel | --
+--------------------
-- | PhyloLevel : levels of phylomemy on level axis
PhyloLevel { _phylo_levelId :: PhyloLevelId
, _phylo_levelGroups :: [PhyloGroup]
}
- deriving (Generic, Show)
+ deriving (Generic, Show, Eq)
+
+
+--------------------
+-- | PhyloGroup | --
+--------------------
-- | PhyloGroup : group of ngrams at each level and step
-- Label : maybe has a label as text
-- Ngrams: set of terms that build the group
--- Quality : map of measures (support, etc.) that depict some qualitative aspects of a phylo
+-- Quality : map of measures (support, etc.) that depict some qualitative aspects of a phylo
-- Period Parents|Childs: weighted link to Parents|Childs (Temporal Period axis)
-- Level Parents|Childs: weighted link to Parents|Childs (Level Granularity axis)
-- Pointers are directed link from Self to any PhyloGroup (/= Self ?)
PhyloGroup { _phylo_groupId :: PhyloGroupId
, _phylo_groupLabel :: Text
, _phylo_groupNgrams :: [Int]
- , _phylo_groupQuality :: Map Text Double
- , _phylo_groupCooc :: Map (Int, Int) Double
-
+ , _phylo_groupNgramsMeta :: Map Text [Double]
+ , _phylo_groupMeta :: Map Text Double
+ , _phylo_groupBranchId :: Maybe PhyloBranchId
+ , _phylo_groupCooc :: !(Map (Int,Int) Double)
+
, _phylo_groupPeriodParents :: [Pointer]
, _phylo_groupPeriodChilds :: [Pointer]
-
+
, _phylo_groupLevelParents :: [Pointer]
, _phylo_groupLevelChilds :: [Pointer]
}
- deriving (Generic, Show, Eq, Ord)
+ deriving (Generic, NFData, Show, Eq, Ord)
-data PhyloBranch =
- PhyloBranch { _phylo_branchId :: (Level,Int)
- , _phylo_branchLabel :: Text
- , _phylo_branchGroups :: [PhyloGroupId]
- }
- deriving (Generic, Show)
+-- instance NFData PhyloGroup
--- | Level : A level of aggregation (-1 = Txt, 0 = Ngrams, 1 = Fis, [2..] = Cluster)
-type Level = Int
+-- | Level : A level of aggregation (-1 = Txt, 0 = Ngrams, 1 = Fis, [2..] = Cluster)
+type Level = Int
-- | Index : A generic index of an element (PhyloGroup, PhyloBranch, etc) in a given List
type Index = Int
type Weight = Double
-- | Pointer : A weighted linked with a given PhyloGroup
type Pointer = (PhyloGroupId, Weight)
-
-
-- | Ngrams : a contiguous sequence of n terms
type Ngrams = Text
--- | PhyloNgrams : Vector of all the Ngrams (PhyloGroup of level -1) used within a Phylo
-type PhyloNgrams = Vector Ngrams
--- | Clique : Set of ngrams cooccurring in the same Document
-type Clique = Set Ngrams
--- | Support : Number of Documents where a Clique occurs
-type Support = Int
--- | Fis : Frequent Items Set (ie: the association between a Clique and a Support)
-type Fis = (Clique,Support)
+--------------------
+-- | Aggregates | --
+--------------------
-- | Document : a piece of Text linked to a Date
data Document = Document
{ date :: Date
- , text :: Text
- } deriving (Show)
-
+ , text :: [Ngrams]
+ } deriving (Show,Generic,NFData)
-type Cluster = [PhyloGroup]
+-- | Clique : Set of ngrams cooccurring in the same Document
+type Clique = Set Ngrams
+-- | Support : Number of Documents where a Clique occurs
+type Support = Int
+-- | Fis : Frequent Items Set (ie: the association between a Clique and a Support)
+data PhyloFis = PhyloFis
+ { _phyloFis_clique :: Clique
+ , _phyloFis_support :: Support
+ , _phyloFis_period :: (Date,Date)
+ } deriving (Generic,NFData,Show,Eq)
+
+-- | A list of clustered PhyloGroup
+type PhyloCluster = [PhyloGroup]
+
+
+-- | A PhyloGroup in a Graph
+type GroupNode = PhyloGroup
+-- | A weighted links between two PhyloGroups in a Graph
+type GroupEdge = ((PhyloGroup,PhyloGroup),Weight)
+-- | The association as a Graph between a list of Nodes and a list of Edges
+type GroupGraph = ([GroupNode],[GroupEdge])
--- | A List of PhyloGroup in a PhyloGraph
-type PhyloNodes = [PhyloGroup]
--- | A List of weighted links between some PhyloGroups in a PhyloGraph
-type PhyloEdges = [((PhyloGroup,PhyloGroup),Weight)]
--- | The association as a Graph between a list of Nodes and a list of Edges
-type PhyloGraph = (PhyloNodes,PhyloEdges)
+---------------
+-- | Error | --
+---------------
data PhyloError = LevelDoesNotExist
| LevelUnassigned
- deriving (Show)
+ deriving (Show)
--- | A List of Proximity mesures or strategies
-data Proximity = WeightedLogJaccard | Hamming | FromPairs
--- | A List of Clustering methods
-data Clustering = Louvain | RelatedComponents
+-----------------
+-- | Cluster | --
+-----------------
-data PairTo = Childs | Parents
+-- | Cluster constructors
+data Cluster = Fis FisParams
+ | RelatedComponents RCParams
+ | Louvain LouvainParams
+ deriving (Generic, Show, Eq, Read)
+
+-- | Parameters for Fis clustering
+data FisParams = FisParams
+ { _fis_keepMinorFis :: Bool
+ , _fis_minSupport :: Support
+ , _fis_minSize :: Int
+ } deriving (Generic, Show, Eq, Read)
+
+-- | Parameters for RelatedComponents clustering
+data RCParams = RCParams
+ { _rc_proximity :: Proximity } deriving (Generic, Show, Eq, Read)
+
+-- | Parameters for Louvain clustering
+data LouvainParams = LouvainParams
+ { _louvain_proximity :: Proximity } deriving (Generic, Show, Eq, Read)
+
+
+-------------------
+-- | Proximity | --
+-------------------
+
+
+-- | Proximity constructors
+data Proximity = WeightedLogJaccard WLJParams
+ | Hamming HammingParams
+ | Filiation
+ deriving (Generic, Show, Eq, Read)
+
+-- | Parameters for WeightedLogJaccard proximity
+data WLJParams = WLJParams
+ { _wlj_threshold :: Double
+ , _wlj_sensibility :: Double
+ } deriving (Generic, Show, Eq, Read)
+
+-- | Parameters for Hamming proximity
+data HammingParams = HammingParams
+ { _hamming_threshold :: Double } deriving (Generic, Show, Eq, Read)
+
+
+----------------
+-- | Filter | --
+----------------
+
+
+-- | Filter constructors
+data Filter = LonelyBranch LBParams
+ | SizeBranch SBParams
+ deriving (Generic, Show, Eq)
+
+-- | Parameters for LonelyBranch filter
+data LBParams = LBParams
+ { _lb_periodsInf :: Int
+ , _lb_periodsSup :: Int
+ , _lb_minNodes :: Int } deriving (Generic, Show, Eq)
+
+-- | Parameters for SizeBranch filter
+data SBParams = SBParams
+ { _sb_minSize :: Int } deriving (Generic, Show, Eq)
+
+
+----------------
+-- | Metric | --
+----------------
+
+
+-- | Metric constructors
+data Metric = BranchAge | BranchBirth | BranchGroups deriving (Generic, Show, Eq, Read)
+
+
+----------------
+-- | Tagger | --
+----------------
+
+
+-- | Tagger constructors
+data Tagger = BranchPeakFreq | BranchPeakCooc | BranchPeakInc
+ | GroupLabelCooc | GroupLabelInc | GroupLabelIncDyn deriving (Show,Generic,Read)
+
+
+--------------
+-- | Sort | --
+--------------
+
+
+-- | Sort constructors
+data Sort = ByBranchAge | ByBranchBirth deriving (Generic, Show, Read, Enum, Bounded)
+data Order = Asc | Desc deriving (Generic, Show, Read)
+
+
+--------------------
+-- | PhyloQuery | --
+--------------------
+
+
+-- | A Phyloquery describes a phylomemic reconstruction
+data PhyloQueryBuild = PhyloQueryBuild
+ { _q_phyloTitle :: Text
+ , _q_phyloDesc :: Text
+
+ -- Grain and Steps for the PhyloPeriods
+ , _q_periodGrain :: Int
+ , _q_periodSteps :: Int
+
+ -- Clustering method for building the contextual unit of Phylo (ie: level 1)
+ , _q_contextualUnit :: Cluster
+ , _q_contextualUnitMetrics :: [Metric]
+ , _q_contextualUnitFilters :: [Filter]
+
+ -- Inter-temporal matching method of the Phylo
+ , _q_interTemporalMatching :: Proximity
+ , _q_interTemporalMatchingFrame :: Int
+ , _q_interTemporalMatchingFrameTh :: Double
+
+ , _q_reBranchThr :: Double
+ , _q_reBranchNth :: Int
+
+ -- Last level of reconstruction
+ , _q_nthLevel :: Level
+ -- Clustering method used from level 1 to nthLevel
+ , _q_nthCluster :: Cluster
+ } deriving (Generic, Show, Eq)
+
+-- | To choose the Phylo edge you want to export : --> <-- <--> <=>
+data Filiation = Ascendant | Descendant | Merge | Complete deriving (Generic, Show, Read)
+data EdgeType = PeriodEdge | LevelEdge deriving (Generic, Show, Eq)
+
+-------------------
+-- | PhyloView | --
+-------------------
+
+
+-- | A PhyloView is the output type of a Phylo
+data PhyloView = PhyloView
+ { _pv_param :: PhyloParam
+ , _pv_title :: Text
+ , _pv_description :: Text
+ , _pv_filiation :: Filiation
+ , _pv_level :: Level
+ , _pv_periods :: [PhyloPeriodId]
+ , _pv_metrics :: Map Text [Double]
+ , _pv_branches :: [PhyloBranch]
+ , _pv_nodes :: [PhyloNode]
+ , _pv_edges :: [PhyloEdge]
+ } deriving (Generic, Show)
+
+-- | A phyloview is made of PhyloBranches, edges and nodes
+data PhyloBranch = PhyloBranch
+ { _pb_id :: PhyloBranchId
+ , _pb_peak :: Text
+ , _pb_metrics :: Map Text [Double]
+ } deriving (Generic, Show)
+
+data PhyloEdge = PhyloEdge
+ { _pe_source :: PhyloGroupId
+ , _pe_target :: PhyloGroupId
+ , _pe_type :: EdgeType
+ , _pe_weight :: Weight
+ } deriving (Generic, Show)
+
+data PhyloNode = PhyloNode
+ { _pn_id :: PhyloGroupId
+ , _pn_bid :: Maybe PhyloBranchId
+ , _pn_label :: Text
+ , _pn_idx :: [Int]
+ , _pn_ngrams :: Maybe [Ngrams]
+ , _pn_metrics :: Map Text [Double]
+ , _pn_cooc :: Map (Int,Int) Double
+ , _pn_parents :: Maybe [PhyloGroupId]
+ , _pn_childs :: [PhyloNode]
+ } deriving (Generic, Show)
+
+------------------------
+-- | PhyloQueryView | --
+------------------------
+
+
+data ExportMode = Json | Dot | Svg
+ deriving (Generic, Show, Read)
+data DisplayMode = Flat | Nested
+ deriving (Generic, Show, Read)
+
+-- | A PhyloQueryView describes a Phylo as an output view
+data PhyloQueryView = PhyloQueryView
+ { _qv_lvl :: Level
+
+ -- Does the PhyloGraph contain ascendant, descendant or a complete Filiation ? Complet redondant et merge (avec le max)
+ , _qv_filiation :: Filiation
+
+ -- Does the PhyloGraph contain some levelChilds ? How deep must it go ?
+ , _qv_levelChilds :: Bool
+ , _qv_levelChildsDepth :: Level
+
+ -- Ordered lists of filters, taggers and metrics to be applied to the PhyloGraph
+ -- Firstly the metrics, then the filters and the taggers
+ , _qv_metrics :: [Metric]
+ , _qv_filters :: [Filter]
+ , _qv_taggers :: [Tagger]
+
+ -- An asc or desc sort to apply to the PhyloGraph
+ , _qv_sort :: Maybe (Sort,Order)
+
+ -- A display mode to apply to the PhyloGraph, ie: [Node[Node,Edge],Edge] or [[Node,Node],[Edge,Edge]]
+ , _qv_export :: ExportMode
+ , _qv_display :: DisplayMode
+ , _qv_verbose :: Bool
+ }
+
+
+----------------
+-- | Lenses | --
+----------------
+
--- | Lenses
-makeLenses ''Phylo
makeLenses ''PhyloParam
-makeLenses ''PhyloExport
makeLenses ''Software
+--
+makeLenses ''Phylo
+makeLenses ''PhyloFoundations
makeLenses ''PhyloGroup
makeLenses ''PhyloLevel
makeLenses ''PhyloPeriod
+makeLenses ''PhyloFis
+--
+makeLenses ''Proximity
+makeLenses ''Cluster
+makeLenses ''Filter
+--
+makeLenses ''PhyloQueryBuild
+makeLenses ''PhyloQueryView
+--
+makeLenses ''PhyloView
makeLenses ''PhyloBranch
+makeLenses ''PhyloNode
+makeLenses ''PhyloEdge
--- | JSON instances
-$(deriveJSON (unPrefix "_phylo_" ) ''Phylo )
-$(deriveJSON (unPrefix "_phylo_period" ) 'PhyloPeriod )
+
+------------------------
+-- | JSON instances | --
+------------------------
+
+
+$(deriveJSON (unPrefix "_phylo_" ) ''Phylo )
+$(deriveJSON (unPrefix "_phylo_foundations" ) ''PhyloFoundations )
+$(deriveJSON (unPrefix "_phylo_period" ) ''PhyloPeriod )
$(deriveJSON (unPrefix "_phylo_level" ) ''PhyloLevel )
$(deriveJSON (unPrefix "_phylo_group" ) ''PhyloGroup )
-$(deriveJSON (unPrefix "_phylo_branch" ) ''PhyloBranch )
---
+$(deriveJSON (unPrefix "_phyloFis_" ) ''PhyloFis )
+--
$(deriveJSON (unPrefix "_software_" ) ''Software )
$(deriveJSON (unPrefix "_phyloParam_" ) ''PhyloParam )
-$(deriveJSON (unPrefix "_phyloExport_" ) ''PhyloExport )
-
--- | TODO XML instances
+--
+$(deriveJSON defaultOptions ''Filter )
+$(deriveJSON defaultOptions ''Metric )
+$(deriveJSON defaultOptions ''Cluster )
+$(deriveJSON defaultOptions ''Proximity )
+--
+$(deriveJSON (unPrefix "_fis_" ) ''FisParams )
+$(deriveJSON (unPrefix "_hamming_" ) ''HammingParams )
+$(deriveJSON (unPrefix "_louvain_" ) ''LouvainParams )
+$(deriveJSON (unPrefix "_rc_" ) ''RCParams )
+$(deriveJSON (unPrefix "_wlj_" ) ''WLJParams )
+--
+$(deriveJSON (unPrefix "_lb_" ) ''LBParams )
+$(deriveJSON (unPrefix "_sb_" ) ''SBParams )
+--
+$(deriveJSON (unPrefix "_q_" ) ''PhyloQueryBuild )
+$(deriveJSON (unPrefix "_pv_" ) ''PhyloView )
+$(deriveJSON (unPrefix "_pb_" ) ''PhyloBranch )
+$(deriveJSON (unPrefix "_pe_" ) ''PhyloEdge )
+$(deriveJSON (unPrefix "_pn_" ) ''PhyloNode )
+
+$(deriveJSON defaultOptions ''Filiation )
+$(deriveJSON defaultOptions ''EdgeType )
+
+---------------------------
+-- | Swagger instances | --
+---------------------------
+
+instance ToSchema Phylo where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_phylo_")
+instance ToSchema PhyloFoundations where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_phylo_foundations")
+instance ToSchema PhyloPeriod where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_phylo_period")
+instance ToSchema PhyloLevel where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_phylo_level")
+instance ToSchema PhyloGroup where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_phylo_group")
+instance ToSchema PhyloFis where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_phyloFis_")
+instance ToSchema Software where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_software_")
+instance ToSchema PhyloParam where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_phyloParam_")
+instance ToSchema Filter
+instance ToSchema Metric
+instance ToSchema Cluster
+instance ToSchema Proximity where
+ declareNamedSchema = genericDeclareNamedSchemaUnrestricted defaultSchemaOptions
+instance ToSchema FisParams where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_fis_")
+instance ToSchema HammingParams where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_hamming_")
+instance ToSchema LouvainParams where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_louvain_")
+instance ToSchema RCParams where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_rc_")
+instance ToSchema WLJParams where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_wlj_")
+instance ToSchema LBParams where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_lb_")
+instance ToSchema SBParams where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_sb_")
+instance ToSchema PhyloQueryBuild where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_q_")
+instance ToSchema PhyloView where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_pv_")
+instance ToSchema PhyloBranch where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_pb_")
+instance ToSchema PhyloEdge where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_pe_")
+instance ToSchema PhyloNode where
+ declareNamedSchema = genericDeclareNamedSchema (unPrefixSwagger "_pn_")
+instance ToSchema Filiation
+instance ToSchema EdgeType
+
+----------------------------
+-- | TODO XML instances | --
+----------------------------