{-| Module : Main.hs Description : Gargantext Import Corpus Copyright : (c) CNRS, 2017-Present License : AGPL + CECILL v3 Maintainer : team@gargantext.org Stability : experimental Portability : POSIX Import a corpus binary. -} {-# LANGUAGE Strict #-} module Main where import Control.Exception (finally) import Data.Either import Data.Maybe (Maybe(..)) import Data.Text (Text) import System.Environment (getArgs) import qualified Data.Text as Text import Text.Read (readMaybe) import Gargantext.API.Dev (withDevEnv, runCmdDev) import Gargantext.API.Admin.EnvTypes (DevEnv(..)) import Gargantext.API.Node () -- instances import Gargantext.API.Prelude (GargError) import Gargantext.Core (Lang(..)) import Gargantext.Core.Types.Individu (User(..)) import Gargantext.Database.Action.Flow (flowCorpusFile, flowAnnuaire, TermType(..)) import Gargantext.Database.Action.Flow.Types (FlowCmdM) import Gargantext.Database.Admin.Types.Hyperdata (toHyperdataDocument) import Gargantext.Database.Admin.Types.Node (CorpusId) import Gargantext.Database.Prelude (Cmd) import Gargantext.Prelude import Gargantext.Core.Text.Corpus.Parsers (FileFormat(..), FileType(..)) main :: IO () main = do [fun, user, name, iniPath, limit, corpusPath] <- getArgs --{- let --tt = (Unsupervised EN 6 0 Nothing) tt = (Multi EN) format = CsvGargV3 -- CsvHal --WOS limit' = case (readMaybe limit :: Maybe Int) of Nothing -> panic $ "Cannot read limit: " <> (Text.pack limit) Just l -> l corpus :: forall m. FlowCmdM DevEnv GargError m => m CorpusId corpus = flowCorpusFile (UserName $ cs user) (Left (cs name :: Text)) limit' tt format Plain corpusPath Nothing (\_ -> pure ()) corpusCsvHal :: forall m. FlowCmdM DevEnv GargError m => m CorpusId corpusCsvHal = flowCorpusFile (UserName $ cs user) (Left (cs name :: Text)) limit' tt CsvHal Plain corpusPath Nothing (\_ -> pure ()) annuaire :: forall m. FlowCmdM DevEnv GargError m => m CorpusId annuaire = flowAnnuaire (UserName $ cs user) (Left "Annuaire") (Multi EN) corpusPath (\_ -> pure ()) {- let debatCorpus :: forall m. FlowCmdM DevEnv GargError m => m CorpusId debatCorpus = do docs <- liftIO ( splitEvery 500 <$> take (read limit :: Int) <$> readFile corpusPath :: IO [[GrandDebatReference ]] ) flowCorpus (Text.pack user) (Text.pack name) (Multi FR) (map (map toHyperdataDocument) docs) --} withDevEnv iniPath $ \env -> do _ <- if fun == "corpus" then runCmdDev env corpus else pure 0 --(cs "false") _ <- if fun == "corpusCsvHal" then runCmdDev env corpusCsvHal else pure 0 --(cs "false") _ <- if fun == "annuaire" then runCmdDev env annuaire else pure 0 {- _ <- if corpusType == "csv" then runCmdDev env csvCorpus else if corpusType == "debat" then runCmdDev env debatCorpus else panic "corpusType unknown: try \"csv\" or \"debat\"" -} pure ()