
Commit 8f8fdf1

Merge branch 'dev-rpackage' into 'master'
Beta release 0.1.0
See merge request eoc_foundation_wip/analysis-pipelines!5
2 parents: c8b35bc + ca4cda6

87 files changed: +4203 −2506 lines


DESCRIPTION

16 additions & 10 deletions
```diff
@@ -1,23 +1,29 @@
 Package: analysisPipelines
 Type: Package
-Title: Put analyis reports and pipelines into production
+Title: Compose interoperable analysis pipelines, and put them into production
 Version: 0.1.0
-Authors@R:c(
+Authors@R: c(
     person("Naren","Srinivasan", email = "Naren.Srinivasan@mu-sigma.com", role = c("cre","aut")),
-    person("Neeratyoy","Mallik", email = "Neeratyoy.Mallik@mu-sigma.com", role = c("aut")),
-    person("Sanjay","", email = "Sanjay@mu-sigma.com", role = c("aut")),
-    person("Anoop S","", email = "Anoop.S@mu-sigma.com", role = c("ctb")),
-    person("Vedavyas C","", email = "Vedavyas.C@mu-sigma.com", role = c("ctb"))
+    person("Sanjay","", email = "Sanjay@mu-sigma.com", role = c("ctb")),
+    person("Neeratyoy","Mallik", email = "Neeratyoy.Mallik@mu-sigma.com", role = c("ctb")),
+    person("Anoop S","", email = "Anoop.S@mu-sigma.com", role = c("ctb"))
     )
-Maintainer: Naren Srinivasan <Naren.Srinivasan@mu-sigma.com>
-Description: This package allows data scientists to compose and generate reports as a set of analytical operations. The sequence of generation can be stored as pipelines and reused, specifically for production systems where these tasks are run repetitively. Additionally, the package implements a form of lazy evaluation where the pipelines are run on datasets only when outputs/ reports need to be generated. The package also has functions implemented for working with Spark through SparkR for both traditional Spark jobs on Spark DataFrames, as well as Spark Structured Streaming.
+Description: The package aims at enabling data scientists to compose pipelines of analysis which consist of data manipulation, exploratory analysis & reporting, as well as modeling steps. It also aims to enable data scientists to use tools of their choice through an R interface, and compose interoperable pipelines between R, Spark, and Python.
 Depends: R (>= 3.4.0), tibble, magrittr, data.table, pipeR, devtools
-Imports: ggplot2, dplyr
-Suggests: plotly, knitr, rmarkdown, SparkR
+Imports: ggplot2, dplyr, futile.logger
+Suggests: plotly, knitr, rmarkdown, SparkR, parallel, visNetwork, rjson, DT
 Remotes: github::cran/SparkR
 Encoding: UTF-8
 License: Apache License 2.0
 LazyLoad: yes
 LazyData: yes
 RoxygenNote: 6.0.1
 VignetteBuilder: knitr
+Collate:
+    'analysisPipelines_package.R'
+    'core-functions.R'
+    'core-functions-batch.R'
+    'core-streaming-functions.R'
+    'r-batch-eda-utilities.R'
+    'spark-structured-streaming-utilities.R'
+    'zzz.R'
```
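The updated Description promises lazily evaluated, reusable pipelines. A usage pattern consistent with that description and with the exports in this commit's NAMESPACE might look roughly as follows. This is a hypothetical sketch: `registerFunction`, `AnalysisPipeline`, `generateOutput`, and `savePipeline` are real exports from this commit, but their argument names, the `%>>%` chaining style (pipeR is in Depends), and the sample data are all assumptions, not taken from the commit itself.

```r
library(analysisPipelines)

# Hypothetical sketch -- signatures and data are assumed, not from the commit.

# Register a user-defined function so it becomes available as a pipeline step
meanBySpecies <- function(data) {
  aggregate(Sepal.Length ~ Species, data = data, FUN = mean)
}
registerFunction(functionName = "meanBySpecies")

# Compose a pipeline lazily; per the Description, steps run on the dataset
# only when outputs or reports actually need to be generated
pipelineObj <- AnalysisPipeline(input = iris)
pipelineObj <- pipelineObj %>>% meanBySpecies()

# Trigger evaluation, then persist the pipeline for repetitive production runs
pipelineObj <- generateOutput(pipelineObj)
savePipeline(pipelineObj, path = "mean_by_species_pipeline.RDS")
```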

NAMESPACE

40 additions & 1 deletion
```diff
@@ -1 +1,40 @@
-exportPattern("^[[:alpha:]]+")
+# Generated by roxygen2: do not edit by hand
+
+export(AnalysisPipeline)
+export(BaseAnalysisPipeline)
+export(CheckColumnType)
+export(StreamingAnalysisPipeline)
+export(assessEngineSetUp)
+export(bivarPlots)
+export(castKafkaStreamAsString)
+export(convertKafkaValueFromJson)
+export(correlationMatPlot)
+export(generateReport)
+export(genericPipelineException)
+export(getDatatype)
+export(getInput)
+export(getLoggerDetails)
+export(getOutputById)
+export(getPipeline)
+export(getRegistry)
+export(ignoreCols)
+export(loadPipeline)
+export(loadPredefinedFunctionRegistry)
+export(multiVarOutlierPlot)
+export(outlierPlot)
+export(prepExecution)
+export(registerFunction)
+export(savePipeline)
+export(setInput)
+export(setLoggerDetails)
+export(sparkRSessionCreateIfNotPresent)
+export(univarCatDistPlots)
+export(updateObject)
+export(visualizePipeline)
+exportClasses(AnalysisPipeline)
+exportClasses(BaseAnalysisPipeline)
+exportClasses(StreamingAnalysisPipeline)
+exportMethods(checkSchemaMatch)
+exportMethods(generateOutput)
+exportMethods(initialize)
+import(SparkR)
```
