From 284fcd7b56b8fe934438bfd290ca1cb2ee79bf22 Mon Sep 17 00:00:00 2001 From: "pieths.dev@gmail.com" Date: Fri, 17 Jan 2020 09:46:15 -0800 Subject: [PATCH 01/34] Use latest ML.Net dev packages from MachineLearning feed. --- nuget.config | 3 ++- src/DotNetBridge/DotNetBridge.csproj | 22 +++++++++---------- src/Platforms/build.csproj | 22 +++++++++---------- .../internal/core/timeseries/ssaforecaster.py | 2 +- ...iesprocessingentrypoints_ssaforecasting.py | 2 +- ...eneralizedadditivemodelbinaryclassifier.py | 2 +- ...iners_generalizedadditivemodelregressor.py | 2 +- .../trainers_logisticregressionclassifier.py | 2 +- .../transforms_missingvaluehandler.py | 2 +- .../nimbusml/timeseries/ssaforecaster.py | 2 +- src/python/tools/manifest.json | 10 ++++----- 11 files changed, 36 insertions(+), 35 deletions(-) diff --git a/nuget.config b/nuget.config index cedba361..1d7d1de7 100644 --- a/nuget.config +++ b/nuget.config @@ -4,7 +4,8 @@ - + + diff --git a/src/DotNetBridge/DotNetBridge.csproj b/src/DotNetBridge/DotNetBridge.csproj index 00688f17..e00969a5 100644 --- a/src/DotNetBridge/DotNetBridge.csproj +++ b/src/DotNetBridge/DotNetBridge.csproj @@ -32,17 +32,17 @@ all runtime; build; native; contentfiles; analyzers - - - - - - - - - - - + + + + + + + + + + + diff --git a/src/Platforms/build.csproj b/src/Platforms/build.csproj index ef1b03d4..81b80d14 100644 --- a/src/Platforms/build.csproj +++ b/src/Platforms/build.csproj @@ -11,17 +11,17 @@ - - - - - - - - - - - + + + + + + + + + + + diff --git a/src/python/nimbusml/internal/core/timeseries/ssaforecaster.py b/src/python/nimbusml/internal/core/timeseries/ssaforecaster.py index ce9064b5..f1ee5f6b 100644 --- a/src/python/nimbusml/internal/core/timeseries/ssaforecaster.py +++ b/src/python/nimbusml/internal/core/timeseries/ssaforecaster.py @@ -38,7 +38,7 @@ class SsaForecaster(BasePipelineItem, DefaultSignature): :param series_length: The length of series that is kept in buffer for modeling (parameter N). - :param train_size: The length of series from the begining used for + :param train_size: The length of series from the beginning used for training. :param horizon: The number of values to forecast. diff --git a/src/python/nimbusml/internal/entrypoints/timeseriesprocessingentrypoints_ssaforecasting.py b/src/python/nimbusml/internal/entrypoints/timeseriesprocessingentrypoints_ssaforecasting.py index f02da3a7..1684783c 100644 --- a/src/python/nimbusml/internal/entrypoints/timeseriesprocessingentrypoints_ssaforecasting.py +++ b/src/python/nimbusml/internal/entrypoints/timeseriesprocessingentrypoints_ssaforecasting.py @@ -43,7 +43,7 @@ def timeseriesprocessingentrypoints_ssaforecasting( building the trajectory matrix (parameter L). (inputs). :param series_length: The length of series that is kept in buffer for modeling (parameter N). (inputs). - :param train_size: The length of series from the begining used + :param train_size: The length of series from the beginning used for training. (inputs). :param horizon: The number of values to forecast. (inputs). 
:param confidence_level: The confidence level in [0, 1) for diff --git a/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelbinaryclassifier.py b/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelbinaryclassifier.py index e5b62a23..5c281338 100644 --- a/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelbinaryclassifier.py +++ b/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelbinaryclassifier.py @@ -36,7 +36,7 @@ def trainers_generalizedadditivemodelbinaryclassifier( **Description** Trains a gradient boosted stump per feature, on all features simultaneously, to fit target values using least-squares. It - mantains no interactions between features. + maintains no interactions between features. :param number_of_iterations: Total number of iterations over all features (inputs). diff --git a/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelregressor.py b/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelregressor.py index 1c56a706..2b9334f8 100644 --- a/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelregressor.py +++ b/src/python/nimbusml/internal/entrypoints/trainers_generalizedadditivemodelregressor.py @@ -36,7 +36,7 @@ def trainers_generalizedadditivemodelregressor( **Description** Trains a gradient boosted stump per feature, on all features simultaneously, to fit target values using least-squares. It - mantains no interactions between features. + maintains no interactions between features. :param number_of_iterations: Total number of iterations over all features (inputs). diff --git a/src/python/nimbusml/internal/entrypoints/trainers_logisticregressionclassifier.py b/src/python/nimbusml/internal/entrypoints/trainers_logisticregressionclassifier.py index 5db498b1..61759e4d 100644 --- a/src/python/nimbusml/internal/entrypoints/trainers_logisticregressionclassifier.py +++ b/src/python/nimbusml/internal/entrypoints/trainers_logisticregressionclassifier.py @@ -33,7 +33,7 @@ def trainers_logisticregressionclassifier( **params): """ **Description** - Maximum entrypy classification is a method in statistics used to + Maximum entropy classification is a method in statistics used to predict the probabilities of parallel events. The model predicts the probabilities of parallel events by fitting data to a softmax function. diff --git a/src/python/nimbusml/internal/entrypoints/transforms_missingvaluehandler.py b/src/python/nimbusml/internal/entrypoints/transforms_missingvaluehandler.py index 1f1a3870..121115b4 100644 --- a/src/python/nimbusml/internal/entrypoints/transforms_missingvaluehandler.py +++ b/src/python/nimbusml/internal/entrypoints/transforms_missingvaluehandler.py @@ -21,7 +21,7 @@ def transforms_missingvaluehandler( **Description** Handle missing values by replacing them with either the default value or the mean/min/max value (for non-text columns only). An - indicator column can optionally be concatenated, if theinput + indicator column can optionally be concatenated, if the input column type is numeric. 
:param column: New column definition(s) (optional form: diff --git a/src/python/nimbusml/timeseries/ssaforecaster.py b/src/python/nimbusml/timeseries/ssaforecaster.py index 3cbe540f..35516d15 100644 --- a/src/python/nimbusml/timeseries/ssaforecaster.py +++ b/src/python/nimbusml/timeseries/ssaforecaster.py @@ -41,7 +41,7 @@ class SsaForecaster(core, BaseTransform, TransformerMixin): :param series_length: The length of series that is kept in buffer for modeling (parameter N). - :param train_size: The length of series from the begining used for + :param train_size: The length of series from the beginning used for training. :param horizon: The number of values to forecast. diff --git a/src/python/tools/manifest.json b/src/python/tools/manifest.json index e54ff2c2..fdc99a12 100644 --- a/src/python/tools/manifest.json +++ b/src/python/tools/manifest.json @@ -3981,7 +3981,7 @@ { "Name": "TrainSize", "Type": "Int", - "Desc": "The length of series from the begining used for training.", + "Desc": "The length of series from the beginning used for training.", "Required": true, "SortOrder": 2.0, "IsNullable": false, @@ -10418,7 +10418,7 @@ }, { "Name": "Trainers.GeneralizedAdditiveModelBinaryClassifier", - "Desc": "Trains a gradient boosted stump per feature, on all features simultaneously, to fit target values using least-squares. It mantains no interactions between features.", + "Desc": "Trains a gradient boosted stump per feature, on all features simultaneously, to fit target values using least-squares. It maintains no interactions between features.", "FriendlyName": "Generalized Additive Model for Binary Classification", "ShortName": "gam", "Inputs": [ @@ -10718,7 +10718,7 @@ }, { "Name": "Trainers.GeneralizedAdditiveModelRegressor", - "Desc": "Trains a gradient boosted stump per feature, on all features simultaneously, to fit target values using least-squares. It mantains no interactions between features.", + "Desc": "Trains a gradient boosted stump per feature, on all features simultaneously, to fit target values using least-squares. It maintains no interactions between features.", "FriendlyName": "Generalized Additive Model for Regression", "ShortName": "gamr", "Inputs": [ @@ -13739,7 +13739,7 @@ }, { "Name": "Trainers.LogisticRegressionClassifier", - "Desc": "Maximum entrypy classification is a method in statistics used to predict the probabilities of parallel events. The model predicts the probabilities of parallel events by fitting data to a softmax function.", + "Desc": "Maximum entropy classification is a method in statistics used to predict the probabilities of parallel events. The model predicts the probabilities of parallel events by fitting data to a softmax function.", "FriendlyName": "Multi-class Logistic Regression", "ShortName": "mlr", "Inputs": [ @@ -20637,7 +20637,7 @@ }, { "Name": "Transforms.MissingValueHandler", - "Desc": "Handle missing values by replacing them with either the default value or the mean/min/max value (for non-text columns only). An indicator column can optionally be concatenated, if theinput column type is numeric.", + "Desc": "Handle missing values by replacing them with either the default value or the mean/min/max value (for non-text columns only). 
An indicator column can optionally be concatenated, if the input column type is numeric.",
     "FriendlyName": "NA Handle Transform",
     "ShortName": "NAHandle",
     "Inputs": [

From ad00b7077385ce4bc975d8c058ca9b6126b4046f Mon Sep 17 00:00:00 2001
From: "pieths.dev@gmail.com"
Date: Fri, 17 Jan 2020 10:21:22 -0800
Subject: [PATCH 02/34] Re-enable the default nuget.org feed.

It does not appear to cause any conflicts with getting the latest
packages so long as the * is used in the PackageReference Version
attributes. Keeping this enabled will allow other packages which
are not part of the MachineLearning feed to be retrieved
(i.e. Microsoft.MLFeaturizers).
---
 nuget.config | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/nuget.config b/nuget.config
index 1d7d1de7..2f64d057 100644
--- a/nuget.config
+++ b/nuget.config
@@ -4,7 +4,7 @@
-
+

From 258a799be5af21e25087af093672206f937e9d30 Mon Sep 17 00:00:00 2001
From: "pieths.dev@gmail.com"
Date: Tue, 21 Jan 2020 11:14:11 -0800
Subject: [PATCH 03/34] Add whitespace change to restart CI build.

Linux timed out.
---
 nuget.config | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/nuget.config b/nuget.config
index 2f64d057..c0efdcaa 100644
--- a/nuget.config
+++ b/nuget.config
@@ -5,7 +5,7 @@
-
+

From c542c1d982393388b024adfeea705c774a632d99 Mon Sep 17 00:00:00 2001
From: "pieths.dev@gmail.com"
Date: Tue, 21 Jan 2020 13:39:40 -0800
Subject: [PATCH 04/34] Fix build issue when using pip version >= 20.0.0

---
 build.cmd | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/build.cmd b/build.cmd
index f2da6cfa..36ba13ef 100644
--- a/build.cmd
+++ b/build.cmd
@@ -387,7 +387,7 @@ if "%InstallPythonPackages%" == "True" (
 echo "#################################"
 echo "Installing python packages ...
" echo "#################################" - call "%PythonExe%" -m pip install --upgrade pip + call "%PythonExe%" -m pip install --upgrade "pip==19.3.1" call "%PythonExe%" -m pip install --upgrade nose pytest pytest-xdist graphviz imageio pytest-cov "jupyter_client>=4.4.0" "nbconvert>=4.2.0" if %PythonVersion% == 2.7 ( From 5feb56dc01f6d3cfdb1de8ad0c2c0123c3853ae8 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 25 Mar 2020 16:57:36 -0700 Subject: [PATCH 05/34] preview3 --- src/DotNetBridge/DotNetBridge.csproj | 26 +++++++++++++------------- src/Platforms/build.csproj | 26 +++++++++++++------------- 2 files changed, 26 insertions(+), 26 deletions(-) diff --git a/src/DotNetBridge/DotNetBridge.csproj b/src/DotNetBridge/DotNetBridge.csproj index f07b6845..1132f5f2 100644 --- a/src/DotNetBridge/DotNetBridge.csproj +++ b/src/DotNetBridge/DotNetBridge.csproj @@ -32,20 +32,20 @@ all runtime; build; native; contentfiles; analyzers - - - - - - - - + + + + + + + + - - - - - + + + + + diff --git a/src/Platforms/build.csproj b/src/Platforms/build.csproj index 647fd6e7..3705a235 100644 --- a/src/Platforms/build.csproj +++ b/src/Platforms/build.csproj @@ -21,20 +21,20 @@ - - - - - - - + + + + + + + - - - - - - + + + + + + From fed9aa2c417bc1ac8be7ad90bd9480051049c057 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Thu, 26 Mar 2020 08:16:27 -0700 Subject: [PATCH 06/34] fix signing --- build.cmd | 17 ++++++++++------- .../tests_extended/test_export_to_onnx.py | 18 ++++++++++++++++-- 2 files changed, 26 insertions(+), 9 deletions(-) diff --git a/build.cmd b/build.cmd index 271599f6..62e716b6 100644 --- a/build.cmd +++ b/build.cmd @@ -184,12 +184,20 @@ if "%AzureBuild%" == "True" ( :: Build managed code echo "" echo "#################################" -echo "Building DotNet Bridge ... " +echo "Building Managed code ... " echo "#################################" set _dotnet=%_dotnetRoot%\dotnet.exe +if "%Configuration:~-5%" == "Py3.7" set VerifyManifest=True +if "%VerifyManifest%" == "True" set BuildManifestGenerator=True +if "%UpdateManifest%" == "True" set BuildManifestGenerator=True + if "%SkipDotNetBridge%" == "False" ( call "%_dotnet%" build -c %Configuration% -o "%BuildOutputDir%%Configuration%" --force "%__currentScriptDir%src\DotNetBridge\DotNetBridge.csproj" +) else ( + set VerifyManifest=False + set UpdateManifest=False + set BuildManifestGenerator=False ) if "%BuildDotNetBridgeOnly%" == "True" ( exit /b %ERRORLEVEL% @@ -197,11 +205,6 @@ if "%BuildDotNetBridgeOnly%" == "True" ( call "%_dotnet%" build -c %Configuration% --force "%__currentScriptDir%src\Platforms\build.csproj" call "%_dotnet%" publish "%__currentScriptDir%src\Platforms\build.csproj" --force --self-contained -r win-x64 -c %Configuration% - -if "%Configuration:~-5%" == "Py3.7" set VerifyManifest=True -if "%VerifyManifest%" == "True" set BuildManifestGenerator=True -if "%UpdateManifest%" == "True" set BuildManifestGenerator=True - if "%BuildManifestGenerator%" == "True" ( echo "" echo "#################################" @@ -255,7 +258,7 @@ if not exist "%BoostRoot%\.done" ( echo "" echo "#################################" -echo "Building Native Bridge ... " +echo "Building Native code ... " echo "#################################" :: Setting native code build environment echo Setting native build environment ... 
diff --git a/src/python/tests_extended/test_export_to_onnx.py b/src/python/tests_extended/test_export_to_onnx.py index c96e6988..4749fb3a 100644 --- a/src/python/tests_extended/test_export_to_onnx.py +++ b/src/python/tests_extended/test_export_to_onnx.py @@ -361,8 +361,22 @@ 'LogisticRegressionBinaryClassifier': {'cols': [('PredictedLabel', 'PredictedLabel', 'PredictedLabel.output')]}, 'LogisticRegressionClassifier': {'cols': [('PredictedLabel', 'PredictedLabel', 'PredictedLabel.output')]}, 'LpScaler': {'num_cols': 10, 'cols': 0}, - 'MeanVarianceScaler': {'num_cols': 5, 'cols': 0}, - 'MinMaxScaler': {'num_cols': 5, 'cols': 0}, + 'MeanVarianceScaler': { + 'num_cols': 5, + 'cols': [('Petal_Length', 'Petal_Length', 'Petal_Length.output'), + ('Petal_Width', 'Petal_Width', 'Petal_Width.output'), + ('Sepal_Length', 'Sepal_Length', 'Sepal_Length.output'), + ('Sepal_Width', 'Sepal_Width', 'Sepal_Width.output'), + ('Setosa', 'Setosa', 'Setosa.output')] + }, + 'MinMaxScaler': { + 'num_cols': 5, + 'cols': [('Petal_Length', 'Petal_Length', 'Petal_Length.output'), + ('Petal_Width', 'Petal_Width', 'Petal_Width.output'), + ('Sepal_Length', 'Sepal_Length', 'Sepal_Length.output'), + ('Sepal_Width', 'Sepal_Width', 'Sepal_Width.output'), + ('Setosa', 'Setosa', 'Setosa.output')] + }, 'MutualInformationSelector': {'num_cols': 8, 'cols': 0}, 'NGramFeaturizer': {'num_cols': 273, 'cols': 0}, 'NaiveBayesClassifier': {'cols': [('PredictedLabel', 'PredictedLabel', 'PredictedLabel.output')]}, From 039356abd979305883b8b209c9750231b26da9b3 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Thu, 26 Mar 2020 08:30:12 -0700 Subject: [PATCH 07/34] run ep only if VerifyManifest --- build.cmd | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/build.cmd b/build.cmd index 62e716b6..95fc02d3 100644 --- a/build.cmd +++ b/build.cmd @@ -334,7 +334,7 @@ if exist %libs% rd %libs% /S /Q md %libs% echo.>"%__currentScriptDir%src\python\nimbusml\internal\libs\__init__.py" -if %PythonVersion% == 3.7 ( +if "%VerifyManifest%" == "True" ( :: Running the check in one python is enough. Entrypoint compiler doesn't run in py2.7. echo Generating low-level Python API from mainifest.json ... 
call "%PythonExe%" -m pip install --upgrade autopep8 autoflake isort jinja2 From cbe0e75e9678f4a21721eac0762010ba95d1d385 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 31 Mar 2020 12:51:56 -0700 Subject: [PATCH 08/34] draft of timeseries transforms --- src/python/nimbusml.pyproj | 17 + .../timeseries/analyticalrollingwindow.py | 75 +++ .../core/timeseries/forecastingpivot.py | 50 ++ .../core/timeseries/lagleadoperator.py | 66 ++ .../internal/core/timeseries/shortdrop.py | 70 +++ .../core/timeseries/simplerollingwindow.py | 75 +++ ...partitionedpathparser_parquetpathparser.py | 26 + ..._partitionedpathparser_simplepathparser.py | 71 +++ .../transforms_analyticalrollingwindow.py | 103 +++ .../transforms_forecastingpivot.py | 64 ++ .../entrypoints/transforms_lagleadoperator.py | 88 +++ .../entrypoints/transforms_shortdrop.py | 95 +++ .../transforms_simplerollingwindow.py | 105 ++++ .../timeseries/analyticalrollingwindow.py | 77 +++ .../nimbusml/timeseries/forecastingpivot.py | 54 ++ .../nimbusml/timeseries/lagleadoperator.py | 66 ++ src/python/nimbusml/timeseries/shortdrop.py | 70 +++ .../timeseries/simplerollingwindow.py | 74 +++ src/python/tools/manifest.json | 594 +++++++++++++++++- src/python/tools/manifest_diff.json | 30 + 20 files changed, 1868 insertions(+), 2 deletions(-) create mode 100644 src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py create mode 100644 src/python/nimbusml/internal/core/timeseries/forecastingpivot.py create mode 100644 src/python/nimbusml/internal/core/timeseries/lagleadoperator.py create mode 100644 src/python/nimbusml/internal/core/timeseries/shortdrop.py create mode 100644 src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py create mode 100644 src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py create mode 100644 src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py create mode 100644 src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py create mode 100644 src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py create mode 100644 src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py create mode 100644 src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py create mode 100644 src/python/nimbusml/internal/entrypoints/transforms_simplerollingwindow.py create mode 100644 src/python/nimbusml/timeseries/analyticalrollingwindow.py create mode 100644 src/python/nimbusml/timeseries/forecastingpivot.py create mode 100644 src/python/nimbusml/timeseries/lagleadoperator.py create mode 100644 src/python/nimbusml/timeseries/shortdrop.py create mode 100644 src/python/nimbusml/timeseries/simplerollingwindow.py diff --git a/src/python/nimbusml.pyproj b/src/python/nimbusml.pyproj index 2deae4ab..24e1bcbc 100644 --- a/src/python/nimbusml.pyproj +++ b/src/python/nimbusml.pyproj @@ -332,8 +332,13 @@ + + + + + @@ -414,6 +419,7 @@ + @@ -422,6 +428,8 @@ + + @@ -476,6 +484,8 @@ + + @@ -541,6 +551,8 @@ + + @@ -747,8 +759,13 @@ + + + + + diff --git a/src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py b/src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py new file mode 100644 index 00000000..69bfde78 --- /dev/null +++ b/src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py @@ -0,0 +1,75 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. 
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+AnalyticalRollingWindow
+"""
+
+__all__ = ["AnalyticalRollingWindow"]
+
+
+from ...entrypoints.transforms_analyticalrollingwindow import \
+    transforms_analyticalrollingwindow
+from ...utils.utils import trace
+from ..base_pipeline_item import BasePipelineItem, DefaultSignature
+
+
+class AnalyticalRollingWindow(BasePipelineItem, DefaultSignature):
+    """
+    **Description**
+    Performs an analytical calculation over a rolling timeseries window
+
+    :param grain_columns: List of grain columns.
+
+    :param target_column: Target column.
+
+    :param horizon: Maximum horizon value.
+
+    :param max_window_size: Maximum window size.
+
+    :param min_window_size: Minimum window size.
+
+    :param window_calculation: What window calculation to use.
+
+    :param params: Additional arguments sent to compute engine.
+
+    """
+
+    @trace
+    def __init__(
+            self,
+            grain_columns,
+            target_column,
+            horizon=0,
+            max_window_size=0,
+            min_window_size=0,
+            window_calculation='0',
+            **params):
+        BasePipelineItem.__init__(
+            self, type='transform', **params)
+
+        self.grain_columns = grain_columns
+        self.target_column = target_column
+        self.horizon = horizon
+        self.max_window_size = max_window_size
+        self.min_window_size = min_window_size
+        self.window_calculation = window_calculation
+
+    @property
+    def _entrypoint(self):
+        return transforms_analyticalrollingwindow
+
+    @trace
+    def _get_node(self, **all_args):
+        algo_args = dict(
+            grain_columns=self.grain_columns,
+            target_column=self.target_column,
+            horizon=self.horizon,
+            max_window_size=self.max_window_size,
+            min_window_size=self.min_window_size,
+            window_calculation=self.window_calculation)
+
+        all_args.update(algo_args)
+        return self._entrypoint(**all_args)
diff --git a/src/python/nimbusml/internal/core/timeseries/forecastingpivot.py b/src/python/nimbusml/internal/core/timeseries/forecastingpivot.py
new file mode 100644
index 00000000..cf499392
--- /dev/null
+++ b/src/python/nimbusml/internal/core/timeseries/forecastingpivot.py
@@ -0,0 +1,50 @@
+# --------------------------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+ForecastingPivot
+"""
+
+__all__ = ["ForecastingPivot"]
+
+
+from ...entrypoints.transforms_forecastingpivot import \
+    transforms_forecastingpivot
+from ...utils.utils import trace
+from ..base_pipeline_item import BasePipelineItem, DefaultSignature
+
+
+class ForecastingPivot(BasePipelineItem, DefaultSignature):
+    """
+    **Description**
+    Pivots the input columns and drops any rows with N/A
+
+    :param columns_to_pivot: List of columns to pivot.
+
+    :param params: Additional arguments sent to compute engine.
+
+    """
+
+    @trace
+    def __init__(
+            self,
+            columns_to_pivot,
+            **params):
+        BasePipelineItem.__init__(
+            self, type='transform', **params)
+
+        self.columns_to_pivot = columns_to_pivot
+
+    @property
+    def _entrypoint(self):
+        return transforms_forecastingpivot
+
+    @trace
+    def _get_node(self, **all_args):
+        algo_args = dict(
+            columns_to_pivot=self.columns_to_pivot)
+
+        all_args.update(algo_args)
+        return self._entrypoint(**all_args)
diff --git a/src/python/nimbusml/internal/core/timeseries/lagleadoperator.py b/src/python/nimbusml/internal/core/timeseries/lagleadoperator.py
new file mode 100644
index 00000000..4dad5691
--- /dev/null
+++ b/src/python/nimbusml/internal/core/timeseries/lagleadoperator.py
@@ -0,0 +1,66 @@
+# --------------------------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+LagLeadOperator
+"""
+
+__all__ = ["LagLeadOperator"]
+
+
+from ...entrypoints.transforms_lagleadoperator import \
+    transforms_lagleadoperator
+from ...utils.utils import trace
+from ..base_pipeline_item import BasePipelineItem, DefaultSignature
+
+
+class LagLeadOperator(BasePipelineItem, DefaultSignature):
+    """
+    **Description**
+    Uses the offset list to create lags and leads
+
+    :param grain_columns: List of grain columns.
+
+    :param target_column: Target column.
+
+    :param horizon: Maximum horizon value.
+
+    :param offsets: Lag and Lead offset to use. A negative number is a lag,
+        positive is a lead.
+
+    :param params: Additional arguments sent to compute engine.
+
+    """
+
+    @trace
+    def __init__(
+            self,
+            grain_columns,
+            target_column,
+            offsets,
+            horizon=0,
+            **params):
+        BasePipelineItem.__init__(
+            self, type='transform', **params)
+
+        self.grain_columns = grain_columns
+        self.target_column = target_column
+        self.offsets = offsets
+        self.horizon = horizon
+
+    @property
+    def _entrypoint(self):
+        return transforms_lagleadoperator
+
+    @trace
+    def _get_node(self, **all_args):
+        algo_args = dict(
+            grain_columns=self.grain_columns,
+            target_column=self.target_column,
+            offsets=self.offsets,
+            horizon=self.horizon)
+
+        all_args.update(algo_args)
+        return self._entrypoint(**all_args)
diff --git a/src/python/nimbusml/internal/core/timeseries/shortdrop.py b/src/python/nimbusml/internal/core/timeseries/shortdrop.py
new file mode 100644
index 00000000..9e228495
--- /dev/null
+++ b/src/python/nimbusml/internal/core/timeseries/shortdrop.py
@@ -0,0 +1,70 @@
+# --------------------------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+ShortDrop
+"""
+
+__all__ = ["ShortDrop"]
+
+
+from ...entrypoints.transforms_shortdrop import transforms_shortdrop
+from ...utils.utils import trace
+from ..base_pipeline_item import BasePipelineItem, DefaultSignature
+
+
+class ShortDrop(BasePipelineItem, DefaultSignature):
+    """
+    **Description**
+    Drops rows if there aren't enough values per grain.
+
+    :param grain_columns: List of grain columns.
+
+    :param horizon: Maximum horizon value.
+
+    :param max_window_size: Maximum window size.
+ + :param cross_validations: Number of cross validations being performed. + + :param offsets: Lag and Lead offset to use. A negative number is a lag, + positive is a lead. + + :param params: Additional arguments sent to compute engine. + + """ + + @trace + def __init__( + self, + grain_columns, + offsets, + horizon=0, + max_window_size=0, + cross_validations=0, + **params): + BasePipelineItem.__init__( + self, type='transform', **params) + + self.grain_columns = grain_columns + self.offsets = offsets + self.horizon = horizon + self.max_window_size = max_window_size + self.cross_validations = cross_validations + + @property + def _entrypoint(self): + return transforms_shortdrop + + @trace + def _get_node(self, **all_args): + algo_args = dict( + grain_columns=self.grain_columns, + offsets=self.offsets, + horizon=self.horizon, + max_window_size=self.max_window_size, + cross_validations=self.cross_validations) + + all_args.update(algo_args) + return self._entrypoint(**all_args) diff --git a/src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py b/src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py new file mode 100644 index 00000000..7952887f --- /dev/null +++ b/src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py @@ -0,0 +1,75 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. +# -------------------------------------------------------------------------------------------- +# - Generated by tools/entrypoint_compiler.py: do not edit by hand +""" +SimpleRollingWindow +""" + +__all__ = ["SimpleRollingWindow"] + + +from ...entrypoints.transforms_simplerollingwindow import \ + transforms_simplerollingwindow +from ...utils.utils import trace +from ..base_pipeline_item import BasePipelineItem, DefaultSignature + + +class SimpleRollingWindow(BasePipelineItem, DefaultSignature): + """ + **Description** + Performs simple rolling window calculations. + + :param grain_columns: List of grain columns. + + :param target_column: Target column. + + :param horizon: Maximum horizon value. + + :param max_window_size: Maximum window size. + + :param min_window_size: Minimum window size. + + :param window_calculation: What window calculation to use. + + :param params: Additional arguments sent to compute engine. 
+ + """ + + @trace + def __init__( + self, + grain_columns, + target_column, + horizon=0, + max_window_size=0, + min_window_size=0, + window_calculation='0', + **params): + BasePipelineItem.__init__( + self, type='transform', **params) + + self.grain_columns = grain_columns + self.target_column = target_column + self.horizon = horizon + self.max_window_size = max_window_size + self.min_window_size = min_window_size + self.window_calculation = window_calculation + + @property + def _entrypoint(self): + return transforms_simplerollingwindow + + @trace + def _get_node(self, **all_args): + algo_args = dict( + grain_columns=self.grain_columns, + target_column=self.target_column, + horizon=self.horizon, + max_window_size=self.max_window_size, + min_window_size=self.min_window_size, + window_calculation=self.window_calculation) + + all_args.update(algo_args) + return self._entrypoint(**all_args) diff --git a/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py b/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py new file mode 100644 index 00000000..a5c34acb --- /dev/null +++ b/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py @@ -0,0 +1,26 @@ +# - Generated by tools/entrypoint_compiler.py: do not edit by hand +""" +ParquetPathParser +""" + + +from ..utils.entrypoints import Component + + +def parquet_path_parser( + **params): + """ + **Description** + Extract name/value pairs from Parquet formatted directory names. + Example path: Year=2018/Month=12/data1.parquet + + """ + + entrypoint_name = 'ParquetPathParser' + settings = {} + + component = Component( + name=entrypoint_name, + settings=settings, + kind='PartitionedPathParser') + return component diff --git a/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py b/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py new file mode 100644 index 00000000..3f63ac19 --- /dev/null +++ b/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py @@ -0,0 +1,71 @@ +# - Generated by tools/entrypoint_compiler.py: do not edit by hand +""" +SimplePathParser +""" + + +from ..utils.entrypoints import Component +from ..utils.utils import try_set + + +def simple_path_parser( + columns=None, + type='TX', + **params): + """ + **Description** + A simple parser that extracts directory names as column values. + Column names are defined as arguments. + + :param columns: Column definitions used to override the + Partitioned Path Parser. Expected with the format + name:type:numeric-source, for example, col=MyFeature:R4:1 + (settings). + :param type: Data type of each column. (settings). 
+    """
+
+    entrypoint_name = 'SimplePathParser'
+    settings = {}
+
+    if columns is not None:
+        settings['Columns'] = try_set(
+            obj=columns,
+            none_acceptable=True,
+            is_of_type=list,
+            is_column=True)
+    if type is not None:
+        settings['Type'] = try_set(
+            obj=type,
+            none_acceptable=True,
+            is_of_type=str,
+            values=[
+                'I1',
+                'U1',
+                'I2',
+                'U2',
+                'I4',
+                'U4',
+                'I8',
+                'U8',
+                'R4',
+                'Num',
+                'R8',
+                'TX',
+                'Text',
+                'TXT',
+                'BL',
+                'Bool',
+                'TimeSpan',
+                'TS',
+                'DT',
+                'DateTime',
+                'DZ',
+                'DateTimeZone',
+                'UG',
+                'U16'])
+
+    component = Component(
+        name=entrypoint_name,
+        settings=settings,
+        kind='PartitionedPathParser')
+    return component
diff --git a/src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py b/src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py
new file mode 100644
index 00000000..c1ca37f2
--- /dev/null
+++ b/src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py
@@ -0,0 +1,103 @@
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+Transforms.AnalyticalRollingWindow
+"""
+
+import numbers
+
+from ..utils.entrypoints import EntryPoint
+from ..utils.utils import try_set, unlist
+
+
+def transforms_analyticalrollingwindow(
+        grain_columns,
+        target_column,
+        data,
+        output_data=None,
+        model=None,
+        horizon=0,
+        max_window_size=0,
+        min_window_size=0,
+        window_calculation='0',
+        **params):
+    """
+    **Description**
+    Performs an analytical calculation over a rolling timeseries window
+
+    :param grain_columns: List of grain columns (inputs).
+    :param target_column: Target column (inputs).
+    :param data: Input dataset (inputs).
+    :param horizon: Maximum horizon value (inputs).
+    :param max_window_size: Maximum window size (inputs).
+    :param min_window_size: Minimum window size (inputs).
+    :param window_calculation: What window calculation to use
+        (inputs).
+    :param output_data: Transformed dataset (outputs).
+    :param model: Transform model (outputs).
+    """
+
+    entrypoint_name = 'Transforms.AnalyticalRollingWindow'
+    inputs = {}
+    outputs = {}
+
+    if grain_columns is not None:
+        inputs['GrainColumns'] = try_set(
+            obj=grain_columns,
+            none_acceptable=False,
+            is_of_type=list,
+            is_column=True)
+    if target_column is not None:
+        inputs['TargetColumn'] = try_set(
+            obj=target_column,
+            none_acceptable=False,
+            is_of_type=str,
+            is_column=True)
+    if data is not None:
+        inputs['Data'] = try_set(
+            obj=data,
+            none_acceptable=False,
+            is_of_type=str)
+    if horizon is not None:
+        inputs['Horizon'] = try_set(
+            obj=horizon,
+            none_acceptable=False,
+            is_of_type=numbers.Real)
+    if max_window_size is not None:
+        inputs['MaxWindowSize'] = try_set(
+            obj=max_window_size,
+            none_acceptable=False,
+            is_of_type=numbers.Real)
+    if min_window_size is not None:
+        inputs['MinWindowSize'] = try_set(
+            obj=min_window_size,
+            none_acceptable=False,
+            is_of_type=numbers.Real)
+    if window_calculation is not None:
+        inputs['WindowCalculation'] = try_set(
+            obj=window_calculation,
+            none_acceptable=False,
+            is_of_type=str,
+            values=['Mean'])
+    if output_data is not None:
+        outputs['OutputData'] = try_set(
+            obj=output_data,
+            none_acceptable=False,
+            is_of_type=str)
+    if model is not None:
+        outputs['Model'] = try_set(
+            obj=model,
+            none_acceptable=False,
+            is_of_type=str)
+
+    input_variables = {
+        x for x in unlist(inputs.values())
+        if isinstance(x, str) and x.startswith("$")}
+    output_variables = {
+        x for x in unlist(outputs.values())
+        if isinstance(x, str) and x.startswith("$")}
+
+    entrypoint = EntryPoint(
+        name=entrypoint_name, inputs=inputs, outputs=outputs,
+        input_variables=input_variables,
+        output_variables=output_variables)
+    return entrypoint
diff --git a/src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py b/src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py
new file mode 100644
index 00000000..ebf94c23
--- /dev/null
+++ b/src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py
@@ -0,0 +1,64 @@
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+Transforms.ForecastingPivot
+"""
+
+
+from ..utils.entrypoints import EntryPoint
+from ..utils.utils import try_set, unlist
+
+
+def transforms_forecastingpivot(
+        columns_to_pivot,
+        data,
+        output_data=None,
+        model=None,
+        **params):
+    """
+    **Description**
+    Pivots the input columns and drops any rows with N/A
+
+    :param columns_to_pivot: List of columns to pivot (inputs).
+    :param data: Input dataset (inputs).
+    :param output_data: Transformed dataset (outputs).
+    :param model: Transform model (outputs).
+    """
+
+    entrypoint_name = 'Transforms.ForecastingPivot'
+    inputs = {}
+    outputs = {}
+
+    if columns_to_pivot is not None:
+        inputs['ColumnsToPivot'] = try_set(
+            obj=columns_to_pivot,
+            none_acceptable=False,
+            is_of_type=list,
+            is_column=True)
+    if data is not None:
+        inputs['Data'] = try_set(
+            obj=data,
+            none_acceptable=False,
+            is_of_type=str)
+    if output_data is not None:
+        outputs['OutputData'] = try_set(
+            obj=output_data,
+            none_acceptable=False,
+            is_of_type=str)
+    if model is not None:
+        outputs['Model'] = try_set(
+            obj=model,
+            none_acceptable=False,
+            is_of_type=str)
+
+    input_variables = {
+        x for x in unlist(inputs.values())
+        if isinstance(x, str) and x.startswith("$")}
+    output_variables = {
+        x for x in unlist(outputs.values())
+        if isinstance(x, str) and x.startswith("$")}
+
+    entrypoint = EntryPoint(
+        name=entrypoint_name, inputs=inputs, outputs=outputs,
+        input_variables=input_variables,
+        output_variables=output_variables)
+    return entrypoint
diff --git a/src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py b/src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py
new file mode 100644
index 00000000..e840bd66
--- /dev/null
+++ b/src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py
@@ -0,0 +1,88 @@
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+Transforms.LagLeadOperator
+"""
+
+import numbers
+
+from ..utils.entrypoints import EntryPoint
+from ..utils.utils import try_set, unlist
+
+
+def transforms_lagleadoperator(
+        grain_columns,
+        target_column,
+        data,
+        offsets,
+        output_data=None,
+        model=None,
+        horizon=0,
+        **params):
+    """
+    **Description**
+    Uses the offset list to create lags and leads
+
+    :param grain_columns: List of grain columns (inputs).
+    :param target_column: Target column (inputs).
+    :param data: Input dataset (inputs).
+    :param horizon: Maximum horizon value (inputs).
+    :param offsets: Lag and Lead offset to use. A negative number is
+        a lag, positive is a lead (inputs).
+    :param output_data: Transformed dataset (outputs).
+    :param model: Transform model (outputs).
+ """ + + entrypoint_name = 'Transforms.LagLeadOperator' + inputs = {} + outputs = {} + + if grain_columns is not None: + inputs['GrainColumns'] = try_set( + obj=grain_columns, + none_acceptable=False, + is_of_type=list, + is_column=True) + if target_column is not None: + inputs['TargetColumn'] = try_set( + obj=target_column, + none_acceptable=False, + is_of_type=str, + is_column=True) + if data is not None: + inputs['Data'] = try_set( + obj=data, + none_acceptable=False, + is_of_type=str) + if horizon is not None: + inputs['Horizon'] = try_set( + obj=horizon, + none_acceptable=False, + is_of_type=numbers.Real) + if offsets is not None: + inputs['offsets'] = try_set( + obj=offsets, + none_acceptable=False, + is_of_type=list) + if output_data is not None: + outputs['OutputData'] = try_set( + obj=output_data, + none_acceptable=False, + is_of_type=str) + if model is not None: + outputs['Model'] = try_set( + obj=model, + none_acceptable=False, + is_of_type=str) + + input_variables = { + x for x in unlist(inputs.values()) + if isinstance(x, str) and x.startswith("$")} + output_variables = { + x for x in unlist(outputs.values()) + if isinstance(x, str) and x.startswith("$")} + + entrypoint = EntryPoint( + name=entrypoint_name, inputs=inputs, outputs=outputs, + input_variables=input_variables, + output_variables=output_variables) + return entrypoint diff --git a/src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py b/src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py new file mode 100644 index 00000000..bae78343 --- /dev/null +++ b/src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py @@ -0,0 +1,95 @@ +# - Generated by tools/entrypoint_compiler.py: do not edit by hand +""" +Transforms.ShortDrop +""" + +import numbers + +from ..utils.entrypoints import EntryPoint +from ..utils.utils import try_set, unlist + + +def transforms_shortdrop( + grain_columns, + data, + offsets, + output_data=None, + model=None, + horizon=0, + max_window_size=0, + cross_validations=0, + **params): + """ + **Description** + Drops rows if there aren't enough values per grain. + + :param grain_columns: List of grain columns (inputs). + :param horizon: Maximum horizon value (inputs). + :param data: Input dataset (inputs). + :param max_window_size: Maximum window size (inputs). + :param cross_validations: Number of cross validations being + performed. (inputs). + :param offsets: Lag and Lead offset to use. A negative number is + a lag, positive is a lead (inputs). + :param output_data: Transformed dataset (outputs). + :param model: Transform model (outputs). 
+ """ + + entrypoint_name = 'Transforms.ShortDrop' + inputs = {} + outputs = {} + + if grain_columns is not None: + inputs['GrainColumns'] = try_set( + obj=grain_columns, + none_acceptable=False, + is_of_type=list, + is_column=True) + if horizon is not None: + inputs['Horizon'] = try_set( + obj=horizon, + none_acceptable=False, + is_of_type=numbers.Real) + if data is not None: + inputs['Data'] = try_set( + obj=data, + none_acceptable=False, + is_of_type=str) + if max_window_size is not None: + inputs['MaxWindowSize'] = try_set( + obj=max_window_size, + none_acceptable=False, + is_of_type=numbers.Real) + if cross_validations is not None: + inputs['CrossValidations'] = try_set( + obj=cross_validations, + none_acceptable=True, + is_of_type=numbers.Real) + if offsets is not None: + inputs['offsets'] = try_set( + obj=offsets, + none_acceptable=False, + is_of_type=list) + if output_data is not None: + outputs['OutputData'] = try_set( + obj=output_data, + none_acceptable=False, + is_of_type=str) + if model is not None: + outputs['Model'] = try_set( + obj=model, + none_acceptable=False, + is_of_type=str) + + input_variables = { + x for x in unlist(inputs.values()) + if isinstance(x, str) and x.startswith("$")} + output_variables = { + x for x in unlist(outputs.values()) + if isinstance(x, str) and x.startswith("$")} + + entrypoint = EntryPoint( + name=entrypoint_name, inputs=inputs, outputs=outputs, + input_variables=input_variables, + output_variables=output_variables) + return entrypoint diff --git a/src/python/nimbusml/internal/entrypoints/transforms_simplerollingwindow.py b/src/python/nimbusml/internal/entrypoints/transforms_simplerollingwindow.py new file mode 100644 index 00000000..36f8eb43 --- /dev/null +++ b/src/python/nimbusml/internal/entrypoints/transforms_simplerollingwindow.py @@ -0,0 +1,105 @@ +# - Generated by tools/entrypoint_compiler.py: do not edit by hand +""" +Transforms.SimpleRollingWindow +""" + +import numbers + +from ..utils.entrypoints import EntryPoint +from ..utils.utils import try_set, unlist + + +def transforms_simplerollingwindow( + grain_columns, + target_column, + data, + output_data=None, + model=None, + horizon=0, + max_window_size=0, + min_window_size=0, + window_calculation='0', + **params): + """ + **Description** + Performs simple rolling window calculations. + + :param grain_columns: List of grain columns (inputs). + :param target_column: Target column (inputs). + :param data: Input dataset (inputs). + :param horizon: Maximum horizon value (inputs). + :param max_window_size: Maximum window size (inputs). + :param min_window_size: Minimum window size (inputs). + :param window_calculation: What window calculation to use + (inputs). + :param output_data: Transformed dataset (outputs). + :param model: Transform model (outputs). 
+    """
+
+    entrypoint_name = 'Transforms.SimpleRollingWindow'
+    inputs = {}
+    outputs = {}
+
+    if grain_columns is not None:
+        inputs['GrainColumns'] = try_set(
+            obj=grain_columns,
+            none_acceptable=False,
+            is_of_type=list,
+            is_column=True)
+    if target_column is not None:
+        inputs['TargetColumn'] = try_set(
+            obj=target_column,
+            none_acceptable=False,
+            is_of_type=str,
+            is_column=True)
+    if data is not None:
+        inputs['Data'] = try_set(
+            obj=data,
+            none_acceptable=False,
+            is_of_type=str)
+    if horizon is not None:
+        inputs['Horizon'] = try_set(
+            obj=horizon,
+            none_acceptable=False,
+            is_of_type=numbers.Real)
+    if max_window_size is not None:
+        inputs['MaxWindowSize'] = try_set(
+            obj=max_window_size,
+            none_acceptable=False,
+            is_of_type=numbers.Real)
+    if min_window_size is not None:
+        inputs['MinWindowSize'] = try_set(
+            obj=min_window_size,
+            none_acceptable=False,
+            is_of_type=numbers.Real)
+    if window_calculation is not None:
+        inputs['WindowCalculation'] = try_set(
+            obj=window_calculation,
+            none_acceptable=False,
+            is_of_type=str,
+            values=[
+                'Min',
+                'Max'])
+    if output_data is not None:
+        outputs['OutputData'] = try_set(
+            obj=output_data,
+            none_acceptable=False,
+            is_of_type=str)
+    if model is not None:
+        outputs['Model'] = try_set(
+            obj=model,
+            none_acceptable=False,
+            is_of_type=str)
+
+    input_variables = {
+        x for x in unlist(inputs.values())
+        if isinstance(x, str) and x.startswith("$")}
+    output_variables = {
+        x for x in unlist(outputs.values())
+        if isinstance(x, str) and x.startswith("$")}
+
+    entrypoint = EntryPoint(
+        name=entrypoint_name, inputs=inputs, outputs=outputs,
+        input_variables=input_variables,
+        output_variables=output_variables)
+    return entrypoint
diff --git a/src/python/nimbusml/timeseries/analyticalrollingwindow.py b/src/python/nimbusml/timeseries/analyticalrollingwindow.py
new file mode 100644
index 00000000..8cdc00d0
--- /dev/null
+++ b/src/python/nimbusml/timeseries/analyticalrollingwindow.py
@@ -0,0 +1,77 @@
+# --------------------------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+AnalyticalRollingWindow
+"""
+
+__all__ = ["AnalyticalRollingWindow"]
+
+
+from sklearn.base import TransformerMixin
+
+from ..base_transform import BaseTransform
+from ..internal.core.timeseries.analyticalrollingwindow import \
+    AnalyticalRollingWindow as core
+from ..internal.utils.utils import trace
+
+
+class AnalyticalRollingWindow(
+        core,
+        BaseTransform,
+        TransformerMixin):
+    """
+    **Description**
+    Performs an analytical calculation over a rolling timeseries window
+
+    :param columns: see `Columns `_.
+
+    :param grain_columns: List of grain columns.
+
+    :param target_column: Target column.
+
+    :param horizon: Maximum horizon value.
+
+    :param max_window_size: Maximum window size.
+
+    :param min_window_size: Minimum window size.
+
+    :param window_calculation: What window calculation to use.
+
+    :param params: Additional arguments sent to compute engine.
+
+    """
+
+    @trace
+    def __init__(
+            self,
+            grain_columns,
+            target_column,
+            horizon=0,
+            max_window_size=0,
+            min_window_size=0,
+            window_calculation='0',
+            columns=None,
+            **params):
+
+        if columns:
+            params['columns'] = columns
+        BaseTransform.__init__(self, **params)
+        core.__init__(
+            self,
+            grain_columns=grain_columns,
+            target_column=target_column,
+            horizon=horizon,
+            max_window_size=max_window_size,
+            min_window_size=min_window_size,
+            window_calculation=window_calculation,
+            **params)
+        self._columns = columns
+
+    def get_params(self, deep=False):
+        """
+        Get the parameters for this operator.
+        """
+        return core.get_params(self)
diff --git a/src/python/nimbusml/timeseries/forecastingpivot.py b/src/python/nimbusml/timeseries/forecastingpivot.py
new file mode 100644
index 00000000..bb58b553
--- /dev/null
+++ b/src/python/nimbusml/timeseries/forecastingpivot.py
@@ -0,0 +1,54 @@
+# --------------------------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+ForecastingPivot
+"""
+
+__all__ = ["ForecastingPivot"]
+
+
+from sklearn.base import TransformerMixin
+
+from ..base_transform import BaseTransform
+from ..internal.core.timeseries.forecastingpivot import \
+    ForecastingPivot as core
+from ..internal.utils.utils import trace
+
+
+class ForecastingPivot(core, BaseTransform, TransformerMixin):
+    """
+    **Description**
+    Pivots the input columns and drops any rows with N/A
+
+    :param columns: see `Columns `_.
+
+    :param columns_to_pivot: List of columns to pivot.
+
+    :param params: Additional arguments sent to compute engine.
+
+    """
+
+    @trace
+    def __init__(
+            self,
+            columns_to_pivot,
+            columns=None,
+            **params):
+
+        if columns:
+            params['columns'] = columns
+        BaseTransform.__init__(self, **params)
+        core.__init__(
+            self,
+            columns_to_pivot=columns_to_pivot,
+            **params)
+        self._columns = columns
+
+    def get_params(self, deep=False):
+        """
+        Get the parameters for this operator.
+        """
+        return core.get_params(self)
diff --git a/src/python/nimbusml/timeseries/lagleadoperator.py b/src/python/nimbusml/timeseries/lagleadoperator.py
new file mode 100644
index 00000000..373d4334
--- /dev/null
+++ b/src/python/nimbusml/timeseries/lagleadoperator.py
@@ -0,0 +1,66 @@
+# --------------------------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+LagLeadOperator
+"""
+
+__all__ = ["LagLeadOperator"]
+
+
+from sklearn.base import TransformerMixin
+
+from ..base_transform import BaseTransform
+from ..internal.core.timeseries.lagleadoperator import LagLeadOperator as core
+from ..internal.utils.utils import trace
+
+
+class LagLeadOperator(core, BaseTransform, TransformerMixin):
+    """
+    **Description**
+    Uses the offset list to create lags and leads
+
+    :param columns: see `Columns `_.
+
+    :param grain_columns: List of grain columns.
+
+    :param target_column: Target column.
+
+    :param horizon: Maximum horizon value.
+
+    :param offsets: Lag and Lead offset to use. A negative number is a lag,
+        positive is a lead.
+ + :param params: Additional arguments sent to compute engine. + + """ + + @trace + def __init__( + self, + grain_columns, + target_column, + offsets, + horizon=0, + columns=None, + **params): + + if columns: + params['columns'] = columns + BaseTransform.__init__(self, **params) + core.__init__( + self, + grain_columns=grain_columns, + target_column=target_column, + offsets=offsets, + horizon=horizon, + **params) + self._columns = columns + + def get_params(self, deep=False): + """ + Get the parameters for this operator. + """ + return core.get_params(self) diff --git a/src/python/nimbusml/timeseries/shortdrop.py b/src/python/nimbusml/timeseries/shortdrop.py new file mode 100644 index 00000000..0e5e8a7e --- /dev/null +++ b/src/python/nimbusml/timeseries/shortdrop.py @@ -0,0 +1,70 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. +# -------------------------------------------------------------------------------------------- +# - Generated by tools/entrypoint_compiler.py: do not edit by hand +""" +ShortDrop +""" + +__all__ = ["ShortDrop"] + + +from sklearn.base import TransformerMixin + +from ..base_transform import BaseTransform +from ..internal.core.timeseries.shortdrop import ShortDrop as core +from ..internal.utils.utils import trace + + +class ShortDrop(core, BaseTransform, TransformerMixin): + """ + **Description** + Drops rows if there aren't enough values per grain. + + :param columns: see `Columns `_. + + :param grain_columns: List of grain columns. + + :param horizon: Maximum horizon value. + + :param max_window_size: Maximum window size. + + :param cross_validations: Number of cross validations being performed. + + :param offsets: Lag and Lead offset to use. A negative number is a lag, + positive is a lead. + + :param params: Additional arguments sent to compute engine. + + """ + + @trace + def __init__( + self, + grain_columns, + offsets, + horizon=0, + max_window_size=0, + cross_validations=0, + columns=None, + **params): + + if columns: + params['columns'] = columns + BaseTransform.__init__(self, **params) + core.__init__( + self, + grain_columns=grain_columns, + offsets=offsets, + horizon=horizon, + max_window_size=max_window_size, + cross_validations=cross_validations, + **params) + self._columns = columns + + def get_params(self, deep=False): + """ + Get the parameters for this operator. + """ + return core.get_params(self) diff --git a/src/python/nimbusml/timeseries/simplerollingwindow.py b/src/python/nimbusml/timeseries/simplerollingwindow.py new file mode 100644 index 00000000..b3d506fb --- /dev/null +++ b/src/python/nimbusml/timeseries/simplerollingwindow.py @@ -0,0 +1,74 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. 
+# --------------------------------------------------------------------------------------------
+# - Generated by tools/entrypoint_compiler.py: do not edit by hand
+"""
+SimpleRollingWindow
+"""
+
+__all__ = ["SimpleRollingWindow"]
+
+
+from sklearn.base import TransformerMixin
+
+from ..base_transform import BaseTransform
+from ..internal.core.timeseries.simplerollingwindow import \
+    SimpleRollingWindow as core
+from ..internal.utils.utils import trace
+
+
+class SimpleRollingWindow(core, BaseTransform, TransformerMixin):
+    """
+    **Description**
+    Performs simple rolling window calculations.
+
+    :param columns: see `Columns `_.
+
+    :param grain_columns: List of grain columns.
+
+    :param target_column: Target column.
+
+    :param horizon: Maximum horizon value.
+
+    :param max_window_size: Maximum window size.
+
+    :param min_window_size: Minimum window size.
+
+    :param window_calculation: What window calculation to use.
+
+    :param params: Additional arguments sent to compute engine.
+
+    """
+
+    @trace
+    def __init__(
+            self,
+            grain_columns,
+            target_column,
+            horizon=0,
+            max_window_size=0,
+            min_window_size=0,
+            window_calculation='0',
+            columns=None,
+            **params):
+
+        if columns:
+            params['columns'] = columns
+        BaseTransform.__init__(self, **params)
+        core.__init__(
+            self,
+            grain_columns=grain_columns,
+            target_column=target_column,
+            horizon=horizon,
+            max_window_size=max_window_size,
+            min_window_size=min_window_size,
+            window_calculation=window_calculation,
+            **params)
+        self._columns = columns
+
+    def get_params(self, deep=False):
+        """
+        Get the parameters for this operator.
+        """
+        return core.get_params(self)
diff --git a/src/python/tools/manifest.json b/src/python/tools/manifest.json
index fd7f7950..615c2303 100644
--- a/src/python/tools/manifest.json
+++ b/src/python/tools/manifest.json
@@ -17084,6 +17084,118 @@
       "ITrainerOutput"
     ]
   },
+  {
+    "Name": "Transforms.AnalyticalRollingWindow",
+    "Desc": "Performs an analytical calculation over a rolling timeseries window",
+    "FriendlyName": "AnalyticalRollingWindowTransformer",
+    "ShortName": "AnalyticalRollingWindowTransformer",
+    "Inputs": [
+      {
+        "Name": "GrainColumns",
+        "Type": {
+          "Kind": "Array",
+          "ItemType": "String"
+        },
+        "Desc": "List of grain columns",
+        "Aliases": [
+          "grains"
+        ],
+        "Required": true,
+        "SortOrder": 0.0,
+        "IsNullable": false
+      },
+      {
+        "Name": "TargetColumn",
+        "Type": "String",
+        "Desc": "Target column",
+        "Aliases": [
+          "target"
+        ],
+        "Required": true,
+        "SortOrder": 1.0,
+        "IsNullable": false
+      },
+      {
+        "Name": "Data",
+        "Type": "DataView",
+        "Desc": "Input dataset",
+        "Required": true,
+        "SortOrder": 1.0,
+        "IsNullable": false
+      },
+      {
+        "Name": "Horizon",
+        "Type": "UInt",
+        "Desc": "Maximum horizon value",
+        "Aliases": [
+          "hor"
+        ],
+        "Required": true,
+        "SortOrder": 2.0,
+        "IsNullable": false,
+        "Default": 0
+      },
+      {
+        "Name": "MaxWindowSize",
+        "Type": "UInt",
+        "Desc": "Maximum window size",
+        "Aliases": [
+          "maxsize"
+        ],
+        "Required": true,
+        "SortOrder": 3.0,
+        "IsNullable": false,
+        "Default": 0
+      },
+      {
+        "Name": "MinWindowSize",
+        "Type": "UInt",
+        "Desc": "Minimum window size",
+        "Aliases": [
+          "minsize"
+        ],
+        "Required": true,
+        "SortOrder": 4.0,
+        "IsNullable": false,
+        "Default": 0
+      },
+      {
+        "Name": "WindowCalculation",
+        "Type": {
+          "Kind": "Enum",
+          "Values": [
+            "Mean"
+          ]
+        },
+        "Desc": "What window calculation to use",
+        "Aliases": [
+          "calc"
+        ],
+        "Required": true,
+        "SortOrder": 5.0,
+        "IsNullable": false,
+        "Default": "0"
+      }
+    ],
+    "Outputs": [
+      {
+        "Name": "OutputData",
+        "Type": "DataView",
+        "Desc": "Transformed dataset"
+      },
+      {
+        "Name": "Model",
+        "Type": "TransformModel",
+        "Desc": "Transform model"
+      }
+    ],
+    "InputKind": [
+      "ITransformInput"
+    ],
+    "OutputKind": [
+      "ITransformOutput"
+    ]
+  },
   {
     "Name": "Transforms.ApproximateBootstrapSampler",
     "Desc": "Approximate bootstrap sampling.",
@@ -18595,7 +18707,7 @@
     ]
   },
   {
-    "Name": "Transforms.DatasetScorerEx", 
+    "Name": "Transforms.DatasetScorerEx",
     "Desc": "Score a dataset with a predictor model",
     "FriendlyName": null,
     "ShortName": null,
@@ -18640,7 +18752,7 @@
     ]
   },
   {
-    "Name": "Transforms.DatasetTransformScorer", 
+    "Name": "Transforms.DatasetTransformScorer",
    "Desc": "Score a dataset with a transform model",
    "FriendlyName": null,
    "ShortName": null,
@@ -19237,6 +19349,54 @@
       "ITransformOutput"
     ]
   },
+  {
+    "Name": "Transforms.ForecastingPivot",
+    "Desc": "Pivots the input columns and drops any rows with N/A",
+    "FriendlyName": "ForecastingPivot",
+    "ShortName": "fpivot",
+    "Inputs": [
+      {
+        "Name": "ColumnsToPivot",
+        "Type": {
+          "Kind": "Array",
+          "ItemType": "String"
+        },
+        "Desc": "List of columns to pivot",
+        "Aliases": [
+          "cols"
+        ],
+        "Required": true,
+        "SortOrder": 0.0,
+        "IsNullable": false
+      },
+      {
+        "Name": "Data",
+        "Type": "DataView",
+        "Desc": "Input dataset",
+        "Required": true,
+        "SortOrder": 1.0,
+        "IsNullable": false
+      }
+    ],
+    "Outputs": [
+      {
+        "Name": "OutputData",
+        "Type": "DataView",
+        "Desc": "Transformed dataset"
+      },
+      {
+        "Name": "Model",
+        "Type": "TransformModel",
+        "Desc": "Transform model"
+      }
+    ],
+    "InputKind": [
+      "ITransformInput"
+    ],
+    "OutputKind": [
+      "ITransformOutput"
+    ]
+  },
   {
     "Name": "Transforms.GlobalContrastNormalizer",
     "Desc": "Performs a global contrast normalization on input values: Y = (s * X - M) / D, where s is a scale, M is mean and D is either L2 norm or standard deviation.",
@@ -20466,6 +20626,91 @@
       "ITransformOutput"
     ]
   },
+  {
+    "Name": "Transforms.LagLeadOperator",
+    "Desc": "Uses the offset list to create lags and leads",
+    "FriendlyName": "LagLeadOperatorTransformer",
+    "ShortName": "LagLeadOperatorTransformer",
+    "Inputs": [
+      {
+        "Name": "GrainColumns",
+        "Type": {
+          "Kind": "Array",
+          "ItemType": "String"
+        },
+        "Desc": "List of grain columns",
+        "Aliases": [
+          "grains"
+        ],
+        "Required": true,
+        "SortOrder": 0.0,
+        "IsNullable": false
+      },
+      {
+        "Name": "TargetColumn",
+        "Type": "String",
+        "Desc": "Target column",
+        "Aliases": [
+          "target"
+        ],
+        "Required": true,
+        "SortOrder": 1.0,
+        "IsNullable": false
+      },
+      {
+        "Name": "Data",
+        "Type": "DataView",
+        "Desc": "Input dataset",
+        "Required": true,
+        "SortOrder": 1.0,
+        "IsNullable": false
+      },
+      {
+        "Name": "Horizon",
+        "Type": "UInt",
+        "Desc": "Maximum horizon value",
+        "Aliases": [
+          "hor"
+        ],
+        "Required": true,
+        "SortOrder": 2.0,
+        "IsNullable": false,
+        "Default": 0
+      },
+      {
+        "Name": "offsets",
+        "Type": {
+          "Kind": "Array",
+          "ItemType": "Int"
+        },
+        "Desc": "Lag and Lead offset to use.
A negative number is a lag, positive is a lead", + "Aliases": [ + "off" + ], + "Required": true, + "SortOrder": 3.0, + "IsNullable": false + } + ], + "Outputs": [ + { + "Name": "OutputData", + "Type": "DataView", + "Desc": "Transformed dataset" + }, + { + "Name": "Model", + "Type": "TransformModel", + "Desc": "Transform model" + } + ], + "InputKind": [ + "ITransformInput" + ], + "OutputKind": [ + "ITransformOutput" + ] + }, { "Name": "Transforms.LightLda", "Desc": "The LDA transform implements LightLDA, a state-of-the-art implementation of Latent Dirichlet Allocation.", @@ -23279,6 +23524,217 @@ "ITransformOutput" ] }, + { + "Name": "Transforms.ShortDrop", + "Desc": "Drops rows if there aren't enough values per grain.", + "FriendlyName": "ShortDrop", + "ShortName": "sgd", + "Inputs": [ + { + "Name": "GrainColumns", + "Type": { + "Kind": "Array", + "ItemType": "String" + }, + "Desc": "List of grain columns", + "Aliases": [ + "grains" + ], + "Required": true, + "SortOrder": 0.0, + "IsNullable": false + }, + { + "Name": "Horizon", + "Type": "UInt", + "Desc": "Maximum horizon value", + "Aliases": [ + "hor" + ], + "Required": true, + "SortOrder": 1.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "Data", + "Type": "DataView", + "Desc": "Input dataset", + "Required": true, + "SortOrder": 1.0, + "IsNullable": false + }, + { + "Name": "MaxWindowSize", + "Type": "UInt", + "Desc": "Maximum window size", + "Aliases": [ + "maxsize" + ], + "Required": true, + "SortOrder": 2.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "CrossValidations", + "Type": "UInt", + "Desc": "Number of cross validations being performed.", + "Aliases": [ + "crossv" + ], + "Required": false, + "SortOrder": 2.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "offsets", + "Type": { + "Kind": "Array", + "ItemType": "Int" + }, + "Desc": "Lag and Lead offset to use. 
A negative number is a lag, positive is a lead", + "Aliases": [ + "off" + ], + "Required": true, + "SortOrder": 3.0, + "IsNullable": false + } + ], + "Outputs": [ + { + "Name": "OutputData", + "Type": "DataView", + "Desc": "Transformed dataset" + }, + { + "Name": "Model", + "Type": "TransformModel", + "Desc": "Transform model" + } + ], + "InputKind": [ + "ITransformInput" + ], + "OutputKind": [ + "ITransformOutput" + ] + }, + { + "Name": "Transforms.SimpleRollingWindow", + "Desc": "Performs simple rolling window calculations.", + "FriendlyName": "SimpleRollingWindowTransformer", + "ShortName": "SimpleRollingWindowTransformer", + "Inputs": [ + { + "Name": "GrainColumns", + "Type": { + "Kind": "Array", + "ItemType": "String" + }, + "Desc": "List of grain columns", + "Aliases": [ + "grains" + ], + "Required": true, + "SortOrder": 0.0, + "IsNullable": false + }, + { + "Name": "TargetColumn", + "Type": "String", + "Desc": "Target column", + "Aliases": [ + "target" + ], + "Required": true, + "SortOrder": 1.0, + "IsNullable": false + }, + { + "Name": "Data", + "Type": "DataView", + "Desc": "Input dataset", + "Required": true, + "SortOrder": 1.0, + "IsNullable": false + }, + { + "Name": "Horizon", + "Type": "UInt", + "Desc": "Maximum horizon value", + "Aliases": [ + "hor" + ], + "Required": true, + "SortOrder": 2.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "MaxWindowSize", + "Type": "UInt", + "Desc": "Maximum window size", + "Aliases": [ + "maxsize" + ], + "Required": true, + "SortOrder": 3.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "MinWindowSize", + "Type": "UInt", + "Desc": "Minimum window size", + "Aliases": [ + "minsize" + ], + "Required": true, + "SortOrder": 4.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "WindowCalculation", + "Type": { + "Kind": "Enum", + "Values": [ + "Min", + "Max" + ] + }, + "Desc": "What window calculation to use", + "Aliases": [ + "calc" + ], + "Required": true, + "SortOrder": 5.0, + "IsNullable": false, + "Default": "0" + } + ], + "Outputs": [ + { + "Name": "OutputData", + "Type": "DataView", + "Desc": "Transformed dataset" + }, + { + "Name": "Model", + "Type": "TransformModel", + "Desc": "Transform model" + } + ], + "InputKind": [ + "ITransformInput" + ], + "OutputKind": [ + "ITransformOutput" + ] + }, { "Name": "Transforms.TensorFlowScorer", "Desc": "Transforms the data using the TensorFlow model.", @@ -30126,6 +30582,140 @@ } ] }, + { + "Kind": "PartitionedPathParser", + "Components": [ + { + "Name": "ParquetPathParser", + "Desc": "Extract name/value pairs from Parquet formatted directory names. Example path: Year=2018/Month=12/data1.parquet", + "FriendlyName": "Parquet Partitioned Path Parser", + "Aliases": [ + "ParqPP" + ], + "Settings": [] + }, + { + "Name": "SimplePathParser", + "Desc": "A simple parser that extracts directory names as column values. 
Column names are defined as arguments.", + "FriendlyName": "Simple Partitioned Path Parser", + "Aliases": [ + "SmplPP" + ], + "Settings": [ + { + "Name": "Columns", + "Type": { + "Kind": "Array", + "ItemType": { + "Kind": "Struct", + "Fields": [ + { + "Name": "Name", + "Type": "String", + "Desc": "Name of the column.", + "Required": true, + "SortOrder": 150.0, + "IsNullable": false + }, + { + "Name": "Type", + "Type": { + "Kind": "Enum", + "Values": [ + "I1", + "U1", + "I2", + "U2", + "I4", + "U4", + "I8", + "U8", + "R4", + "Num", + "R8", + "TX", + "Text", + "TXT", + "BL", + "Bool", + "TimeSpan", + "TS", + "DT", + "DateTime", + "DZ", + "DateTimeZone", + "UG", + "U16" + ] + }, + "Desc": "Data type of the column.", + "Required": false, + "SortOrder": 150.0, + "IsNullable": true, + "Default": null + }, + { + "Name": "Source", + "Type": "Int", + "Desc": "Index of the directory representing this column.", + "Required": true, + "SortOrder": 150.0, + "IsNullable": false, + "Default": 0 + } + ] + } + }, + "Desc": "Column definitions used to override the Partitioned Path Parser. Expected with the format name:type:numeric-source, for example, col=MyFeature:R4:1", + "Aliases": [ + "col" + ], + "Required": false, + "SortOrder": 1.0, + "IsNullable": false, + "Default": null + }, + { + "Name": "Type", + "Type": { + "Kind": "Enum", + "Values": [ + "I1", + "U1", + "I2", + "U2", + "I4", + "U4", + "I8", + "U8", + "R4", + "Num", + "R8", + "TX", + "Text", + "TXT", + "BL", + "Bool", + "TimeSpan", + "TS", + "DT", + "DateTime", + "DZ", + "DateTimeZone", + "UG", + "U16" + ] + }, + "Desc": "Data type of each column.", + "Required": false, + "SortOrder": 150.0, + "IsNullable": false, + "Default": "TX" + } + ] + } + ] + }, { "Kind": "RegressionLossFunction", "Components": [ diff --git a/src/python/tools/manifest_diff.json b/src/python/tools/manifest_diff.json index a70489ee..3b38fb2d 100644 --- a/src/python/tools/manifest_diff.json +++ b/src/python/tools/manifest_diff.json @@ -226,6 +226,36 @@ "XGBoost.TrainRegression" ], "EntryPoints": [ + { + "Name": "Transforms.SimpleRollingWindow", + "NewName": "SimpleRollingWindow", + "Module": "timeseries", + "Type": "Transform" + }, + { + "Name": "Transforms.AnalyticalRollingWindow", + "NewName": "AnalyticalRollingWindow", + "Module": "timeseries", + "Type": "Transform" + }, + { + "Name": "Transforms.LagLeadOperator", + "NewName": "LagLeadOperator", + "Module": "timeseries", + "Type": "Transform" + }, + { + "Name": "Transforms.ShortDrop", + "NewName": "ShortDrop", + "Module": "timeseries", + "Type": "Transform" + }, + { + "Name": "Transforms.ForecastingPivot", + "NewName": "ForecastingPivot", + "Module": "timeseries", + "Type": "Transform" + }, { "Name": "Trainers.AveragedPerceptronBinaryClassifier", "NewName": "AveragedPerceptronBinaryClassifier", From 6a2a913c51eb2e9a6fc6ba90ddd40c50e4d0048f Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Sun, 19 Apr 2020 09:04:44 -0700 Subject: [PATCH 09/34] Updated with latest changes --- nuget.config | 3 +- src/DotNetBridge/DotNetBridge.csproj | 2 +- src/Platforms/build.csproj | 2 +- src/python/nimbusml.pyproj | 15 +- .../nimbusml/examples/ForecastingPivot.py | 31 + .../nimbusml/examples/LagLeadOperator.py | 26 + src/python/nimbusml/examples/RollingWindow.py | 27 + src/python/nimbusml/examples/ShortDrop.py | 23 + .../timeseries/analyticalrollingwindow.py | 75 --- .../core/timeseries/forecastingpivot.py | 7 +- .../core/timeseries/lagleadoperator.py | 46 +- .../internal/core/timeseries/rollingwindow.py | 108 ++++ 
.../internal/core/timeseries/shortdrop.py | 24 +- .../core/timeseries/simplerollingwindow.py | 75 --- ...partitionedpathparser_parquetpathparser.py | 26 - ..._partitionedpathparser_simplepathparser.py | 71 -- .../transforms_analyticalrollingwindow.py | 103 --- .../transforms_forecastingpivot.py | 9 + .../entrypoints/transforms_lagleadoperator.py | 17 +- ...gwindow.py => transforms_rollingwindow.py} | 34 +- .../entrypoints/transforms_shortdrop.py | 33 +- src/python/nimbusml/timeseries/__init__.py | 10 +- .../timeseries/analyticalrollingwindow.py | 77 --- .../nimbusml/timeseries/forecastingpivot.py | 4 + .../nimbusml/timeseries/lagleadoperator.py | 6 +- ...implerollingwindow.py => rollingwindow.py} | 23 +- src/python/nimbusml/timeseries/shortdrop.py | 19 +- src/python/tools/manifest.json | 611 ++++++------------ src/python/tools/manifest_diff.json | 10 +- 29 files changed, 545 insertions(+), 972 deletions(-) create mode 100644 src/python/nimbusml/examples/ForecastingPivot.py create mode 100644 src/python/nimbusml/examples/LagLeadOperator.py create mode 100644 src/python/nimbusml/examples/RollingWindow.py create mode 100644 src/python/nimbusml/examples/ShortDrop.py delete mode 100644 src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py create mode 100644 src/python/nimbusml/internal/core/timeseries/rollingwindow.py delete mode 100644 src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py delete mode 100644 src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py delete mode 100644 src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py delete mode 100644 src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py rename src/python/nimbusml/internal/entrypoints/{transforms_simplerollingwindow.py => transforms_rollingwindow.py} (80%) delete mode 100644 src/python/nimbusml/timeseries/analyticalrollingwindow.py rename src/python/nimbusml/timeseries/{simplerollingwindow.py => rollingwindow.py} (75%) diff --git a/nuget.config b/nuget.config index c0efdcaa..5bf65c94 100644 --- a/nuget.config +++ b/nuget.config @@ -5,7 +5,6 @@ - - + diff --git a/src/DotNetBridge/DotNetBridge.csproj b/src/DotNetBridge/DotNetBridge.csproj index 1132f5f2..3e20c790 100644 --- a/src/DotNetBridge/DotNetBridge.csproj +++ b/src/DotNetBridge/DotNetBridge.csproj @@ -46,7 +46,7 @@ - + diff --git a/src/Platforms/build.csproj b/src/Platforms/build.csproj index 3705a235..b63cfe46 100644 --- a/src/Platforms/build.csproj +++ b/src/Platforms/build.csproj @@ -35,7 +35,7 @@ - + diff --git a/src/python/nimbusml.pyproj b/src/python/nimbusml.pyproj index 24e1bcbc..d6eb1d36 100644 --- a/src/python/nimbusml.pyproj +++ b/src/python/nimbusml.pyproj @@ -92,6 +92,10 @@ + + + + @@ -332,13 +336,12 @@ - + - @@ -419,7 +422,6 @@ - @@ -476,6 +478,7 @@ + @@ -485,7 +488,6 @@ - @@ -551,8 +553,6 @@ - - @@ -759,13 +759,12 @@ - + - diff --git a/src/python/nimbusml/examples/ForecastingPivot.py b/src/python/nimbusml/examples/ForecastingPivot.py new file mode 100644 index 00000000..98d41871 --- /dev/null +++ b/src/python/nimbusml/examples/ForecastingPivot.py @@ -0,0 +1,31 @@ +############################################################################### +# DateTimeSplitter +import pandas as pd +import numpy as np +from nimbusml import FileDataStream, Pipeline +from nimbusml.datasets import get_dataset +from nimbusml.timeseries import ForecastingPivot, RollingWindow + +# data input (as a FileDataStream) +path = get_dataset('infert').as_filepath() +data = 
FileDataStream.read_csv(path, sep=',', numeric_dtype=np.double)
+
+# transform usage
+xf = RollingWindow(columns={'age_1': 'age'},
+                   grain_column=['education'],
+                   window_calculation='Mean',
+                   max_window_size=1,
+                   horizon=1)
+
+xf1 = ForecastingPivot(columns_to_pivot=['age_1'])
+
+pipe = Pipeline([xf, xf1])
+
+# fit and transform
+features = pipe.fit_transform(data)
+
+features = features.drop(['row_num', 'education', 'parity', 'induced',
+                          'case', 'spontaneous', 'stratum', 'pooled.stratum'], axis=1)
+
+# print features
+print(features.head(100))
diff --git a/src/python/nimbusml/examples/LagLeadOperator.py b/src/python/nimbusml/examples/LagLeadOperator.py
new file mode 100644
index 00000000..9424b2aa
--- /dev/null
+++ b/src/python/nimbusml/examples/LagLeadOperator.py
@@ -0,0 +1,26 @@
+###############################################################################
+# LagLeadOperator
+import pandas as pd
+import numpy as np
+from nimbusml import FileDataStream
+from nimbusml.datasets import get_dataset
+from nimbusml.timeseries import LagLeadOperator
+
+# data input (as a FileDataStream)
+path = get_dataset('infert').as_filepath()
+data = FileDataStream.read_csv(path, sep=',', numeric_dtype=np.double)
+
+# transform usage
+xf = LagLeadOperator(columns={'age_1': 'age'},
+                     grain_columns=['education'],
+                     offsets=[-3, 1],
+                     horizon=1)
+
+# fit and transform
+features = xf.fit_transform(data)
+
+features = features.drop(['row_num', 'education', 'parity', 'induced',
+                          'case', 'spontaneous', 'stratum', 'pooled.stratum'], axis=1)
+
+# print features
+print(features.head(100))
diff --git a/src/python/nimbusml/examples/RollingWindow.py b/src/python/nimbusml/examples/RollingWindow.py
new file mode 100644
index 00000000..086f5a7a
--- /dev/null
+++ b/src/python/nimbusml/examples/RollingWindow.py
@@ -0,0 +1,27 @@
+###############################################################################
+# RollingWindow
+import pandas as pd
+import numpy as np
+from nimbusml import FileDataStream
+from nimbusml.datasets import get_dataset
+from nimbusml.timeseries import RollingWindow
+
+# data input (as a FileDataStream)
+path = get_dataset('infert').as_filepath()
+data = FileDataStream.read_csv(path, sep=',', numeric_dtype=np.double)
+
+# transform usage
+xf = RollingWindow(columns={'age_1': 'age'},
+                   grain_column=['education'],
+                   window_calculation='Mean',
+                   max_window_size=2,
+                   horizon=2)
+
+# fit and transform
+features = xf.fit_transform(data)
+
+features = features.drop(['row_num', 'education', 'parity', 'induced',
+                          'case', 'spontaneous', 'stratum', 'pooled.stratum'], axis=1)
+
+# print features
+print(features.head(100))
diff --git a/src/python/nimbusml/examples/ShortDrop.py b/src/python/nimbusml/examples/ShortDrop.py
new file mode 100644
index 00000000..dd8882ab
--- /dev/null
+++ b/src/python/nimbusml/examples/ShortDrop.py
@@ -0,0 +1,23 @@
+###############################################################################
+# ShortDrop
+import pandas as pd
+import numpy as np
+from nimbusml import FileDataStream
+from nimbusml.datasets import get_dataset
+from nimbusml.timeseries import ShortDrop
+
+# data input (as a FileDataStream)
+path = get_dataset('infert').as_filepath()
+data = FileDataStream.read_csv(path, sep=',', numeric_dtype=np.double)
+
+# transform usage
+xf = ShortDrop(grain_columns=['education'], min_rows=4294967294) << 'age'
+
+# fit and transform
+features = xf.fit_transform(data)
+
+features = features.drop(['row_num', 'education', 'parity', 'induced',
+                          'case', 'spontaneous',
'stratum', 'pooled.stratum'], axis=1) + +# print features +print(features.head(100)) diff --git a/src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py b/src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py deleted file mode 100644 index 69bfde78..00000000 --- a/src/python/nimbusml/internal/core/timeseries/analyticalrollingwindow.py +++ /dev/null @@ -1,75 +0,0 @@ -# -------------------------------------------------------------------------------------------- -# Copyright (c) Microsoft Corporation. All rights reserved. -# Licensed under the MIT License. -# -------------------------------------------------------------------------------------------- -# - Generated by tools/entrypoint_compiler.py: do not edit by hand -""" -AnalyticalRollingWindow -""" - -__all__ = ["AnalyticalRollingWindow"] - - -from ...entrypoints.transforms_analyticalrollingwindow import \ - transforms_analyticalrollingwindow -from ...utils.utils import trace -from ..base_pipeline_item import BasePipelineItem, DefaultSignature - - -class AnalyticalRollingWindow(BasePipelineItem, DefaultSignature): - """ - **Description** - Performs an analaytical calculation over a rolling timeseries window - - :param grain_columns: List of grain columns. - - :param target_column: Target column. - - :param horizon: Maximum horizon value. - - :param max_window_size: Maximum window size. - - :param min_window_size: Minimum window size. - - :param window_calculation: What window calculation to use. - - :param params: Additional arguments sent to compute engine. - - """ - - @trace - def __init__( - self, - grain_columns, - target_column, - horizon=0, - max_window_size=0, - min_window_size=0, - window_calculation='0', - **params): - BasePipelineItem.__init__( - self, type='transform', **params) - - self.grain_columns = grain_columns - self.target_column = target_column - self.horizon = horizon - self.max_window_size = max_window_size - self.min_window_size = min_window_size - self.window_calculation = window_calculation - - @property - def _entrypoint(self): - return transforms_analyticalrollingwindow - - @trace - def _get_node(self, **all_args): - algo_args = dict( - grain_columns=self.grain_columns, - target_column=self.target_column, - horizon=self.horizon, - max_window_size=self.max_window_size, - min_window_size=self.min_window_size, - window_calculation=self.window_calculation) - - all_args.update(algo_args) - return self._entrypoint(**all_args) diff --git a/src/python/nimbusml/internal/core/timeseries/forecastingpivot.py b/src/python/nimbusml/internal/core/timeseries/forecastingpivot.py index cf499392..c306f5bd 100644 --- a/src/python/nimbusml/internal/core/timeseries/forecastingpivot.py +++ b/src/python/nimbusml/internal/core/timeseries/forecastingpivot.py @@ -23,6 +23,8 @@ class ForecastingPivot(BasePipelineItem, DefaultSignature): :param columns_to_pivot: List of columns to pivot. + :param horizon_column_name: Name of the horizon column generated. + :param params: Additional arguments sent to compute engine. 
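The hunk above gives the generated ForecastingPivot core class a horizon_column_name parameter defaulting to 'Horizon'. A minimal sketch of overriding it, reusing the infert setup from the example files added in this patch; the name 'forecast_step' is purely illustrative:

import numpy as np
from nimbusml import FileDataStream, Pipeline
from nimbusml.datasets import get_dataset
from nimbusml.timeseries import ForecastingPivot, RollingWindow

path = get_dataset('infert').as_filepath()
data = FileDataStream.read_csv(path, sep=',', numeric_dtype=np.double)

xf = RollingWindow(columns={'age_1': 'age'},
                   grain_column=['education'],
                   window_calculation='Mean',
                   max_window_size=1,
                   horizon=1)

# rename the generated horizon column from the default 'Horizon'
xf1 = ForecastingPivot(columns_to_pivot=['age_1'],
                       horizon_column_name='forecast_step')

print(Pipeline([xf, xf1]).fit_transform(data).head())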
""" @@ -31,11 +33,13 @@ class ForecastingPivot(BasePipelineItem, DefaultSignature): def __init__( self, columns_to_pivot, + horizon_column_name='Horizon', **params): BasePipelineItem.__init__( self, type='transform', **params) self.columns_to_pivot = columns_to_pivot + self.horizon_column_name = horizon_column_name @property def _entrypoint(self): @@ -44,7 +48,8 @@ def _entrypoint(self): @trace def _get_node(self, **all_args): algo_args = dict( - columns_to_pivot=self.columns_to_pivot) + columns_to_pivot=self.columns_to_pivot, + horizon_column_name=self.horizon_column_name) all_args.update(algo_args) return self._entrypoint(**all_args) diff --git a/src/python/nimbusml/internal/core/timeseries/lagleadoperator.py b/src/python/nimbusml/internal/core/timeseries/lagleadoperator.py index 4dad5691..991963ef 100644 --- a/src/python/nimbusml/internal/core/timeseries/lagleadoperator.py +++ b/src/python/nimbusml/internal/core/timeseries/lagleadoperator.py @@ -19,12 +19,10 @@ class LagLeadOperator(BasePipelineItem, DefaultSignature): """ **Description** - uses the offset list to create lags and leads + Uses the offset list with the horizon to create lags and leads :param grain_columns: List of grain columns. - :param target_column: Target column. - :param horizon: Maximum horizon value. :param offsets: Lag and Lead offset to use. A negative number is a lag, @@ -38,7 +36,6 @@ class LagLeadOperator(BasePipelineItem, DefaultSignature): def __init__( self, grain_columns, - target_column, offsets, horizon=0, **params): @@ -46,7 +43,6 @@ def __init__( self, type='transform', **params) self.grain_columns = grain_columns - self.target_column = target_column self.offsets = offsets self.horizon = horizon @@ -56,9 +52,47 @@ def _entrypoint(self): @trace def _get_node(self, **all_args): + + input_columns = self.input + if input_columns is None and 'input' in all_args: + input_columns = all_args['input'] + if 'input' in all_args: + all_args.pop('input') + + output_columns = self.output + if output_columns is None and 'output' in all_args: + output_columns = all_args['output'] + if 'output' in all_args: + all_args.pop('output') + + # validate input + if input_columns is None: + raise ValueError( + "'None' input passed when it cannot be none.") + + if not isinstance(input_columns, list): + raise ValueError( + "input has to be a list of strings, instead got %s" % + type(input_columns)) + + # validate output + if output_columns is None: + output_columns = input_columns + + if not isinstance(output_columns, list): + raise ValueError( + "output has to be a list of strings, instead got %s" % + type(output_columns)) + algo_args = dict( + column=[ + dict( + Source=i, + Name=o) for i, + o in zip( + input_columns, + output_columns)] if input_columns else None, grain_columns=self.grain_columns, - target_column=self.target_column, offsets=self.offsets, horizon=self.horizon) diff --git a/src/python/nimbusml/internal/core/timeseries/rollingwindow.py b/src/python/nimbusml/internal/core/timeseries/rollingwindow.py new file mode 100644 index 00000000..4a67f54d --- /dev/null +++ b/src/python/nimbusml/internal/core/timeseries/rollingwindow.py @@ -0,0 +1,108 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. 
+# -------------------------------------------------------------------------------------------- +# - Generated by tools/entrypoint_compiler.py: do not edit by hand +""" +RollingWindow +""" + +__all__ = ["RollingWindow"] + + +from ...entrypoints.transforms_rollingwindow import transforms_rollingwindow +from ...utils.utils import trace +from ..base_pipeline_item import BasePipelineItem, DefaultSignature + + +class RollingWindow(BasePipelineItem, DefaultSignature): + """ + **Description** + Performs a calculation over a rolling timeseries window + + :param grain_column: List of grain columns. + + :param horizon: Maximum horizon value. + + :param max_window_size: Maximum window size. + + :param min_window_size: Minimum window size. + + :param window_calculation: What window calculation to use. + + :param params: Additional arguments sent to compute engine. + + """ + + @trace + def __init__( + self, + grain_column, + horizon=0, + max_window_size=0, + min_window_size=1, + window_calculation='0', + **params): + BasePipelineItem.__init__( + self, type='transform', **params) + + self.grain_column = grain_column + self.horizon = horizon + self.max_window_size = max_window_size + self.min_window_size = min_window_size + self.window_calculation = window_calculation + + @property + def _entrypoint(self): + return transforms_rollingwindow + + @trace + def _get_node(self, **all_args): + + input_columns = self.input + if input_columns is None and 'input' in all_args: + input_columns = all_args['input'] + if 'input' in all_args: + all_args.pop('input') + + output_columns = self.output + if output_columns is None and 'output' in all_args: + output_columns = all_args['output'] + if 'output' in all_args: + all_args.pop('output') + + # validate input + if input_columns is None: + raise ValueError( + "'None' input passed when it cannot be none.") + + if not isinstance(input_columns, list): + raise ValueError( + "input has to be a list of strings, instead got %s" % + type(input_columns)) + + # validate output + if output_columns is None: + output_columns = input_columns + + if not isinstance(output_columns, list): + raise ValueError( + "output has to be a list of strings, instead got %s" % + type(output_columns)) + + algo_args = dict( + column=[ + dict( + Source=i, + Name=o) for i, + o in zip( + input_columns, + output_columns)] if input_columns else None, + grain_column=self.grain_column, + horizon=self.horizon, + max_window_size=self.max_window_size, + min_window_size=self.min_window_size, + window_calculation=self.window_calculation) + + all_args.update(algo_args) + return self._entrypoint(**all_args) diff --git a/src/python/nimbusml/internal/core/timeseries/shortdrop.py b/src/python/nimbusml/internal/core/timeseries/shortdrop.py index 9e228495..30313d7d 100644 --- a/src/python/nimbusml/internal/core/timeseries/shortdrop.py +++ b/src/python/nimbusml/internal/core/timeseries/shortdrop.py @@ -22,14 +22,7 @@ class ShortDrop(BasePipelineItem, DefaultSignature): :param grain_columns: List of grain columns. - :param horizon: Maximum horizon value. - - :param max_window_size: Maximum window size. - - :param cross_validations: Number of cross validations being performed. - - :param offsets: Lag and Lead offset to use. A negative number is a lag, - positive is a lead. + :param min_rows: Minimum number of values required. :param params: Additional arguments sent to compute engine. 
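Note that the new rollingwindow.py above defaults min_window_size to 1, where the deleted SimpleRollingWindow used 0. A short sketch with both window bounds spelled out, reusing the infert data from the examples in this patch:

import numpy as np
from nimbusml import FileDataStream
from nimbusml.datasets import get_dataset
from nimbusml.timeseries import RollingWindow

path = get_dataset('infert').as_filepath()
data = FileDataStream.read_csv(path, sep=',', numeric_dtype=np.double)

# mean over a window of one to two prior values, two steps ahead
xf = RollingWindow(columns={'age_mean': 'age'},
                   grain_column=['education'],
                   window_calculation='Mean',
                   min_window_size=1,
                   max_window_size=2,
                   horizon=2)
print(xf.fit_transform(data).head())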
@@ -39,19 +32,13 @@ class ShortDrop(BasePipelineItem, DefaultSignature): def __init__( self, grain_columns, - offsets, - horizon=0, - max_window_size=0, - cross_validations=0, + min_rows=0, **params): BasePipelineItem.__init__( self, type='transform', **params) self.grain_columns = grain_columns - self.offsets = offsets - self.horizon = horizon - self.max_window_size = max_window_size - self.cross_validations = cross_validations + self.min_rows = min_rows @property def _entrypoint(self): @@ -61,10 +48,7 @@ def _entrypoint(self): def _get_node(self, **all_args): algo_args = dict( grain_columns=self.grain_columns, - offsets=self.offsets, - horizon=self.horizon, - max_window_size=self.max_window_size, - cross_validations=self.cross_validations) + min_rows=self.min_rows) all_args.update(algo_args) return self._entrypoint(**all_args) diff --git a/src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py b/src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py deleted file mode 100644 index 7952887f..00000000 --- a/src/python/nimbusml/internal/core/timeseries/simplerollingwindow.py +++ /dev/null @@ -1,75 +0,0 @@ -# -------------------------------------------------------------------------------------------- -# Copyright (c) Microsoft Corporation. All rights reserved. -# Licensed under the MIT License. -# -------------------------------------------------------------------------------------------- -# - Generated by tools/entrypoint_compiler.py: do not edit by hand -""" -SimpleRollingWindow -""" - -__all__ = ["SimpleRollingWindow"] - - -from ...entrypoints.transforms_simplerollingwindow import \ - transforms_simplerollingwindow -from ...utils.utils import trace -from ..base_pipeline_item import BasePipelineItem, DefaultSignature - - -class SimpleRollingWindow(BasePipelineItem, DefaultSignature): - """ - **Description** - Performs simple rolling window calculations. - - :param grain_columns: List of grain columns. - - :param target_column: Target column. - - :param horizon: Maximum horizon value. - - :param max_window_size: Maximum window size. - - :param min_window_size: Minimum window size. - - :param window_calculation: What window calculation to use. - - :param params: Additional arguments sent to compute engine. 
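ShortDrop above collapses horizon, max_window_size, cross_validations, and offsets into a single min_rows parameter. A minimal sketch on a toy frame; the data is illustrative and assumes ShortDrop accepts a pandas DataFrame the way other nimbusml transforms do:

import pandas as pd
from nimbusml.timeseries import ShortDrop

df = pd.DataFrame({'grain': ['a', 'a', 'a', 'b'],
                   'value': [1.0, 2.0, 3.0, 4.0]})

# grain 'b' has only one row, so min_rows=2 should drop it
xf = ShortDrop(grain_columns=['grain'], min_rows=2) << 'value'
print(xf.fit_transform(df))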
- - """ - - @trace - def __init__( - self, - grain_columns, - target_column, - horizon=0, - max_window_size=0, - min_window_size=0, - window_calculation='0', - **params): - BasePipelineItem.__init__( - self, type='transform', **params) - - self.grain_columns = grain_columns - self.target_column = target_column - self.horizon = horizon - self.max_window_size = max_window_size - self.min_window_size = min_window_size - self.window_calculation = window_calculation - - @property - def _entrypoint(self): - return transforms_simplerollingwindow - - @trace - def _get_node(self, **all_args): - algo_args = dict( - grain_columns=self.grain_columns, - target_column=self.target_column, - horizon=self.horizon, - max_window_size=self.max_window_size, - min_window_size=self.min_window_size, - window_calculation=self.window_calculation) - - all_args.update(algo_args) - return self._entrypoint(**all_args) diff --git a/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py b/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py deleted file mode 100644 index a5c34acb..00000000 --- a/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_parquetpathparser.py +++ /dev/null @@ -1,26 +0,0 @@ -# - Generated by tools/entrypoint_compiler.py: do not edit by hand -""" -ParquetPathParser -""" - - -from ..utils.entrypoints import Component - - -def parquet_path_parser( - **params): - """ - **Description** - Extract name/value pairs from Parquet formatted directory names. - Example path: Year=2018/Month=12/data1.parquet - - """ - - entrypoint_name = 'ParquetPathParser' - settings = {} - - component = Component( - name=entrypoint_name, - settings=settings, - kind='PartitionedPathParser') - return component diff --git a/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py b/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py deleted file mode 100644 index 3f63ac19..00000000 --- a/src/python/nimbusml/internal/entrypoints/_partitionedpathparser_simplepathparser.py +++ /dev/null @@ -1,71 +0,0 @@ -# - Generated by tools/entrypoint_compiler.py: do not edit by hand -""" -SimplePathParser -""" - - -from ..utils.entrypoints import Component -from ..utils.utils import try_set - - -def simple_path_parser( - columns=None, - type='TX', - **params): - """ - **Description** - A simple parser that extracts directory names as column values. - Column names are defined as arguments. - - :param columns: Column definitions used to override the - Partitioned Path Parser. Expected with the format - name:type:numeric-source, for example, col=MyFeature:R4:1 - (settings). - :param type: Data type of each column. (settings). 
- """ - - entrypoint_name = 'SimplePathParser' - settings = {} - - if columns is not None: - settings['Columns'] = try_set( - obj=columns, - none_acceptable=True, - is_of_type=list, - is_column=True) - if type is not None: - settings['Type'] = try_set( - obj=type, - none_acceptable=True, - is_of_type=str, - values=[ - 'I1', - 'U1', - 'I2', - 'U2', - 'I4', - 'U4', - 'I8', - 'U8', - 'R4', - 'Num', - 'R8', - 'TX', - 'Text', - 'TXT', - 'BL', - 'Bool', - 'TimeSpan', - 'TS', - 'DT', - 'DateTime', - 'DZ', - 'DateTimeZone', - 'UG', - 'U16']) - - component = Component( - name=entrypoint_name, - settings=settings, - kind='PartitionedPathParser') - return component diff --git a/src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py b/src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py deleted file mode 100644 index c1ca37f2..00000000 --- a/src/python/nimbusml/internal/entrypoints/transforms_analyticalrollingwindow.py +++ /dev/null @@ -1,103 +0,0 @@ -# - Generated by tools/entrypoint_compiler.py: do not edit by hand -""" -Transforms.AnalyticalRollingWindow -""" - -import numbers - -from ..utils.entrypoints import EntryPoint -from ..utils.utils import try_set, unlist - - -def transforms_analyticalrollingwindow( - grain_columns, - target_column, - data, - output_data=None, - model=None, - horizon=0, - max_window_size=0, - min_window_size=0, - window_calculation='0', - **params): - """ - **Description** - Performs an analaytical calculation over a rolling timeseries window - - :param grain_columns: List of grain columns (inputs). - :param target_column: Target column (inputs). - :param data: Input dataset (inputs). - :param horizon: Maximum horizon value (inputs). - :param max_window_size: Maximum window size (inputs). - :param min_window_size: Minimum window size (inputs). - :param window_calculation: What window calculation to use - (inputs). - :param output_data: Transformed dataset (outputs). - :param model: Transform model (outputs). 
- """ - - entrypoint_name = 'Transforms.AnalyticalRollingWindow' - inputs = {} - outputs = {} - - if grain_columns is not None: - inputs['GrainColumns'] = try_set( - obj=grain_columns, - none_acceptable=False, - is_of_type=list, - is_column=True) - if target_column is not None: - inputs['TargetColumn'] = try_set( - obj=target_column, - none_acceptable=False, - is_of_type=str, - is_column=True) - if data is not None: - inputs['Data'] = try_set( - obj=data, - none_acceptable=False, - is_of_type=str) - if horizon is not None: - inputs['Horizon'] = try_set( - obj=horizon, - none_acceptable=False, - is_of_type=numbers.Real) - if max_window_size is not None: - inputs['MaxWindowSize'] = try_set( - obj=max_window_size, - none_acceptable=False, - is_of_type=numbers.Real) - if min_window_size is not None: - inputs['MinWindowSize'] = try_set( - obj=min_window_size, - none_acceptable=False, - is_of_type=numbers.Real) - if window_calculation is not None: - inputs['WindowCalculation'] = try_set( - obj=window_calculation, - none_acceptable=False, - is_of_type=str, - values=['Mean']) - if output_data is not None: - outputs['OutputData'] = try_set( - obj=output_data, - none_acceptable=False, - is_of_type=str) - if model is not None: - outputs['Model'] = try_set( - obj=model, - none_acceptable=False, - is_of_type=str) - - input_variables = { - x for x in unlist(inputs.values()) - if isinstance(x, str) and x.startswith("$")} - output_variables = { - x for x in unlist(outputs.values()) - if isinstance(x, str) and x.startswith("$")} - - entrypoint = EntryPoint( - name=entrypoint_name, inputs=inputs, outputs=outputs, - input_variables=input_variables, - output_variables=output_variables) - return entrypoint diff --git a/src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py b/src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py index ebf94c23..fee7b30d 100644 --- a/src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py +++ b/src/python/nimbusml/internal/entrypoints/transforms_forecastingpivot.py @@ -13,12 +13,15 @@ def transforms_forecastingpivot( data, output_data=None, model=None, + horizon_column_name='Horizon', **params): """ **Description** Pivots the input colums and drops any rows with N/A :param columns_to_pivot: List of columns to pivot (inputs). + :param horizon_column_name: Name of the horizon column generated. + (inputs). :param data: Input dataset (inputs). :param output_data: Transformed dataset (outputs). :param model: Transform model (outputs). 
@@ -34,6 +37,12 @@ def transforms_forecastingpivot( none_acceptable=False, is_of_type=list, is_column=True) + if horizon_column_name is not None: + inputs['HorizonColumnName'] = try_set( + obj=horizon_column_name, + none_acceptable=True, + is_of_type=str, + is_column=True) if data is not None: inputs['Data'] = try_set( obj=data, diff --git a/src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py b/src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py index e840bd66..88f63edd 100644 --- a/src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py +++ b/src/python/nimbusml/internal/entrypoints/transforms_lagleadoperator.py @@ -11,7 +11,7 @@ def transforms_lagleadoperator( grain_columns, - target_column, + column, data, offsets, output_data=None, @@ -20,10 +20,11 @@ def transforms_lagleadoperator( **params): """ **Description** - uses the offset list to create lags and leads + Uses the offset list with the horizon to create lags and leads :param grain_columns: List of grain columns (inputs). - :param target_column: Target column (inputs). + :param column: New column definition (optional form: name:src) + (inputs). :param data: Input dataset (inputs). :param horizon: Maximum horizon value (inputs). :param offsets: Lag and Lead offset to use. A negative number is @@ -42,11 +43,11 @@ def transforms_lagleadoperator( none_acceptable=False, is_of_type=list, is_column=True) - if target_column is not None: - inputs['TargetColumn'] = try_set( - obj=target_column, + if column is not None: + inputs['Column'] = try_set( + obj=column, none_acceptable=False, - is_of_type=str, + is_of_type=list, is_column=True) if data is not None: inputs['Data'] = try_set( @@ -59,7 +60,7 @@ def transforms_lagleadoperator( none_acceptable=False, is_of_type=numbers.Real) if offsets is not None: - inputs['offsets'] = try_set( + inputs['Offsets'] = try_set( obj=offsets, none_acceptable=False, is_of_type=list) diff --git a/src/python/nimbusml/internal/entrypoints/transforms_simplerollingwindow.py b/src/python/nimbusml/internal/entrypoints/transforms_rollingwindow.py similarity index 80% rename from src/python/nimbusml/internal/entrypoints/transforms_simplerollingwindow.py rename to src/python/nimbusml/internal/entrypoints/transforms_rollingwindow.py index 36f8eb43..0bd8823c 100644 --- a/src/python/nimbusml/internal/entrypoints/transforms_simplerollingwindow.py +++ b/src/python/nimbusml/internal/entrypoints/transforms_rollingwindow.py @@ -1,6 +1,6 @@ # - Generated by tools/entrypoint_compiler.py: do not edit by hand """ -Transforms.SimpleRollingWindow +Transforms.RollingWindow """ import numbers @@ -9,23 +9,24 @@ from ..utils.utils import try_set, unlist -def transforms_simplerollingwindow( - grain_columns, - target_column, +def transforms_rollingwindow( + grain_column, + column, data, output_data=None, model=None, horizon=0, max_window_size=0, - min_window_size=0, + min_window_size=1, window_calculation='0', **params): """ **Description** - Performs simple rolling window calculations. + Performs a calculation over a rolling timeseries window - :param grain_columns: List of grain columns (inputs). - :param target_column: Target column (inputs). + :param grain_column: List of grain columns (inputs). + :param column: New column definition (optional form: name:src) + (inputs). :param data: Input dataset (inputs). :param horizon: Maximum horizon value (inputs). :param max_window_size: Maximum window size (inputs). 
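At the entrypoint level, transforms_lagleadoperator above now takes the column list built by _get_node and emits the capitalized 'Offsets' input. A sketch of a direct call; '$input_data' follows the $-prefixed graph-variable convention these entrypoints use, and the values are illustrative:

from nimbusml.internal.entrypoints.transforms_lagleadoperator import \
    transforms_lagleadoperator

node = transforms_lagleadoperator(
    grain_columns=['education'],
    column=[dict(Source='age', Name='age_1')],
    data='$input_data',
    offsets=[-1, 1],  # one lag and one lead
    horizon=2)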
@@ -36,21 +37,21 @@ def transforms_simplerollingwindow( :param model: Transform model (outputs). """ - entrypoint_name = 'Transforms.SimpleRollingWindow' + entrypoint_name = 'Transforms.RollingWindow' inputs = {} outputs = {} - if grain_columns is not None: - inputs['GrainColumns'] = try_set( - obj=grain_columns, + if grain_column is not None: + inputs['GrainColumn'] = try_set( + obj=grain_column, none_acceptable=False, is_of_type=list, is_column=True) - if target_column is not None: - inputs['TargetColumn'] = try_set( - obj=target_column, + if column is not None: + inputs['Column'] = try_set( + obj=column, none_acceptable=False, - is_of_type=str, + is_of_type=list, is_column=True) if data is not None: inputs['Data'] = try_set( @@ -78,6 +79,7 @@ def transforms_simplerollingwindow( none_acceptable=False, is_of_type=str, values=[ + 'Mean', 'Min', 'Max']) if output_data is not None: diff --git a/src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py b/src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py index bae78343..8be2424d 100644 --- a/src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py +++ b/src/python/nimbusml/internal/entrypoints/transforms_shortdrop.py @@ -12,25 +12,17 @@ def transforms_shortdrop( grain_columns, data, - offsets, output_data=None, model=None, - horizon=0, - max_window_size=0, - cross_validations=0, + min_rows=0, **params): """ **Description** Drops rows if there aren't enough values per grain. :param grain_columns: List of grain columns (inputs). - :param horizon: Maximum horizon value (inputs). + :param min_rows: Minimum number of values required (inputs). :param data: Input dataset (inputs). - :param max_window_size: Maximum window size (inputs). - :param cross_validations: Number of cross validations being - performed. (inputs). - :param offsets: Lag and Lead offset to use. A negative number is - a lag, positive is a lead (inputs). :param output_data: Transformed dataset (outputs). :param model: Transform model (outputs). 
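With the simple/analytical split gone, the renamed Transforms.RollingWindow entrypoint accepts 'Mean', 'Min', and 'Max' in one enum, as the try_set values above show. A quick sketch cycling through them on the public wrapper:

from nimbusml.timeseries import RollingWindow

for calc in ('Mean', 'Min', 'Max'):
    xf = RollingWindow(columns={'age_' + calc.lower(): 'age'},
                       grain_column=['education'],
                       window_calculation=calc,
                       max_window_size=2,
                       horizon=1)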
""" @@ -45,9 +37,9 @@ def transforms_shortdrop( none_acceptable=False, is_of_type=list, is_column=True) - if horizon is not None: - inputs['Horizon'] = try_set( - obj=horizon, + if min_rows is not None: + inputs['MinRows'] = try_set( + obj=min_rows, none_acceptable=False, is_of_type=numbers.Real) if data is not None: @@ -55,21 +47,6 @@ def transforms_shortdrop( obj=data, none_acceptable=False, is_of_type=str) - if max_window_size is not None: - inputs['MaxWindowSize'] = try_set( - obj=max_window_size, - none_acceptable=False, - is_of_type=numbers.Real) - if cross_validations is not None: - inputs['CrossValidations'] = try_set( - obj=cross_validations, - none_acceptable=True, - is_of_type=numbers.Real) - if offsets is not None: - inputs['offsets'] = try_set( - obj=offsets, - none_acceptable=False, - is_of_type=list) if output_data is not None: outputs['OutputData'] = try_set( obj=output_data, diff --git a/src/python/nimbusml/timeseries/__init__.py b/src/python/nimbusml/timeseries/__init__.py index 05dbfa3c..6476cbc2 100644 --- a/src/python/nimbusml/timeseries/__init__.py +++ b/src/python/nimbusml/timeseries/__init__.py @@ -4,6 +4,10 @@ from .ssachangepointdetector import SsaChangePointDetector from .ssaforecaster import SsaForecaster from .timeseriesimputer import TimeSeriesImputer +from .rollingwindow import RollingWindow +from .shortdrop import ShortDrop +from .lagleadoperator import LagLeadOperator +from .forecastingpivot import ForecastingPivot __all__ = [ 'IidSpikeDetector', @@ -11,5 +15,9 @@ 'SsaSpikeDetector', 'SsaChangePointDetector', 'SsaForecaster', - 'TimeSeriesImputer' + 'TimeSeriesImputer', + 'RollingWindow', + 'ShortDrop', + 'LagLeadOperator', + 'ForecastingPivot', ] diff --git a/src/python/nimbusml/timeseries/analyticalrollingwindow.py b/src/python/nimbusml/timeseries/analyticalrollingwindow.py deleted file mode 100644 index 8cdc00d0..00000000 --- a/src/python/nimbusml/timeseries/analyticalrollingwindow.py +++ /dev/null @@ -1,77 +0,0 @@ -# -------------------------------------------------------------------------------------------- -# Copyright (c) Microsoft Corporation. All rights reserved. -# Licensed under the MIT License. -# -------------------------------------------------------------------------------------------- -# - Generated by tools/entrypoint_compiler.py: do not edit by hand -""" -AnalyticalRollingWindow -""" - -__all__ = ["AnalyticalRollingWindow"] - - -from sklearn.base import TransformerMixin - -from ..base_transform import BaseTransform -from ..internal.core.timeseries.analyticalrollingwindow import \ - AnalyticalRollingWindow as core -from ..internal.utils.utils import trace - - -class AnalyticalRollingWindow( - core, - BaseTransform, - TransformerMixin): - """ - **Description** - Performs an analaytical calculation over a rolling timeseries window - - :param columns: see `Columns `_. - - :param grain_columns: List of grain columns. - - :param target_column: Target column. - - :param horizon: Maximum horizon value. - - :param max_window_size: Maximum window size. - - :param min_window_size: Minimum window size. - - :param window_calculation: What window calculation to use. - - :param params: Additional arguments sent to compute engine. 
- - """ - - @trace - def __init__( - self, - grain_columns, - target_column, - horizon=0, - max_window_size=0, - min_window_size=0, - window_calculation='0', - columns=None, - **params): - - if columns: - params['columns'] = columns - BaseTransform.__init__(self, **params) - core.__init__( - self, - grain_columns=grain_columns, - target_column=target_column, - horizon=horizon, - max_window_size=max_window_size, - min_window_size=min_window_size, - window_calculation=window_calculation, - **params) - self._columns = columns - - def get_params(self, deep=False): - """ - Get the parameters for this operator. - """ - return core.get_params(self) diff --git a/src/python/nimbusml/timeseries/forecastingpivot.py b/src/python/nimbusml/timeseries/forecastingpivot.py index bb58b553..c01cddba 100644 --- a/src/python/nimbusml/timeseries/forecastingpivot.py +++ b/src/python/nimbusml/timeseries/forecastingpivot.py @@ -27,6 +27,8 @@ class ForecastingPivot(core, BaseTransform, TransformerMixin): :param columns_to_pivot: List of columns to pivot. + :param horizon_column_name: Name of the horizon column generated. + :param params: Additional arguments sent to compute engine. """ @@ -35,6 +37,7 @@ class ForecastingPivot(core, BaseTransform, TransformerMixin): def __init__( self, columns_to_pivot, + horizon_column_name='Horizon', columns=None, **params): @@ -44,6 +47,7 @@ def __init__( core.__init__( self, columns_to_pivot=columns_to_pivot, + horizon_column_name=horizon_column_name, **params) self._columns = columns diff --git a/src/python/nimbusml/timeseries/lagleadoperator.py b/src/python/nimbusml/timeseries/lagleadoperator.py index 373d4334..6a524114 100644 --- a/src/python/nimbusml/timeseries/lagleadoperator.py +++ b/src/python/nimbusml/timeseries/lagleadoperator.py @@ -20,14 +20,12 @@ class LagLeadOperator(core, BaseTransform, TransformerMixin): """ **Description** - uses the offset list to create lags and leads + Uses the offset list with the horizon to create lags and leads :param columns: see `Columns `_. :param grain_columns: List of grain columns. - :param target_column: Target column. - :param horizon: Maximum horizon value. :param offsets: Lag and Lead offset to use. 
A negative number is a lag, @@ -41,7 +39,6 @@ class LagLeadOperator(core, BaseTransform, TransformerMixin): def __init__( self, grain_columns, - target_column, offsets, horizon=0, columns=None, @@ -53,7 +50,6 @@ def __init__( core.__init__( self, grain_columns=grain_columns, - target_column=target_column, offsets=offsets, horizon=horizon, **params) diff --git a/src/python/nimbusml/timeseries/simplerollingwindow.py b/src/python/nimbusml/timeseries/rollingwindow.py similarity index 75% rename from src/python/nimbusml/timeseries/simplerollingwindow.py rename to src/python/nimbusml/timeseries/rollingwindow.py index b3d506fb..703e4324 100644 --- a/src/python/nimbusml/timeseries/simplerollingwindow.py +++ b/src/python/nimbusml/timeseries/rollingwindow.py @@ -4,30 +4,27 @@ # -------------------------------------------------------------------------------------------- # - Generated by tools/entrypoint_compiler.py: do not edit by hand """ -SimpleRollingWindow +RollingWindow """ -__all__ = ["SimpleRollingWindow"] +__all__ = ["RollingWindow"] from sklearn.base import TransformerMixin from ..base_transform import BaseTransform -from ..internal.core.timeseries.simplerollingwindow import \ - SimpleRollingWindow as core +from ..internal.core.timeseries.rollingwindow import RollingWindow as core from ..internal.utils.utils import trace -class SimpleRollingWindow(core, BaseTransform, TransformerMixin): +class RollingWindow(core, BaseTransform, TransformerMixin): """ **Description** - Performs simple rolling window calculations. + Performs a calculation over a rolling timeseries window :param columns: see `Columns `_. - :param grain_columns: List of grain columns. - - :param target_column: Target column. + :param grain_column: List of grain columns. :param horizon: Maximum horizon value. @@ -44,11 +41,10 @@ class SimpleRollingWindow(core, BaseTransform, TransformerMixin): @trace def __init__( self, - grain_columns, - target_column, + grain_column, horizon=0, max_window_size=0, - min_window_size=0, + min_window_size=1, window_calculation='0', columns=None, **params): @@ -58,8 +54,7 @@ def __init__( BaseTransform.__init__(self, **params) core.__init__( self, - grain_columns=grain_columns, - target_column=target_column, + grain_column=grain_column, horizon=horizon, max_window_size=max_window_size, min_window_size=min_window_size, diff --git a/src/python/nimbusml/timeseries/shortdrop.py b/src/python/nimbusml/timeseries/shortdrop.py index 0e5e8a7e..c605ac0c 100644 --- a/src/python/nimbusml/timeseries/shortdrop.py +++ b/src/python/nimbusml/timeseries/shortdrop.py @@ -26,14 +26,7 @@ class ShortDrop(core, BaseTransform, TransformerMixin): :param grain_columns: List of grain columns. - :param horizon: Maximum horizon value. - - :param max_window_size: Maximum window size. - - :param cross_validations: Number of cross validations being performed. - - :param offsets: Lag and Lead offset to use. A negative number is a lag, - positive is a lead. + :param min_rows: Minimum number of values required. :param params: Additional arguments sent to compute engine. 
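On the public wrapper, target_column is gone and the source/output pair comes from the usual nimbusml columns dict instead. A compact sketch mirroring the LagLeadOperator example file added earlier in this patch:

import numpy as np
from nimbusml import FileDataStream
from nimbusml.datasets import get_dataset
from nimbusml.timeseries import LagLeadOperator

path = get_dataset('infert').as_filepath()
data = FileDataStream.read_csv(path, sep=',', numeric_dtype=np.double)

# 'age' is the source column; 'age_1' holds the generated lags/leads
xf = LagLeadOperator(columns={'age_1': 'age'},
                     grain_columns=['education'],
                     offsets=[-3, 1],
                     horizon=1)
print(xf.fit_transform(data).head())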
@@ -43,10 +36,7 @@ class ShortDrop(core, BaseTransform, TransformerMixin): def __init__( self, grain_columns, - offsets, - horizon=0, - max_window_size=0, - cross_validations=0, + min_rows=0, columns=None, **params): @@ -56,10 +46,7 @@ def __init__( core.__init__( self, grain_columns=grain_columns, - offsets=offsets, - horizon=horizon, - max_window_size=max_window_size, - cross_validations=cross_validations, + min_rows=min_rows, **params) self._columns = columns diff --git a/src/python/tools/manifest.json b/src/python/tools/manifest.json index 615c2303..5be33996 100644 --- a/src/python/tools/manifest.json +++ b/src/python/tools/manifest.json @@ -17084,118 +17084,6 @@ "ITrainerOutput" ] }, - { - "Name": "Transforms.AnalyticalRollingWindow", - "Desc": "Performs an analaytical calculation over a rolling timeseries window", - "FriendlyName": "AnalyticalRollingWindowTransformer", - "ShortName": "AnalyticalRollingWindowTransformer", - "Inputs": [ - { - "Name": "GrainColumns", - "Type": { - "Kind": "Array", - "ItemType": "String" - }, - "Desc": "List of grain columns", - "Aliases": [ - "grains" - ], - "Required": true, - "SortOrder": 0.0, - "IsNullable": false - }, - { - "Name": "TargetColumn", - "Type": "String", - "Desc": "Target column", - "Aliases": [ - "target" - ], - "Required": true, - "SortOrder": 1.0, - "IsNullable": false - }, - { - "Name": "Data", - "Type": "DataView", - "Desc": "Input dataset", - "Required": true, - "SortOrder": 1.0, - "IsNullable": false - }, - { - "Name": "Horizon", - "Type": "UInt", - "Desc": "Maximum horizon value", - "Aliases": [ - "hor" - ], - "Required": true, - "SortOrder": 2.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "MaxWindowSize", - "Type": "UInt", - "Desc": "Maximum window size", - "Aliases": [ - "maxsize" - ], - "Required": true, - "SortOrder": 3.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "MinWindowSize", - "Type": "UInt", - "Desc": "Minimum window size", - "Aliases": [ - "minsize" - ], - "Required": true, - "SortOrder": 4.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "WindowCalculation", - "Type": { - "Kind": "Enum", - "Values": [ - "Mean" - ] - }, - "Desc": "What window calculation to use", - "Aliases": [ - "calc" - ], - "Required": true, - "SortOrder": 5.0, - "IsNullable": false, - "Default": "0" - } - ], - "Outputs": [ - { - "Name": "OutputData", - "Type": "DataView", - "Desc": "Transformed dataset" - }, - { - "Name": "Model", - "Type": "TransformModel", - "Desc": "Transform model" - } - ], - "InputKind": [ - "ITransformInput" - ], - "OutputKind": [ - "ITransformOutput" - ] - }, { "Name": "Transforms.ApproximateBootstrapSampler", "Desc": "Approximate bootstrap sampling.", @@ -18707,7 +18595,7 @@ ] }, { - "Name": "Transforms.DatasetScorerEx", + "Name": "Transforms.DatasetScorerEx", "Desc": "Score a dataset with a predictor model", "FriendlyName": null, "ShortName": null, @@ -18752,7 +18640,7 @@ ] }, { - "Name": "Transforms.DatasetTransformScorer", + "Name": "Transforms.DatasetTransformScorer", "Desc": "Score a dataset with a transform model", "FriendlyName": null, "ShortName": null, @@ -19369,6 +19257,18 @@ "SortOrder": 0.0, "IsNullable": false }, + { + "Name": "HorizonColumnName", + "Type": "String", + "Desc": "Name of the horizon column generated.", + "Aliases": [ + "hor" + ], + "Required": false, + "SortOrder": 1.0, + "IsNullable": false, + "Default": "Horizon" + }, { "Name": "Data", "Type": "DataView", @@ -20628,9 +20528,9 @@ }, { "Name": "Transforms.LagLeadOperator", - "Desc": "uses the offset list 
to create lags and leads", - "FriendlyName": "LagLeadOperatorTransformer", - "ShortName": "LagLeadOperatorTransformer", + "Desc": "Uses the offset list with the horizon to create lags and leads", + "FriendlyName": "LagLeadOperator", + "ShortName": "LagLead", "Inputs": [ { "Name": "GrainColumns", @@ -20647,11 +20547,42 @@ "IsNullable": false }, { - "Name": "TargetColumn", - "Type": "String", - "Desc": "Target column", + "Name": "Column", + "Type": { + "Kind": "Array", + "ItemType": { + "Kind": "Struct", + "Fields": [ + { + "Name": "Name", + "Type": "String", + "Desc": "Name of the new column", + "Aliases": [ + "name" + ], + "Required": false, + "SortOrder": 150.0, + "IsNullable": false, + "Default": null + }, + { + "Name": "Source", + "Type": "String", + "Desc": "Name of the source column", + "Aliases": [ + "src" + ], + "Required": false, + "SortOrder": 150.0, + "IsNullable": false, + "Default": null + } + ] + } + }, + "Desc": "New column definition (optional form: name:src)", "Aliases": [ - "target" + "col" ], "Required": true, "SortOrder": 1.0, @@ -20678,7 +20609,7 @@ "Default": 0 }, { - "Name": "offsets", + "Name": "Offsets", "Type": { "Kind": "Array", "ItemType": "Int" @@ -23085,6 +23016,151 @@ "ITransformOutput" ] }, + { + "Name": "Transforms.RollingWindow", + "Desc": "Performs a calculation over a rolling timeseries window", + "FriendlyName": "Rolling Window Featurizer", + "ShortName": "RollingWindow", + "Inputs": [ + { + "Name": "GrainColumn", + "Type": { + "Kind": "Array", + "ItemType": "String" + }, + "Desc": "List of grain columns", + "Aliases": [ + "grains" + ], + "Required": true, + "SortOrder": 0.0, + "IsNullable": false + }, + { + "Name": "Column", + "Type": { + "Kind": "Array", + "ItemType": { + "Kind": "Struct", + "Fields": [ + { + "Name": "Name", + "Type": "String", + "Desc": "Name of the new column", + "Aliases": [ + "name" + ], + "Required": false, + "SortOrder": 150.0, + "IsNullable": false, + "Default": null + }, + { + "Name": "Source", + "Type": "String", + "Desc": "Name of the source column", + "Aliases": [ + "src" + ], + "Required": false, + "SortOrder": 150.0, + "IsNullable": false, + "Default": null + } + ] + } + }, + "Desc": "New column definition (optional form: name:src)", + "Aliases": [ + "col" + ], + "Required": true, + "SortOrder": 1.0, + "IsNullable": false + }, + { + "Name": "Data", + "Type": "DataView", + "Desc": "Input dataset", + "Required": true, + "SortOrder": 1.0, + "IsNullable": false + }, + { + "Name": "Horizon", + "Type": "UInt", + "Desc": "Maximum horizon value", + "Aliases": [ + "hor" + ], + "Required": true, + "SortOrder": 2.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "MaxWindowSize", + "Type": "UInt", + "Desc": "Maximum window size", + "Aliases": [ + "maxsize" + ], + "Required": true, + "SortOrder": 3.0, + "IsNullable": false, + "Default": 0 + }, + { + "Name": "MinWindowSize", + "Type": "UInt", + "Desc": "Minimum window size", + "Aliases": [ + "minsize" + ], + "Required": true, + "SortOrder": 4.0, + "IsNullable": false, + "Default": 1 + }, + { + "Name": "WindowCalculation", + "Type": { + "Kind": "Enum", + "Values": [ + "Mean", + "Min", + "Max" + ] + }, + "Desc": "What window calculation to use", + "Aliases": [ + "calc" + ], + "Required": true, + "SortOrder": 5.0, + "IsNullable": false, + "Default": "0" + } + ], + "Outputs": [ + { + "Name": "OutputData", + "Type": "DataView", + "Desc": "Transformed dataset" + }, + { + "Name": "Model", + "Type": "TransformModel", + "Desc": "Transform model" + } + ], + "InputKind": [ + 
"ITransformInput" + ], + "OutputKind": [ + "ITransformOutput" + ] + }, { "Name": "Transforms.RowRangeFilter", "Desc": "Filters a dataview on a column of type Single, Double or Key (contiguous). Keeps the values that are in the specified min/max range. NaNs are always filtered out. If the input is a Key type, the min/max are considered percentages of the number of values.", @@ -23545,11 +23621,11 @@ "IsNullable": false }, { - "Name": "Horizon", + "Name": "MinRows", "Type": "UInt", - "Desc": "Maximum horizon value", + "Desc": "Minimum number of values required", "Aliases": [ - "hor" + "minr" ], "Required": true, "SortOrder": 1.0, @@ -23563,157 +23639,6 @@ "Required": true, "SortOrder": 1.0, "IsNullable": false - }, - { - "Name": "MaxWindowSize", - "Type": "UInt", - "Desc": "Maximum window size", - "Aliases": [ - "maxsize" - ], - "Required": true, - "SortOrder": 2.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "CrossValidations", - "Type": "UInt", - "Desc": "Number of cross validations being performed.", - "Aliases": [ - "crossv" - ], - "Required": false, - "SortOrder": 2.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "offsets", - "Type": { - "Kind": "Array", - "ItemType": "Int" - }, - "Desc": "Lag and Lead offset to use. A negative number is a lag, positive is a lead", - "Aliases": [ - "off" - ], - "Required": true, - "SortOrder": 3.0, - "IsNullable": false - } - ], - "Outputs": [ - { - "Name": "OutputData", - "Type": "DataView", - "Desc": "Transformed dataset" - }, - { - "Name": "Model", - "Type": "TransformModel", - "Desc": "Transform model" - } - ], - "InputKind": [ - "ITransformInput" - ], - "OutputKind": [ - "ITransformOutput" - ] - }, - { - "Name": "Transforms.SimpleRollingWindow", - "Desc": "Performs simple rolling window calculations.", - "FriendlyName": "SimpleRollingWindowTransformer", - "ShortName": "SimpleRollingWindowTransformer", - "Inputs": [ - { - "Name": "GrainColumns", - "Type": { - "Kind": "Array", - "ItemType": "String" - }, - "Desc": "List of grain columns", - "Aliases": [ - "grains" - ], - "Required": true, - "SortOrder": 0.0, - "IsNullable": false - }, - { - "Name": "TargetColumn", - "Type": "String", - "Desc": "Target column", - "Aliases": [ - "target" - ], - "Required": true, - "SortOrder": 1.0, - "IsNullable": false - }, - { - "Name": "Data", - "Type": "DataView", - "Desc": "Input dataset", - "Required": true, - "SortOrder": 1.0, - "IsNullable": false - }, - { - "Name": "Horizon", - "Type": "UInt", - "Desc": "Maximum horizon value", - "Aliases": [ - "hor" - ], - "Required": true, - "SortOrder": 2.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "MaxWindowSize", - "Type": "UInt", - "Desc": "Maximum window size", - "Aliases": [ - "maxsize" - ], - "Required": true, - "SortOrder": 3.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "MinWindowSize", - "Type": "UInt", - "Desc": "Minimum window size", - "Aliases": [ - "minsize" - ], - "Required": true, - "SortOrder": 4.0, - "IsNullable": false, - "Default": 0 - }, - { - "Name": "WindowCalculation", - "Type": { - "Kind": "Enum", - "Values": [ - "Min", - "Max" - ] - }, - "Desc": "What window calculation to use", - "Aliases": [ - "calc" - ], - "Required": true, - "SortOrder": 5.0, - "IsNullable": false, - "Default": "0" } ], "Outputs": [ @@ -30582,140 +30507,6 @@ } ] }, - { - "Kind": "PartitionedPathParser", - "Components": [ - { - "Name": "ParquetPathParser", - "Desc": "Extract name/value pairs from Parquet formatted directory names. 
Example path: Year=2018/Month=12/data1.parquet", - "FriendlyName": "Parquet Partitioned Path Parser", - "Aliases": [ - "ParqPP" - ], - "Settings": [] - }, - { - "Name": "SimplePathParser", - "Desc": "A simple parser that extracts directory names as column values. Column names are defined as arguments.", - "FriendlyName": "Simple Partitioned Path Parser", - "Aliases": [ - "SmplPP" - ], - "Settings": [ - { - "Name": "Columns", - "Type": { - "Kind": "Array", - "ItemType": { - "Kind": "Struct", - "Fields": [ - { - "Name": "Name", - "Type": "String", - "Desc": "Name of the column.", - "Required": true, - "SortOrder": 150.0, - "IsNullable": false - }, - { - "Name": "Type", - "Type": { - "Kind": "Enum", - "Values": [ - "I1", - "U1", - "I2", - "U2", - "I4", - "U4", - "I8", - "U8", - "R4", - "Num", - "R8", - "TX", - "Text", - "TXT", - "BL", - "Bool", - "TimeSpan", - "TS", - "DT", - "DateTime", - "DZ", - "DateTimeZone", - "UG", - "U16" - ] - }, - "Desc": "Data type of the column.", - "Required": false, - "SortOrder": 150.0, - "IsNullable": true, - "Default": null - }, - { - "Name": "Source", - "Type": "Int", - "Desc": "Index of the directory representing this column.", - "Required": true, - "SortOrder": 150.0, - "IsNullable": false, - "Default": 0 - } - ] - } - }, - "Desc": "Column definitions used to override the Partitioned Path Parser. Expected with the format name:type:numeric-source, for example, col=MyFeature:R4:1", - "Aliases": [ - "col" - ], - "Required": false, - "SortOrder": 1.0, - "IsNullable": false, - "Default": null - }, - { - "Name": "Type", - "Type": { - "Kind": "Enum", - "Values": [ - "I1", - "U1", - "I2", - "U2", - "I4", - "U4", - "I8", - "U8", - "R4", - "Num", - "R8", - "TX", - "Text", - "TXT", - "BL", - "Bool", - "TimeSpan", - "TS", - "DT", - "DateTime", - "DZ", - "DateTimeZone", - "UG", - "U16" - ] - }, - "Desc": "Data type of each column.", - "Required": false, - "SortOrder": 150.0, - "IsNullable": false, - "Default": "TX" - } - ] - } - ] - }, { "Kind": "RegressionLossFunction", "Components": [ diff --git a/src/python/tools/manifest_diff.json b/src/python/tools/manifest_diff.json index 3b38fb2d..761ea70c 100644 --- a/src/python/tools/manifest_diff.json +++ b/src/python/tools/manifest_diff.json @@ -227,14 +227,8 @@ ], "EntryPoints": [ { - "Name": "Transforms.SimpleRollingWindow", - "NewName": "SimpleRollingWindow", - "Module": "timeseries", - "Type": "Transform" - }, - { - "Name": "Transforms.AnalyticalRollingWindow", - "NewName": "AnalyticalRollingWindow", + "Name": "Transforms.RollingWindow", + "NewName": "RollingWindow", "Module": "timeseries", "Type": "Transform" }, From 7ae2fa91acebdceb169f39fae3de9fe0ab9680f9 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Sun, 19 Apr 2020 10:25:21 -0700 Subject: [PATCH 10/34] add unit tests --- src/python/nimbusml.pyproj | 4 + .../tests/timeseries/test_forecastingpivot.py | 40 +++++++++ .../tests/timeseries/test_lagleadoperator.py | 86 +++++++++++++++++++ .../tests/timeseries/test_rollingwindow.py | 65 ++++++++++++++ .../tests/timeseries/test_shortdrop.py | 40 +++++++++ 5 files changed, 235 insertions(+) create mode 100644 src/python/nimbusml/tests/timeseries/test_forecastingpivot.py create mode 100644 src/python/nimbusml/tests/timeseries/test_lagleadoperator.py create mode 100644 src/python/nimbusml/tests/timeseries/test_rollingwindow.py create mode 100644 src/python/nimbusml/tests/timeseries/test_shortdrop.py diff --git a/src/python/nimbusml.pyproj b/src/python/nimbusml.pyproj index d6eb1d36..81b33718 100644 --- 
a/src/python/nimbusml.pyproj +++ b/src/python/nimbusml.pyproj @@ -753,6 +753,10 @@ + + + + diff --git a/src/python/nimbusml/tests/timeseries/test_forecastingpivot.py b/src/python/nimbusml/tests/timeseries/test_forecastingpivot.py new file mode 100644 index 00000000..8077754d --- /dev/null +++ b/src/python/nimbusml/tests/timeseries/test_forecastingpivot.py @@ -0,0 +1,40 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. +# -------------------------------------------------------------------------------------------- + +import platform +import unittest + +import numpy as np +import pandas as pd +from nimbusml import Pipeline +from nimbusml.timeseries import ForecastingPivot, RollingWindow + +# BUGS +# Removes NaN values? Record 0 is removed +@unittest.skipIf('centos' in platform.linux_distribution()[0].lower(), "centos is not supported") +class TestForecastingPivot(unittest.TestCase): + + def test_simple_pivot(self): + + df = pd.DataFrame(data=dict( + ts=[1.0, 3.0, 5.0, 7.0], + grain=['1970', '1970', '1970', '1970'], + )) + + rw = RollingWindow(columns={'ts_r': 'ts'}, + grain_column=['grain'], + window_calculation='Mean', + max_window_size=1, + horizon=1) + + xf1 = ForecastingPivot(columns_to_pivot=['ts_r']) + + pipe = Pipeline([rw, xf1]) + + result = pipe.fit_transform(df) + + +if __name__ == '__main__': + unittest.main() diff --git a/src/python/nimbusml/tests/timeseries/test_lagleadoperator.py b/src/python/nimbusml/tests/timeseries/test_lagleadoperator.py new file mode 100644 index 00000000..f0609c1b --- /dev/null +++ b/src/python/nimbusml/tests/timeseries/test_lagleadoperator.py @@ -0,0 +1,86 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. 
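+#
+# A pandas-only sketch of the offset semantics exercised below (an analogy
+# for orientation, not the featurizer implementation): offsets act like
+# per-grain shifts, where a negative offset is a lag and a positive offset
+# is a lead. For a single grain:
+#
+#     import pandas as pd
+#     ts = pd.Series([1.0, 3.0, 5.0, 7.0])
+#     ts.shift(1)   # offset -1 -> NaN, 1.0, 3.0, 5.0
+#     ts.shift(-1)  # offset  1 -> 3.0, 5.0, 7.0, NaN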
+# -------------------------------------------------------------------------------------------- + +import platform +import unittest + +import math +import numpy as np +import pandas as pd +from nimbusml.timeseries import LagLeadOperator + + +@unittest.skipIf('centos' in platform.linux_distribution()[0].lower(), "centos is not supported") +class TestLagLeadOperator(unittest.TestCase): + + def test_no_lag(self): + + df = pd.DataFrame(data=dict( + ts=[1.0, 3.0, 5.0, 7.0], + grain=['1970', '1970', '1970', '1970'], + )) + + ll = LagLeadOperator(columns={'ts_r': 'ts'}, + grain_columns=['grain'], + offsets=[0], + horizon=1) + + result = ll.fit_transform(df) + + self.assertEqual(result.loc[0, 'ts_r'], 1) + self.assertEqual(result.loc[1, 'ts_r'], 3) + self.assertEqual(result.loc[2, 'ts_r'], 5) + self.assertEqual(result.loc[3, 'ts_r'], 7) + + def test_simple_horizon(self): + + df = pd.DataFrame(data=dict( + ts=[1.0, 3.0, 5.0, 7.0], + grain=['1970', '1970', '1970', '1970'], + )) + + ll = LagLeadOperator(columns={'ts_r': 'ts'}, + grain_columns=['grain'], + offsets=[0], + horizon=2) + + result = ll.fit_transform(df) + + self.assertTrue(math.isnan(result.loc[0, 'ts_r.0'])) + self.assertEqual(result.loc[1, 'ts_r.0'], 1) + self.assertEqual(result.loc[2, 'ts_r.0'], 3) + self.assertEqual(result.loc[3, 'ts_r.0'], 5) + + self.assertEqual(result.loc[0, 'ts_r.1'], 1) + self.assertEqual(result.loc[1, 'ts_r.1'], 3) + self.assertEqual(result.loc[2, 'ts_r.1'], 5) + self.assertEqual(result.loc[3, 'ts_r.1'], 7) + + def test_simple_lag(self): + + df = pd.DataFrame(data=dict( + ts=[1.0, 3.0, 5.0, 7.0], + grain=['1970', '1970', '1970', '1970'], + )) + + ll = LagLeadOperator(columns={'ts_r': 'ts'}, + grain_columns=['grain'], + offsets=[-1, 1], + horizon=1) + + result = ll.fit_transform(df) + + self.assertTrue(math.isnan(result.loc[0, 'ts_r.0'])) + self.assertEqual(result.loc[1, 'ts_r.0'], 1) + self.assertEqual(result.loc[2, 'ts_r.0'], 3) + self.assertEqual(result.loc[3, 'ts_r.0'], 5) + + self.assertEqual(result.loc[0, 'ts_r.1'], 3) + self.assertEqual(result.loc[1, 'ts_r.1'], 5) + self.assertEqual(result.loc[2, 'ts_r.1'], 7) + self.assertTrue(math.isnan(result.loc[3, 'ts_r.1'])) + +if __name__ == '__main__': + unittest.main() diff --git a/src/python/nimbusml/tests/timeseries/test_rollingwindow.py b/src/python/nimbusml/tests/timeseries/test_rollingwindow.py new file mode 100644 index 00000000..b6ccdc8c --- /dev/null +++ b/src/python/nimbusml/tests/timeseries/test_rollingwindow.py @@ -0,0 +1,65 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. +# -------------------------------------------------------------------------------------------- + +import platform +import unittest + +import math +import numpy as np +import pandas as pd +from nimbusml.timeseries import RollingWindow + + +# BUGS +# Grain is only string? 
Fix the error message as in ShortDrop
+# Horizon predictions are not in correct order, see above
+@unittest.skipIf('centos' in platform.linux_distribution()[0].lower(), "centos is not supported")
+class TestRollingWindow(unittest.TestCase):
+
+    def test_simple_rolling_window(self):
+
+        df = pd.DataFrame(data=dict(
+            ts=[1.0, 3.0, 5.0, 7.0],
+            grain=['1970', '1970', '1970', '1970'],
+        ))
+
+        rw = RollingWindow(columns={'ts_r': 'ts'},
+                           grain_column=['grain'],
+                           window_calculation='Mean',
+                           max_window_size=1,
+                           horizon=2)
+        result = rw.fit_transform(df)
+
+        self.assertTrue(math.isnan(result.loc[0, 'ts_r']))
+        self.assertEqual(result.loc[1, 'ts_r'], 1)
+        self.assertEqual(result.loc[2, 'ts_r'], 3)
+        self.assertEqual(result.loc[3, 'ts_r'], 5)
+
+    def test_simple_rolling_window2(self):
+
+        df = pd.DataFrame(data=dict(
+            ts=[1.0, 3.0, 5.0, 7.0],
+            grain=['1970', '1970', '1970', '1970'],
+        ))
+
+        rw = RollingWindow(columns={'ts_r': 'ts'},
+                           grain_column=['grain'],
+                           window_calculation='Mean',
+                           max_window_size=2,
+                           horizon=2)
+        result = rw.fit_transform(df)
+
+        self.assertTrue(math.isnan(result.loc[0, 'ts_r.0']))
+        self.assertTrue(math.isnan(result.loc[1, 'ts_r.0']))
+        self.assertEqual(result.loc[2, 'ts_r.0'], 1)
+        self.assertEqual(result.loc[3, 'ts_r.0'], 2)
+
+        self.assertTrue(math.isnan(result.loc[0, 'ts_r.1']))
+        self.assertEqual(result.loc[1, 'ts_r.1'], 1)
+        self.assertEqual(result.loc[2, 'ts_r.1'], 2)
+        self.assertEqual(result.loc[3, 'ts_r.1'], 4)
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/src/python/nimbusml/tests/timeseries/test_shortdrop.py b/src/python/nimbusml/tests/timeseries/test_shortdrop.py
new file mode 100644
index 00000000..85fed23b
--- /dev/null
+++ b/src/python/nimbusml/tests/timeseries/test_shortdrop.py
@@ -0,0 +1,40 @@
+# --------------------------------------------------------------------------------------------
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License.
+# --------------------------------------------------------------------------------------------
+
+import platform
+import unittest
+
+import numpy as np
+import pandas as pd
+from nimbusml.timeseries import ShortDrop
+
+
+@unittest.skipIf('centos' in platform.linux_distribution()[0].lower(), "centos is not supported")
+class TestShortDrop(unittest.TestCase):
+
+    def test_no_drops(self):
+
+        df = pd.DataFrame(data=dict(
+            ts=[1.0, 3.0, 5.0, 7.0],
+            grain=['1970', '1970', '1970', '1970'],
+        ))
+
+        sd = ShortDrop(grain_columns=['grain'], min_rows=4) << 'ts'
+        result = sd.fit_transform(df)
+        pd.testing.assert_frame_equal(result, df)
+
+    def test_drop_all(self):
+
+        df = pd.DataFrame(data=dict(
+            ts=[1.0, 3.0, 5.0, 7.0],
+            grain=['1970', '1970', '1970', '1970'],
+        ))
+
+        sd = ShortDrop(grain_columns=['grain'], min_rows=100) << 'ts'
+        result = sd.fit_transform(df)
+        self.assertEqual(len(result), 0)
+
+if __name__ == '__main__':
+    unittest.main()
From e3196c7cdc94d3a8830aaf4724890d94330e4f39 Mon Sep 17 00:00:00 2001
From: Gani Nazirov
Date: Mon, 20 Apr 2020 11:48:06 -0700
Subject: [PATCH 11/34] Add timeseries transforms to onnx suite test. 
Get dependency on ort-featurizers --- build.cmd | 2 +- src/python/tests_extended/test_export_to_onnx.py | 4 ---- 2 files changed, 1 insertion(+), 5 deletions(-) diff --git a/build.cmd b/build.cmd index 95fc02d3..fe4d97a3 100644 --- a/build.cmd +++ b/build.cmd @@ -399,7 +399,7 @@ if "%InstallPythonPackages%" == "True" ( call "%PythonExe%" -m pip install --upgrade pyzmq ) else ( call "%PythonExe%" -m pip install --upgrade "azureml-dataprep>=1.1.33" - call "%PythonExe%" -m pip install --upgrade onnxruntime + call "%PythonExe%" -m pip install --upgrade -i https://test.pypi.org/simple/ ort-nightly-featurizer ) call "%PythonExe%" -m pip install --upgrade "%__currentScriptDir%target\%WheelFile%" diff --git a/src/python/tests_extended/test_export_to_onnx.py b/src/python/tests_extended/test_export_to_onnx.py index 4749fb3a..74454cb8 100644 --- a/src/python/tests_extended/test_export_to_onnx.py +++ b/src/python/tests_extended/test_export_to_onnx.py @@ -118,12 +118,10 @@ 'OnnxRunner', 'Sentiment', 'TensorFlowScorer', - 'TimeSeriesImputer', 'TreeFeaturizer', 'WordEmbedding', 'Binner', 'BootstrapSampler', - 'DateTimeSplitter', 'EnsembleClassifier', 'EnsembleRegressor', 'FactorizationMachineBinaryClassifier', @@ -146,8 +144,6 @@ 'SsaSpikeDetector', 'SymSgdBinaryClassifier', 'TakeFilter', - 'ToKeyImputer', - 'ToString', 'EnsembleClassifier', 'EnsembleRegressor', 'CharTokenizer', From d6ae18f7ab26b8bc7b467f3bdfa06d99bbe16247 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Mon, 20 Apr 2020 12:14:22 -0700 Subject: [PATCH 12/34] Add automl ONNX tests --- src/python/nimbusml.pyproj | 1 + .../tests_extended/test_timeseries_automl.py | 202 ++++++++++++++++++ 2 files changed, 203 insertions(+) create mode 100644 src/python/tests_extended/test_timeseries_automl.py diff --git a/src/python/nimbusml.pyproj b/src/python/nimbusml.pyproj index 81b33718..61a2528a 100644 --- a/src/python/nimbusml.pyproj +++ b/src/python/nimbusml.pyproj @@ -776,6 +776,7 @@ + diff --git a/src/python/tests_extended/test_timeseries_automl.py b/src/python/tests_extended/test_timeseries_automl.py new file mode 100644 index 00000000..1e85f418 --- /dev/null +++ b/src/python/tests_extended/test_timeseries_automl.py @@ -0,0 +1,202 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. 
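+#
+# Every test below reduces to the same fit-then-export pattern; sketched
+# here for orientation (xf stands for any of the transforms under test,
+# and get_tmp_file is the helper defined further down):
+#
+#     xf.fit(df)
+#     xf.export_to_onnx(get_tmp_file('.onnx'), 'com.microsoft.ml',
+#                       dst_json=get_tmp_file('.onnx.json'),
+#                       onnx_version='Stable')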
+# --------------------------------------------------------------------------------------------
+
+import os
+import platform
+import tempfile
+import unittest
+
+import numpy as np
+import pandas as pd
+from nimbusml import Pipeline
+from nimbusml.preprocessing.schema import ColumnSelector
+from nimbusml.preprocessing import ToString, ToKeyImputer, DateTimeSplitter
+from nimbusml.timeseries import TimeSeriesImputer, LagLeadOperator, RollingWindow, ForecastingPivot, ShortDrop
+from data_frame_tool import DataFrameTool as DFT
+
+def get_tmp_file(suffix=None):
+    fd, file_name = tempfile.mkstemp(suffix=suffix)
+    fl = os.fdopen(fd, 'w')
+    fl.close()
+    return file_name
+
+class TestAutoMLTransforms(unittest.TestCase):
+
+    def test_tostring(self):
+        data={'f0': [4, 4, -1, 9],
+              'f1': [5, 5, 3.1, -0.23],
+              'f2': [6, 6.7, np.nan, np.nan]}
+        data = pd.DataFrame(data).astype({'f0': np.int32,
+                                          'f1': np.float32,
+                                          'f2': np.float64})
+
+        xf = ToString(columns={'f0.out': 'f0',
+                               'f1.out': 'f1',
+                               'f2.out': 'f2'})
+        xf.fit(data)
+
+        onnx_path = get_tmp_file('.onnx')
+        onnx_json_path = get_tmp_file('.onnx.json')
+        xf.export_to_onnx(onnx_path,
+                          'com.microsoft.ml',
+                          dst_json=onnx_json_path,
+                          onnx_version='Stable')
+
+    def test_tokeyimputer(self):
+        text_df = pd.DataFrame(
+            data=dict(
+                text=[
+                    "cat",
+                    "dog",
+                    "fish",
+                    "orange",
+                    "cat orange",
+                    "dog",
+                    "fish",
+                    None,
+                    "spider"]))
+
+        xf = ToKeyImputer() << 'text'
+        xf.fit(text_df)
+
+        onnx_path = get_tmp_file('.onnx')
+        onnx_json_path = get_tmp_file('.onnx.json')
+        xf.export_to_onnx(onnx_path,
+                          'com.microsoft.ml',
+                          dst_json=onnx_json_path,
+                          onnx_version='Stable')
+
+    def test_datetimesplitter(self):
+        df = pd.DataFrame(data=dict(
+            tokens1=[1, 2, 3, 157161600],
+            tokens2=[10, 11, 12, 13]
+        ))
+
+        cols_to_drop = [
+            'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter',
+            'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear',
+            'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel',
+            'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff'
+        ]
+
+        dts = DateTimeSplitter(prefix='dt', country='Canada') << 'tokens1'
+        xf = Pipeline([dts, ColumnSelector(drop_columns=cols_to_drop)])
+        xf.fit(df)
+
+        onnx_path = get_tmp_file('.onnx')
+        onnx_json_path = get_tmp_file('.onnx.json')
+        xf.export_to_onnx(onnx_path,
+                          'com.microsoft.ml',
+                          dst_json=onnx_json_path,
+                          onnx_version='Stable')
+
+    def test_timeseriesimputer(self):
+
+        df = pd.DataFrame(data=dict(
+            ts=[1, 2, 3, 5],
+            grain=[1970, 1970, 1970, 1970],
+            c3=[10, 13, 15, 20],
+            c4=[19, 12, 16, 19]
+        ))
+
+        xf = TimeSeriesImputer(time_series_column='ts',
+                               grain_columns=['grain'],
+                               filter_columns=['c3', 'c4'],
+                               impute_mode='ForwardFill',
+                               filter_mode='Include')
+        xf.fit(df)
+
+        onnx_path = get_tmp_file('.onnx')
+        onnx_json_path = get_tmp_file('.onnx.json')
+        xf.export_to_onnx(onnx_path,
+                          'com.microsoft.ml',
+                          dst_json=onnx_json_path,
+                          onnx_version='Stable')
+
+    def test_shortdrop(self):
+
+        df = pd.DataFrame(data=dict(
+            ts=[1.0, 3.0, 5.0, 7.0],
+            grain=['1970', '1970', '1970', '1970'],
+        ))
+
+        xf = ShortDrop(grain_columns=['grain'], min_rows=4) << 'ts'
+        xf.fit(df)
+
+        onnx_path = get_tmp_file('.onnx')
+        onnx_json_path = get_tmp_file('.onnx.json')
+        xf.export_to_onnx(onnx_path,
+                          'com.microsoft.ml',
+                          dst_json=onnx_json_path,
+                          onnx_version='Stable')
+
+    def test_rolling_window(self):
+
+        df = pd.DataFrame(data=dict(
+            ts=[1.0, 3.0, 5.0, 7.0],
+            grain=['1970', '1970', '1970', '1970'],
+        ))
+
+        xf = RollingWindow(columns={'ts_r': 'ts'},
+                           grain_column=['grain'],
+                           window_calculation='Mean',
+                           max_window_size=1,
+                           horizon=2)
+        xf.fit(df)
+
+        onnx_path = 
get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + xf.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + + def test_pivot(self): + + df = pd.DataFrame(data=dict( + ts=[1.0, 3.0, 5.0, 7.0], + grain=['1970', '1970', '1970', '1970'], + )) + + xf0 = RollingWindow(columns={'ts_r': 'ts'}, + grain_column=['grain'], + window_calculation='Mean', + max_window_size=1, + horizon=1) + + xf1 = ForecastingPivot(columns_to_pivot=['ts_r']) + + xf = Pipeline([xf0, xf1]) + + xf.fit(df) + + onnx_path = get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + xf.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + + def test_lag(self): + + df = pd.DataFrame(data=dict( + ts=[1.0, 3.0, 5.0, 7.0], + grain=['1970', '1970', '1970', '1970'], + )) + + xf = LagLeadOperator(columns={'ts_r': 'ts'}, + grain_columns=['grain'], + offsets=[-1, 1], + horizon=1) + + xf.fit(df) + onnx_path = get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + xf.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + +if __name__ == '__main__': + unittest.main() From 7244760cc02db5831fc30d4d030bc2bd889d22c8 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Mon, 20 Apr 2020 12:36:02 -0700 Subject: [PATCH 13/34] 0.4.0 version for Featurizers --- src/DotNetBridge/DotNetBridge.csproj | 2 +- src/Platforms/build.csproj | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/src/DotNetBridge/DotNetBridge.csproj b/src/DotNetBridge/DotNetBridge.csproj index 3e20c790..0bb24a04 100644 --- a/src/DotNetBridge/DotNetBridge.csproj +++ b/src/DotNetBridge/DotNetBridge.csproj @@ -46,7 +46,7 @@ - + diff --git a/src/Platforms/build.csproj b/src/Platforms/build.csproj index b63cfe46..3149c6f3 100644 --- a/src/Platforms/build.csproj +++ b/src/Platforms/build.csproj @@ -35,7 +35,7 @@ - + From f33345262c253371ba806659720a951f7f9b5743 Mon Sep 17 00:00:00 2001 From: Jin Yan Date: Sun, 26 Apr 2020 23:50:28 -0700 Subject: [PATCH 14/34] Featurizer Onnx Export tests (#484) * tests completed * refactor tests * resolve comments * resolve comments * resolve comments --- src/python/tests_extended/test_dft_based.py | 338 +++++++ .../tests_extended/test_tensor_based.py | 846 ++++++++++++++++++ .../test_tensor_invalid_input.py | 403 +++++++++ 3 files changed, 1587 insertions(+) create mode 100644 src/python/tests_extended/test_dft_based.py create mode 100644 src/python/tests_extended/test_tensor_based.py create mode 100644 src/python/tests_extended/test_tensor_invalid_input.py diff --git a/src/python/tests_extended/test_dft_based.py b/src/python/tests_extended/test_dft_based.py new file mode 100644 index 00000000..96d0193c --- /dev/null +++ b/src/python/tests_extended/test_dft_based.py @@ -0,0 +1,338 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. 
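+#
+# Each case in this file is validated end to end: the same frame is run
+# through ML.NET and through ONNX Runtime, and the two outputs are compared
+# column by column. In outline (names refer to the helpers defined below):
+#
+#     result_mlnet = estimator.fit_transform(dataset)
+#     estimator.export_to_onnx(onnx_path, 'com.microsoft.ml',
+#                              dst_json=onnx_json_path,
+#                              onnx_version='Stable')
+#     result_ort = DFT(onnx_path).execute(dataset, [])
+#     validate_results(result_mlnet, result_ort)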
+# -------------------------------------------------------------------------------------------- + +import os +import sys +import io +import platform +import tempfile +import unittest + +import numpy as np +import pandas as pd +from nimbusml import Pipeline +from nimbusml.preprocessing.schema import ColumnSelector +from nimbusml.preprocessing import ToString, ToKeyImputer, DateTimeSplitter +from scipy.sparse import csr_matrix +from nimbusml.timeseries import TimeSeriesImputer, LagLeadOperator, RollingWindow, ForecastingPivot, ShortDrop +from nimbusml.preprocessing import (TensorFlowScorer, FromKey, ToKey, + DateTimeSplitter, OnnxRunner) +import onnxruntime as rt +from data_frame_tool import DataFrameTool as DFT + +TEST_CASES = { + 'DateTimeSplitter_Simple', + 'DateTimeSplitter_Complex', + 'ToKey_SimpleFloat', + 'ToKey_SimpleDouble', + 'ToKey_SimpleString', + 'ToKey_2col_Double', + 'ToKey_2col_Double_String', + 'ToString_Numbers', + 'ToString_Other_Types', + 'TimeSeriesImputer_1grain_2gap', + 'TimeSeriesImputer_1grain_2gap_backfill', + 'TimeSeriesImputer_1grain_2gap_medianfill', + 'TimeSeriesImputer_1grain_2gap', + 'TimeSeriesImputer_1grain_1gap_2filtercolumn', + 'TimeSeriesImputer_2grain_nogap', + 'ShortGrainDropper', + 'RollingWin_Pivot_Integration', + 'Laglead_Pivot_Integration', +} + +INSTANCES = { + 'DateTimeSplitter_Simple': Pipeline([ + DateTimeSplitter(prefix='dt') << 'tokens1', + ColumnSelector(drop_columns=[ + 'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter', + 'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear', + 'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel', + 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff','dtHolidayName' + ]) + ]), + 'DateTimeSplitter_Complex' : Pipeline([ + DateTimeSplitter(prefix='dt') << 'tokens1', + ColumnSelector(drop_columns=[ + 'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter', + 'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear', + 'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel', + 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff','dtHolidayName' + ]) + ]), + 'ToKey_SimpleFloat': ToKeyImputer(), + 'ToKey_SimpleDouble': ToKeyImputer(), + 'ToKey_SimpleString': ToKeyImputer(), + 'ToKey_2col_Double': ToKeyImputer(), + 'ToKey_2col_Double_String': ToKeyImputer(), + 'ToString_Numbers': ToString(columns={'f0.out': 'f0', + 'f1.out': 'f1', + 'f2.out': 'f2'}), + 'ToString_Other_Types': ToString(columns={'f0.out': 'f0', + 'f1.out': 'f1'}), + 'TimeSeriesImputer_1grain_2gap': TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include'), + 'TimeSeriesImputer_1grain_2gap_backfill': TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='BackFill', + filter_mode='Include'), + 'TimeSeriesImputer_1grain_2gap_medianfill': TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='Median', + filter_mode='Include'), + 'TimeSeriesImputer_1grain_1gap_2filtercolumn': TimeSeriesImputer(time_series_column='ts', + grain_columns=['grain'], + filter_columns=['c3', 'c4'], + impute_mode='ForwardFill', + filter_mode='Include'), + 'TimeSeriesImputer_2grain_nogap': TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include'), + 'ShortGrainDropper': ShortDrop(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + min_rows=2), + # For RollingWindow with horizon as 2, max_window_size as 2 and we are 
calculating Mean, assume time frequency is 1 day + # output for each row would be [[mean of (2DaysBeforeYesterday and DayBeforeYesterday), mean of (DayBeforeYesterday and Yesterday)]] + # forecasting pivot will spread this 2d vector out and drop rows that have NaNs in it + 'RollingWin_Pivot_Integration': Pipeline([ + RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Mean', + max_window_size=2, + horizon=2), + ForecastingPivot(columns_to_pivot=['colA1']) + ]), + # For LagLeadOperator with horizon as 2 and offsets as [-2, -1], assume time frequency is 1 day + # output for each row would be [[2DaysBeforeYesterday, DayBeforeYesterday], + # [DayBeforeYesterday, Yesterday]] + # forecasting pivot will spread this 2d vector out and drop rows that have NaNs in it + 'Laglead_Pivot_Integration': Pipeline([ + LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1], + horizon=2), + ForecastingPivot(columns_to_pivot=['colA1']) + ]), +} + +DATASETS = { + 'DateTimeSplitter_Simple': pd.DataFrame(data=dict( + tokens1=[1, 2, 3, 157161600] + )), + 'DateTimeSplitter_Complex': pd.DataFrame(data=dict( + tokens1=[217081624, 1751241600, 217081625, 32445842582] + )), + 'ToKey_SimpleFloat': pd.DataFrame(data=dict( + target=[1.0, 1.0, 1.0, 2.0] + )).astype({'target': np.float64}), + 'ToKey_SimpleDouble': pd.DataFrame(data=dict( + target=[1.0, 1.0, 1.0, 2.0] + )).astype({'target': np.double}), + 'ToKey_SimpleString': pd.DataFrame(data=dict( + target=["one", "one", "one", "two"] + )), + 'ToKey_2col_Double': pd.DataFrame(data=dict( + data1=[1.0, 1.0, 1.0, 2.0], + data2=[2.0, 2.0, 2.0, 3.0], + )).astype({'data1': np.double, + 'data1': np.double}), + 'ToKey_2col_Double_String': pd.DataFrame(data=dict( + data1=[1.0, 1.0, 1.0, 2.0], + data2=["two", "two", "three", "two"], + )), + 'ToString_Numbers': pd.DataFrame(data=dict( + f0= [4, 4, -1, 9], + f1= [5, 5, 3.1, -0.23], + f2= [6, 6.7, np.nan, np.nan] + )), + 'ToString_Other_Types': pd.DataFrame(data=dict( + f0= [True, False], + f1= [123.45, 135453984983490.5473] + )).astype({'f0': bool, + 'f1': np.double}), + 'TimeSeriesImputer_1grain_2gap': pd.DataFrame(data=dict( + ts=[1, 2, 3, 5, 7], + grain=[1970, 1970, 1970, 1970, 1970], + c=[10, 11, 12, 13, 14] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}), + 'TimeSeriesImputer_1grain_2gap_backfill': pd.DataFrame(data=dict( + ts=[1, 2, 3, 5, 7], + grain=[1970, 1970, 1970, 1970, 1970], + c=[10, 11, 12, 13, 14] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}), + 'TimeSeriesImputer_1grain_2gap_medianfill': pd.DataFrame(data=dict( + ts=[1, 2, 3, 5, 7], + grain=[1970, 1970, 1970, 1970, 1970], + c=[10, 11, 12, 13, 14] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.double}), + 'TimeSeriesImputer_1grain_1gap_2filtercolumn': pd.DataFrame(data=dict( + ts=[1, 2, 3, 5], + grain=[1970, 1970, 1970, 1970], + c3=[10, 13, 15, 20], + c4=[19, 12, 16, 19] + )).astype({'ts': np.int64, 'grain': np.int32, 'c3': np.int32, 'c4': np.int32}), + 'TimeSeriesImputer_2grain_nogap': pd.DataFrame(data=dict( + ts=[1, 5, 2, 6], + grain=[1970, 1971, 1970, 1971], + c=[10, 11, 12, 13] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}), + 'ShortGrainDropper': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "two"] + )), + 'RollingWin_Pivot_Integration': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )), + 'Laglead_Pivot_Integration': pd.DataFrame(data=dict( + 
colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) +} + +def get_file_size(file_path): + file_size = 0 + try: + file_size = os.path.getsize(file_path) + except: + pass + return file_size + +def get_tmp_file(suffix=None): + fd, file_name = tempfile.mkstemp(suffix=suffix) + fl = os.fdopen(fd, 'w') + fl.close() + return file_name + +class CaptureOutputContext(): + """ + Context which can be used for + capturing stdout and stderr. + """ + def __enter__(self): + self.orig_stdout = sys.stdout + self.orig_stderr = sys.stderr + self.stdout_capturer = io.StringIO() + self.stderr_capturer = io.StringIO() + sys.stdout = self.stdout_capturer + sys.stderr = self.stderr_capturer + return self + + def __exit__(self, *args): + sys.stdout = self.orig_stdout + sys.stderr = self.orig_stderr + self.stdout = self.stdout_capturer.getvalue() + self.stderr = self.stderr_capturer.getvalue() + + if self.stdout: + print(self.stdout) + + if self.stderr: + print(self.stderr) + + # free up some memory + del self.stdout_capturer + del self.stderr_capturer + +def validate_results(result_mlnet, result_ort): + + if len(result_ort.columns) != len(result_mlnet.columns): + raise RuntimeError("ERROR: The ORT output does not contain the same number of columns as ML.NET.") + col_tuples = list(zip(result_mlnet.columns[0:], + result_ort.columns[0:])) + for col_tuple in col_tuples: + try: + col_mlnet = result_mlnet.loc[:, col_tuple[0]] + col_ort = result_ort.loc[:, col_tuple[1]] + check_kwargs = { + 'check_names': False, + 'check_exact': True, + 'check_dtype': True, + 'check_less_precise': True + } + pd.testing.assert_series_equal(col_mlnet, col_ort, **check_kwargs) + except Exception as e: + print(e) + raise RuntimeError("ERROR: OnnxRunner result does not match ML.NET result.") + return True + +def export_to_onnx(estimator, test_case): + """ + Fit and test an estimator and determine + if it supports exporting to the ONNX format. + """ + onnx_path = get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + + output = None + exported = False + export_valid = False + + try: + dataset = DATASETS.get(test_case) + + result_mlnet = estimator.fit_transform(dataset) + + with CaptureOutputContext() as output: + estimator.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + except Exception as e: + print(e) + + onnx_file_size = get_file_size(onnx_path) + onnx_json_file_size = get_file_size(onnx_json_path) + + if (output and + (onnx_file_size != 0) and + (onnx_json_file_size != 0) and + (not 'cannot save itself as ONNX' in output.stdout) and + (not 'Warning: We do not know how to save the predictor as ONNX' in output.stdout)): + + exported = True + + try: + df_tool = DFT(onnx_path) + result_ort = df_tool.execute(dataset, []) + + export_valid = validate_results(result_mlnet, result_ort) + except Exception as e: + print(e) + + os.remove(onnx_path) + os.remove(onnx_json_path) + return {'exported': exported, 'export_valid': export_valid} + +class TestOnnxExport(unittest.TestCase): + + # This method is a static method of the class + # because there were pytest fixture related + # issues when the method was in the global scope. 
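+    # test_case is taken as a parameter here, rather than closed over,
+    # because the setattr loop below rebinds the loop variable; binding it
+    # through the parameter gives each generated method its own value and
+    # avoids Python's late-binding closure pitfall.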
+ @staticmethod + def generate_test_method(test_case): + def method(self): + estimator = INSTANCES[test_case] + + result = export_to_onnx(estimator, test_case) + assert result['exported'] + assert result['export_valid'] + + return method + +for test_case in TEST_CASES: + test_name = 'test_%s' % test_case.replace('(', '_').replace(')', '').lower() + method = TestOnnxExport.generate_test_method(test_case) + setattr(TestOnnxExport, test_name, method) + +if __name__ == '__main__': + unittest.main() diff --git a/src/python/tests_extended/test_tensor_based.py b/src/python/tests_extended/test_tensor_based.py new file mode 100644 index 00000000..ea6e5edc --- /dev/null +++ b/src/python/tests_extended/test_tensor_based.py @@ -0,0 +1,846 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. +# -------------------------------------------------------------------------------------------- + +import os +import platform +import tempfile +import unittest + +import numpy as np +import pandas as pd +from nimbusml import Pipeline +from nimbusml.preprocessing.schema import ColumnSelector +from nimbusml.preprocessing import ToString, ToKeyImputer, DateTimeSplitter +from nimbusml.timeseries import TimeSeriesImputer, LagLeadOperator, RollingWindow, ForecastingPivot, ShortDrop +from nimbusml.preprocessing import (TensorFlowScorer, FromKey, ToKey, + DateTimeSplitter, OnnxRunner) +import onnxruntime as rt +from data_frame_tool import DataFrameTool as DFT + +def get_tmp_file(suffix=None): + fd, file_name = tempfile.mkstemp(suffix=suffix) + fl = os.fdopen(fd, 'w') + fl.close() + return file_name + +def set_up_onnx_model(estimator, training_data): + estimator.fit(training_data) + onnx_path = get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + estimator.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + return rt.InferenceSession(onnx_path) + +class TestAutoMLTransforms(unittest.TestCase): + def test_datetimesplitter(self): + training_data = pd.DataFrame(data=dict( + tokens1=[1, 2, 3, 157161600] + )) + + cols_to_drop = [ + 'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter', + 'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear', + 'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel', + 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff' + ] + + dts = DateTimeSplitter(prefix='dt') << 'tokens1' + xf = Pipeline([dts, ColumnSelector(drop_columns=cols_to_drop)]) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_data = np.array([1, 2, 3, 157161600]).astype(np.int64).reshape(4,1) + result = sess.run(None, {"tokens1":inferencing_data}) + + expected_years = np.array([1970, 1970, 1970, 1974]).reshape(4, 1) + expected_month = np.array([1, 1, 1, 12]).reshape(4, 1) + expected_day = np.array([1, 1, 1, 25]).reshape(4, 1) + expected_hour = np.array([0, 0, 0, 0]).reshape(4, 1) + expected_minute = np.array([0, 0, 0, 0]).reshape(4, 1) + expected_second = np.array([1, 2, 3, 0]).reshape(4, 1) + expected_ampm = np.array([0, 0, 0, 0]).reshape(4, 1) + expected_holidayname = np.array(["", "", "", ""]).reshape(4, 1) + + np.testing.assert_array_equal(result[1],expected_years) + np.testing.assert_array_equal(result[2],expected_month) + np.testing.assert_array_equal(result[3],expected_day) + np.testing.assert_array_equal(result[4],expected_hour) + np.testing.assert_array_equal(result[5],expected_minute) + 
np.testing.assert_array_equal(result[6],expected_second) + np.testing.assert_array_equal(result[7],expected_ampm) + np.testing.assert_array_equal(result[8],expected_holidayname) + + def test_datetimesplitter_complex(self): + training_data = pd.DataFrame(data=dict( + tokens1=[217081624, 1751241600, 217081625, 32445842582] + )) + + cols_to_drop = [ + 'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter', + 'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear', + 'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel', + 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff' + ] + + dts = DateTimeSplitter(prefix='dt') << 'tokens1' + xf = Pipeline([dts, ColumnSelector(drop_columns=cols_to_drop)]) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_data = np.array([217081624, 1751241600, 217081625, 32445842582]).astype(np.int64).reshape(4,1) + result = sess.run(None, {"tokens1": inferencing_data}) + + expected_years = np.array([1976, 2025, 1976, 2998]).reshape(4, 1) + expected_month = np.array([11, 6, 11, 3]).reshape(4, 1) + expected_day = np.array([17, 30, 17, 2]).reshape(4, 1) + expected_hour = np.array([12, 0, 12, 14]).reshape(4, 1) + expected_minute = np.array([27, 0, 27, 3]).reshape(4, 1) + expected_second = np.array([4, 0, 5, 2]).reshape(4, 1) + expected_ampm = np.array([1, 0, 1, 1]).reshape(4, 1) + expected_holidayname = np.array(["", "", "", ""]).reshape(4, 1) + + np.testing.assert_array_equal(result[1],expected_years) + np.testing.assert_array_equal(result[2],expected_month) + np.testing.assert_array_equal(result[3],expected_day) + np.testing.assert_array_equal(result[4],expected_hour) + np.testing.assert_array_equal(result[5],expected_minute) + np.testing.assert_array_equal(result[6],expected_second) + np.testing.assert_array_equal(result[7],expected_ampm) + np.testing.assert_array_equal(result[8],expected_holidayname) + + def test_tokey_simple_float(self): + + training_data = pd.DataFrame(data=dict( + target=[1.0, 1.0, 1.0, 2.0] + )).astype({'target': np.float64}) + + xf = ToKeyImputer() + + sess = set_up_onnx_model(xf, training_data) + + inferencing_data = np.array([1, float("NaN"), 4, 7, float("NaN")]).astype(np.float64).reshape(5,1) + result = sess.run(None, {"target": inferencing_data}) + + expectedData = np.array([1, 1, 4, 7, 1]).astype(np.float64).reshape(5, 1) + + np.testing.assert_array_equal(result[0],expectedData) + + def test_tokey_simple_double(self): + + training_data = pd.DataFrame(data=dict( + target=[1.0, 1.0, 1.0, 2.0] + )).astype({'target': np.double}) + + xf = ToKeyImputer() + + sess = set_up_onnx_model(xf, training_data) + + inferencing_data = np.array([1, float("NaN"), 4, 7, float("NaN")]).astype(np.double).reshape(5,1) + result = sess.run(None, {"target": inferencing_data}) + + expectedData = np.array([1, 1, 4, 7, 1]).astype(np.double).reshape(5, 1) + + np.testing.assert_array_equal(result[0],expectedData) + + def test_tokey_simple_string(self): + + training_data = pd.DataFrame(data=dict( + target=["one", "one", "one", "two"] + )) + + xf = ToKeyImputer() + + sess = set_up_onnx_model(xf, training_data) + + inferencing_data = np.array(["1", "", "Hello", "", "World"]).reshape(5,1) + result = sess.run(None, {"target": inferencing_data}) + + expectedData = np.array(["1", "one", "Hello", "one", "World"]).reshape(5, 1) + + np.testing.assert_array_equal(result[0],expectedData) + + def test_tokey_2col_double(self): + + training_data = pd.DataFrame(data=dict( + data1=[1.0, 1.0, 1.0, 2.0], + data2=[2.0, 2.0, 2.0, 3.0], + )).astype({'data1': np.double, + 'data1': np.double}) + 
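+        # ToKeyImputer fills missing entries with the most frequent value
+        # learned per column at fit time (1.0 for data1, 2.0 for data2),
+        # which is what the expected arrays below encode.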
+ xf = ToKeyImputer() + + sess = set_up_onnx_model(xf, training_data) + + inferencing_data1 = np.array([1.0, float("NaN"), 4.0, 7.0, float("NaN")]).astype(np.double).reshape(5,1) + inferencing_data2 = np.array([1.0, float("NaN"), 4.0, 7.0, float("NaN")]).astype(np.double).reshape(5,1) + result = sess.run(None, {"data1": inferencing_data1, "data2": inferencing_data2}) + + expectedData1 = np.array([1.0, 1.0, 4.0, 7.0, 1.0]).astype(np.double).reshape(5, 1) + expectedData2 = np.array([1.0, 2.0, 4.0, 7.0, 2.0]).astype(np.double).reshape(5, 1) + + np.testing.assert_array_equal(result[0],expectedData1) + np.testing.assert_array_equal(result[1],expectedData2) + + def test_tokey_2col_double_string(self): + + training_data = pd.DataFrame(data=dict( + data1=[1.0, 1.0, 1.0, 2.0], + data2=["two", "two", "three", "two"], + )) + + xf = ToKeyImputer() + + sess = set_up_onnx_model(xf, training_data) + + inferencing_data1 = np.array([1.0, float("NaN"), 4.0, 7.0, float("NaN")]).astype(np.double).reshape(5,1) + inferencing_data2 = np.array(["1", "", "Hello", "", "World"]).reshape(5,1) + result = sess.run(None, {"data1": inferencing_data1, "data2": inferencing_data2}) + + expectedData1 = np.array([1.0, 1.0, 4.0, 7.0, 1.0]).astype(np.double).reshape(5, 1) + expectedData2 = np.array(["1", "two", "Hello", "two", "World"]).reshape(5, 1) + + np.testing.assert_array_equal(result[0],expectedData1) + np.testing.assert_array_equal(result[1],expectedData2) + + def test_tostring_numbers_wo_dft(self): + training_data = pd.DataFrame(data=dict( + f0=[4, 4, -1, 9], + f1=[5, 5, 3.1, -0.23], + f2=[6, 6.7, np.nan, np.nan] + )).astype({'f0': np.int32, + 'f1': np.float32, + 'f2': np.float64}) + + xf = ToString(columns={'f0.out': 'f0', + 'f1.out': 'f1', + 'f2.out': 'f2'}) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_f0 = np.array([4, 4, -1, 9]).astype(np.int32).reshape(4,1) + inferencing_f1 = np.array([5, 5, 3.1, -0.23]).astype(np.float32).reshape(4,1) + inferencing_f2 = np.array([6, 6.7, float("NaN"), float("NaN")]).astype(np.float64).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"f0": inferencing_f0, "f1": inferencing_f1, "f2": inferencing_f2}) + + f0_output = np.array([['4'], ['4'], ['-1'], ['9']]).reshape(4, 1) + f1_output = np.array([['5.000000'], ['5.000000'], ['3.100000'], ['-0.230000']]).reshape(4, 1) + f2_output = np.array([['6.000000'], ['6.700000'], ['NaN'], ['NaN']]).reshape(4, 1) + + np.testing.assert_array_equal(f0_output, result[3]) + np.testing.assert_array_equal(f1_output, result[4]) + np.testing.assert_array_equal(f2_output, result[5]) + + def test_tostring_other_types_wo_dft(self): + training_data = pd.DataFrame(data=dict( + f0=[True, False], + f1=[123.45, 135453984983490.5473] + )).astype({'f0': bool, + 'f1': np.double}) + + xf = ToString(columns={'f0.out': 'f0', + 'f1.out': 'f1'}) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_f0 = np.array([True, False]).astype(bool).reshape(2,1) + inferencing_f1 = np.array([123.45, 135453984983490.5473]).astype(np.double).reshape(2,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"f0": inferencing_f0, "f1": inferencing_f1}) + + f0_output = np.array([['True'], ['False']]).reshape(2, 1) + #This value, 135453984983490.5473, is changing due to precision and not being able to represent the input exactly. 
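+        # (At this magnitude a float64 ulp is 2**-6 = 0.015625, so the
+        # nearest representable value to 135453984983490.5473 is
+        # 135453984983490.546875, which is the string ToString renders.)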
+        f1_output = np.array([['123.450000'], ['135453984983490.546875']]).reshape(2, 1)
+        np.testing.assert_array_equal(f0_output, result[2])
+        np.testing.assert_array_equal(f1_output, result[3])
+
+    def test_timeseriesimputer_onegrain_twogap(self):
+
+        training_data = pd.DataFrame(data=dict(
+            ts=[1, 2, 3, 5, 7],
+            grain=[1970, 1970, 1970, 1970, 1970],
+            c=[10, 11, 12, 13, 14]
+        )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32})
+
+        xf = TimeSeriesImputer(time_series_column='ts',
+                               filter_columns=['c'],
+                               grain_columns=['grain'],
+                               impute_mode='ForwardFill',
+                               filter_mode='Include')
+
+        sess = set_up_onnx_model(xf, training_data)
+
+        inferencing_ts = np.array([1, 2, 3, 5, 7]).astype(np.int64).reshape(5,1)
+        inferencing_grain = np.array([1970, 1970, 1970, 1970, 1970]).astype(np.int32).reshape(5,1)
+        inferencing_c = np.array([10, 11, 12, 13, 14]).astype(np.int32).reshape(5,1)
+
+        # Run your inference session with your model and your data
+        result = sess.run(None, {"ts": inferencing_ts, "grain": inferencing_grain, 'c': inferencing_c})
+
+        expected_ts = np.array([[1], [2], [3], [4], [5], [6], [7]]).astype(np.single).reshape(7, 1)
+        expected_c = np.array([[10], [11], [12], [12], [13], [13], [14]]).astype(np.single).reshape(7, 1)
+        expected_isrowimputed = np.array([[False], [False], [False], [True], [False], [True], [False]]).astype(np.single).reshape(7, 1)
+
+        np.testing.assert_array_equal(expected_ts, result[0])
+        np.testing.assert_array_equal(expected_c, result[2])
+        np.testing.assert_array_equal(expected_isrowimputed, result[3])
+
+    def test_timeseriesimputer_onegrain_twogap_backfill(self):
+
+        training_data = pd.DataFrame(data=dict(
+            ts=[1, 2, 3, 5, 7],
+            grain=[1970, 1970, 1970, 1970, 1970],
+            c=[10, 11, 12, 13, 14]
+        )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32})
+
+        xf = TimeSeriesImputer(time_series_column='ts',
+                               filter_columns=['c'],
+                               grain_columns=['grain'],
+                               impute_mode='BackFill',
+                               filter_mode='Include')
+
+        sess = set_up_onnx_model(xf, training_data)
+
+        inferencing_ts = np.array([1, 2, 3, 5, 7]).astype(np.int64).reshape(5,1)
+        inferencing_grain = np.array([1970, 1970, 1970, 1970, 1970]).astype(np.int32).reshape(5,1)
+        inferencing_c = np.array([10, 11, 12, 13, 14]).astype(np.int32).reshape(5,1)
+
+        # Run your inference session with your model and your data
+        result = sess.run(None, {"ts": inferencing_ts, "grain": inferencing_grain, 'c': inferencing_c})
+
+        expected_ts = np.array([[1], [2], [3], [4], [5], [6], [7]]).astype(np.single).reshape(7, 1)
+        expected_c = np.array([[10], [11], [12], [13], [13], [14], [14]]).astype(np.single).reshape(7, 1)
+        expected_isrowimputed = np.array([[False], [False], [False], [True], [False], [True], [False]]).astype(np.single).reshape(7, 1)
+
+        np.testing.assert_array_equal(expected_ts, result[0])
+        np.testing.assert_array_equal(expected_c, result[2])
+        np.testing.assert_array_equal(expected_isrowimputed, result[3])
+
+    def test_timeseriesimputer_onegrain_twogap_medianfill(self):
+
+        training_data = pd.DataFrame(data=dict(
+            ts=[1, 2, 3, 5, 7],
+            grain=[1970, 1970, 1970, 1970, 1970],
+            c=[10, 11, 12, 13, 14]
+        )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.double})
+
+        xf = TimeSeriesImputer(time_series_column='ts',
+                               filter_columns=['c'],
+                               grain_columns=['grain'],
+                               impute_mode='Median',
+                               filter_mode='Include')
+
+        sess = set_up_onnx_model(xf, training_data)
+
+        inferencing_ts = np.array([1, 2, 3, 5, 7]).astype(np.int64).reshape(5,1)
+        inferencing_grain = np.array([1970, 1970, 1970, 1970, 
1970]).astype(np.int32).reshape(5,1) + inferencing_c = np.array([10, 11, 12, 13, 14]).astype(np.double).reshape(5,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"ts": inferencing_ts, "grain": inferencing_grain, 'c': inferencing_c}) + + expected_ts = np.array([[1], [2], [3], [4], [5], [6], [7]]).astype(np.single).reshape(7, 1) + expected_c = np.array([[10], [11], [12], [12], [13], [12], [14]]).astype(np.single).reshape(7, 1) + expected_isrowimputed = np.array([[False], [False], [False], [True], [False], [True], [False]]).astype(np.single).reshape(7, 1) + + np.testing.assert_array_equal(expected_ts, result[0]) + np.testing.assert_array_equal(expected_c, result[2]) + np.testing.assert_array_equal(expected_isrowimputed, result[3]) + + def test_timeseriesimputer_twograin_nogap(self): + + training_data = pd.DataFrame(data=dict( + ts=[1, 5, 2, 6], + grain=[1970, 1971, 1970, 1971], + c=[10, 11, 12, 13] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}) + + xf = TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include') + + sess = set_up_onnx_model(xf, training_data) + + inferencing_ts = np.array([1, 5, 2, 6]).astype(np.int64).reshape(4,1) + inferencing_grain = np.array([1970, 1971, 1970, 1971]).astype(np.int32).reshape(4,1) + inferencing_c = np.array([10, 11, 12, 13]).astype(np.int32).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"ts": inferencing_ts, "grain": inferencing_grain, 'c': inferencing_c}) + + expected_ts = np.array([[1], [5], [2], [6]]).astype(np.single).reshape(4, 1) + expected_grain = np.array([[1970], [1971], [1970], [1971]]).astype(np.single).reshape(4, 1) + expected_c = np.array([[10], [11], [12], [13]]).astype(np.single).reshape(4, 1) + expected_isrowimputed = np.array([[False], [False], [False], [False]]).astype(np.single).reshape(4, 1) + + + np.testing.assert_array_equal(expected_ts, result[0]) + np.testing.assert_array_equal(expected_grain, result[1]) + np.testing.assert_array_equal(expected_c, result[2]) + np.testing.assert_array_equal(expected_isrowimputed, result[3]) + + def test_timeseriesimputer_twograin_twogap(self): + + training_data = pd.DataFrame(data=dict( + ts=[0, 5, 1, 6], + grain=[1970, 1971, 1970, 1971], + c=[10, 11, 12, 13] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}) + + + xf = TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include') + + sess = set_up_onnx_model(xf, training_data) + + inferencing_ts = np.array([0, 5, 3, 8]).astype(np.int64).reshape(4,1) + inferencing_grain = np.array([1970, 1971, 1970, 1971]).astype(np.int32).reshape(4,1) + inferencing_c = np.array([10, 11, 12, 13]).astype(np.int32).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"ts": inferencing_ts, "grain": inferencing_grain, 'c': inferencing_c}) + + expected_ts = np.array([[0], [5], [1], [2], [3], [6], [7], [8]]).astype(np.single).reshape(8, 1) + expected_grain = np.array([[1970], [1971], [1970], [1970], [1970], [1971], [1971], [1971]]).astype(np.single).reshape(8, 1) + expected_c = np.array([[10], [11], [10], [10], [12], [11], [11], [13]]).astype(np.single).reshape(8, 1) + expected_isrowimputed = np.array([[False], [False], [True], [True], [False], [True], [True], [False]]).astype(np.single).reshape(8, 1) + + 
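+        # Each grain is imputed independently: ts 1 and 2 are filled in for
+        # grain 1970 and ts 6 and 7 for grain 1971, each forward-filling the
+        # last c value seen within its own grain.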
np.testing.assert_array_equal(expected_ts, result[0]) + np.testing.assert_array_equal(expected_grain, result[1]) + np.testing.assert_array_equal(expected_c, result[2]) + np.testing.assert_array_equal(expected_isrowimputed, result[3]) + + def test_timeseriesimputer_onegrain_onegap_two_filtercolumn(self): + + training_data = pd.DataFrame(data=dict( + ts=[1, 2, 3, 5], + grain=[1970, 1970, 1970, 1970], + c3=[10, 13, 15, 20], + c4=[19, 12, 16, 19] + )).astype({'ts': np.int64, 'grain': np.int32, 'c3': np.int32, 'c4': np.int32}) + + xf = TimeSeriesImputer(time_series_column='ts', + grain_columns=['grain'], + filter_columns=['c3', 'c4'], + impute_mode='ForwardFill', + filter_mode='Include') + + sess = set_up_onnx_model(xf, training_data) + + inferencing_ts = np.array([1, 2, 3, 5]).astype(np.int64).reshape(4,1) + inferencing_grain = np.array([1970, 1970, 1970, 1970]).astype(np.int32).reshape(4,1) + inferencing_c3 = np.array([10, 13, 15, 20]).astype(np.int32).reshape(4,1) + inferencing_c4 = np.array([19, 12, 16, 19]).astype(np.int32).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"ts": inferencing_ts, "grain": inferencing_grain, "c3": inferencing_c3, "c4": inferencing_c4}) + + expected_ts = np.array([[1], [2], [3], [4], [5]]).astype(np.single).reshape(5, 1) + expected_c3 = np.array([[10], [13], [15], [15], [20]]).astype(np.single).reshape(5, 1) + expected_c4 = np.array([[19], [12], [16], [16], [19]]).astype(np.single).reshape(5, 1) + expected_isrowimputed = np.array([[False], [False], [False], [True], [False]]).astype(np.single).reshape(5, 1) + + np.testing.assert_array_equal(expected_ts, result[0]) + np.testing.assert_array_equal(expected_c3, result[2]) + np.testing.assert_array_equal(expected_c4, result[3]) + np.testing.assert_array_equal(expected_isrowimputed, result[4]) + + def test_rolling_window_simple_mean_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) + + xf = RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Mean', + max_window_size=2, + horizon=2) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "one"]).reshape(4,1) + inferencing_colA = np.array([1.0, 2.0, 3.0, 4.0]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA }) + + expected = np.array([[[float("NaN"), float("NaN")]], [[float("NaN"), 1.0]], [[1.0, 1.5]], [[1.5, 2.5]]]).astype(np.single).reshape(4, 1, 2) + + np.testing.assert_array_equal(expected, result[2]) + + def test_rolling_window_simple_max_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) + + xf = RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Max', + max_window_size=1, + horizon=1) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "one"]).reshape(4,1) + inferencing_colA = np.array([1.0, 2.0, 3.0, 4.0]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA}) + + expected = np.array([[[float("NaN")]], [[1.0]], [[2.0]], [[3.0]]]).astype(np.single).reshape(4, 1, 1) + + np.testing.assert_array_equal(expected, result[2]) + + def 
test_rolling_window_simple_min_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) + + xf = RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Min', + max_window_size=1, + horizon=1) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "one"]).reshape(4,1) + inferencing_colA = np.array([1.0, 2.0, 3.0, 4.0]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA }) + + expected = np.array([[[float("NaN")]], [[1.0]], [[2.0]], [[3.0]]]).astype(np.single).reshape(4, 1, 1) + + np.testing.assert_array_equal(expected, result[2]) + + def test_rolling_window_multiple_grains_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 1.0, 2.0], + grainA=["one", "one", "two", "two"] + )) + + xf = RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Mean', + max_window_size=1, + horizon=1) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "two", "two"]).reshape(4,1) + inferencing_colA = np.array([1.0, 2.0, 1.0, 2.0]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA}) + + expected = np.array([[[float("NaN")]], [[1.0]], [[float("NaN")]], [[1.0]]]).astype(np.single).reshape(4, 1, 1) + + np.testing.assert_array_equal(expected, result[2]) + + def test_rolling_window_non_string_grain_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=[True, True, True, True] + )) + + xf = RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Mean', + max_window_size=1, + horizon=1) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array([True, True, True, True]).reshape(4,1) + inferencing_colA = np.array([1.0, 2.0, 3.0, 4.0]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA}) + + expected = np.array([[[float("NaN")]], [[1.0]], [[2.0]], [[3.0]]]).astype(np.single).reshape(4, 1, 1) + + np.testing.assert_array_equal(expected, result[2]) + + + def test_laglead_lag_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) + + xf = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1], + horizon=2) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "one"]).reshape(4,1) + inferencing_colA = np.array([1, 2, 3, 4]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA}) + + expected = np.array([[[float("NaN"), float("NaN")], [float("NaN"), float("NaN")]], + [[float("NaN"), float("NaN")], [float("NaN"), 1.0]], + [[float("NaN"), 1.0], [1.0, 2.0]], + [[1.0, 2.0], [2.0, 3.0]]]).astype(np.single).reshape(4, 2, 2) + + np.testing.assert_array_equal(expected, result[2]) + + def test_laglead_lead_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) + + 
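+        # Positive offsets look forward: offset 1 is the next observation
+        # and offset 2 the one after it, so the trailing rows of the
+        # expected tensor below pad with NaN.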
xf = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[1, 2], + horizon=2) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "one"]).reshape(4,1) + inferencing_colA = np.array([1, 2, 3, 4]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA}) + + expected = np.array([[[1.0, 2.0], [2.0, 3.0]], + [[2.0, 3.0], [3.0, 4.0]], + [[3.0, 4.0], [4.0, float("NaN")]], + [[4.0, float("NaN")], [float("NaN"), float("NaN")]]]).astype(np.single).reshape(4, 2, 2) + + np.testing.assert_array_equal(expected, result[2]) + + def test_laglead_complex_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) + + xf = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1, 1, 2], + horizon=2) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "one"]).reshape(4,1) + inferencing_colA = np.array([1, 2, 3, 4]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA}) + + expected = np.array([[[float("NaN"), float("NaN")], [float("NaN"), float("NaN")], [1.0, 2.0], [2.0, 3.0]], + [[float("NaN"), float("NaN")], [float("NaN"), 1.0], [2.0, 3.0], [3.0, 4.0]], + [[float("NaN"), 1.0], [1.0, 2.0], [3.0, 4.0], [4.0, float("NaN")]], + [[1.0, 2.0], [2.0, 3.0], [4.0, float("NaN")], [float("NaN"), float("NaN")]]]).astype(np.single).reshape(4, 4, 2) + + np.testing.assert_array_equal(expected, result[2]) + + def test_short_drop_wo_dft(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "two"] + )) + + xf = ShortDrop(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + min_rows=2) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "two"]).reshape(4,1) + inferencing_colA = np.array([1, 2, 3, 4]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"grainA": inferencing_grainA, "colA": inferencing_colA}) + + colA_expected = np.array([[1.0], [2.0], [3.0]]).reshape(3, 1) + grainA_expected = np.array([["one"], ["one"], ["one"]]).reshape(3, 1) + np.testing.assert_array_equal(colA_expected, result[0]) + np.testing.assert_array_equal(grainA_expected, result[1]) + + def test_integration_rollwin_pivot(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 3.0, 5.0, 7.0], + grainA=['1970', '1970', '1970', '1970'] + )) + + xf0 = RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Mean', + max_window_size=2, + horizon=2) + + xf1 = ForecastingPivot(columns_to_pivot=['colA1']) + + xf = Pipeline([xf0, xf1]) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_colA = np.array([1.0, 3.0, 5.0, 7.0]).reshape(4,1) + inferencing_grainA = np.array(['1970', '1970', '1970', '1970']).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"colA": inferencing_colA, "grainA": inferencing_grainA}) + + expected_colA = np.array([[3.0], [5.0], [5.0], [7.0], [7.0]]) + expected_grainA = np.array([['1970'], ['1970'], ['1970'], ['1970'], ['1970']]) + expected_output = np.array([[1.0], [1.0], [2.0], [2.0], 
[4.0]]) + np.testing.assert_array_equal(expected_colA, result[0]) + np.testing.assert_array_equal(expected_grainA, result[1]) + np.testing.assert_array_equal(expected_output, result[3]) + + def test_integration_laglead_pivot(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )) + + xf0 = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1], + horizon=2) + + xf1 = ForecastingPivot(columns_to_pivot=['colA1']) + + xf = Pipeline([xf0, xf1]) + + sess = set_up_onnx_model(xf, training_data) + + inferencing_grainA = np.array(["one", "one", "one", "one"]).reshape(4,1) + inferencing_colA = np.array([1, 2, 3, 4]).astype(np.double).reshape(4,1) + + # Run your inference session with your model and your data + result = sess.run(None, {"colA": inferencing_colA, "grainA": inferencing_grainA}) + + expected_colA = np.array([[3.0], [4.0], [4.0]]) + expected_grainA = np.array([['one'], ['one'], ['one']]) + expected_output_lag2 = np.array([[1.0], [1.0], [2.0]]) + expected_output_lag1 = np.array([[2.0], [2.0], [3.0]]) + np.testing.assert_array_equal(expected_colA, result[0]) + np.testing.assert_array_equal(expected_grainA, result[1]) + np.testing.assert_array_equal(expected_output_lag2, result[3]) + np.testing.assert_array_equal(expected_output_lag1, result[4]) + + def test_pivot_one_matrix(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0], + grainA=["one"] + )) + + xf0 = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1, 1], + horizon=4) + binarydata = xf0.fit_transform(training_data, as_binary_data_stream=True) + + xf1 = ForecastingPivot(columns_to_pivot=['colA1']) + + sess = set_up_onnx_model(xf1, binarydata) + + inferencing_grainA = np.array(["one"]).reshape(1,1) + inferencing_colA = np.array([1]).astype(np.double).reshape(1,1) + inferencing_colA1 = np.array([1, 4, 6, float("NaN"), 2, 5, float("NaN"), float("NaN"), 3, float("NaN"), float("NaN"), 7]).astype(np.double).reshape(1,3,4) + + result = sess.run(None, {"grainA": inferencing_grainA,"colA": inferencing_colA, "colA1": inferencing_colA1}) + + expectedHorizon = np.array([4]).astype(np.uint32).reshape(1, 1) + expectedColA = np.array([1]).astype(np.double).reshape(1, 1) + expectedLag1 = np.array([1]).astype(np.double).reshape(1, 1) + expectedLead1 = np.array([2]).astype(np.double).reshape(1, 1) + expectedLag2 = np.array([3]).astype(np.double).reshape(1, 1) + + np.testing.assert_array_equal(result[0], expectedColA) + np.testing.assert_array_equal(result[2], expectedHorizon) + np.testing.assert_array_equal(result[3], expectedLag1) + np.testing.assert_array_equal(result[4], expectedLead1) + np.testing.assert_array_equal(result[5], expectedLag2) + + def test_pivot_two_matrix(self): + + training_data = pd.DataFrame(data=dict( + colA=[1.0, 2.0], + grainA=["one", "one"], + colB=[1.0, 3.0], + grainB=["one", "one"] + )) + + xf0 = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1, 1], + horizon=4) + + xf1 = LagLeadOperator(columns={'colB1': 'colB'}, + grain_columns=['grainB'], + offsets=[-2, -1], + horizon=4) + xf2 = Pipeline([xf0, xf1]) + binarydata = xf2.fit_transform(training_data, as_binary_data_stream=True) + + xf3 = ForecastingPivot(columns_to_pivot=['colA1', 'colB1']) + + sess = set_up_onnx_model(xf3, binarydata) + + inferencing_colA = np.array([1,2]).astype(np.double).reshape(2,1) + inferencing_colB = np.array([1,2]).astype(np.double).reshape(2,1) + 
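# The colA1 and colB1 tensors below are hand-built (rows x offsets x horizon) inputs; + # ForecastingPivot keeps only the horizon positions where every pivoted column is + # non-NaN, which is what the expectedHorizon values further down assert. +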
inferencing_grainA = np.array(["one", "one"]).reshape(2,1) + inferencing_grainB = np.array(["one", "one"]).reshape(2,1) + inferencing_colA1 = np.array([1, 6, 3, 9, 2, 4, 5, 8, float("NaN"), float("NaN"), 7, 10, + 1, 6, 9, 3, 2, 4, 8, 5, float("NaN"), float("NaN"), 10, 7]).astype(np.double).reshape(2,3,4) + inferencing_colB1 = np.array([1, float("NaN"), 5, 6, 2, float("NaN"), 3, 4, + 1, float("NaN"), 6, 5, 2, float("NaN"), 4, 3]).astype(np.double).reshape(2,2,4) + + result = sess.run(None, {"colA": inferencing_colA, "colB": inferencing_colB, "grainA": inferencing_grainA, + "grainB": inferencing_grainB, "colA1": inferencing_colA1, "colB1": inferencing_colB1}) + + expectedColA = np.array([1, 1, 2, 2]).astype(np.double).reshape(4, 1) + expectedColB = np.array([1, 1, 2, 2]).astype(np.double).reshape(4, 1) + expectedHorizon = np.array([2, 1, 2, 1]).astype(np.uint32).reshape(4, 1) + expectedLag1 = np.array([3, 9, 9, 3]).astype(np.double).reshape(4, 1) + expectedLead1 = np.array([5, 8, 8, 5]).astype(np.double).reshape(4, 1) + expectedLag2 = np.array([7, 10, 10, 7]).astype(np.double).reshape(4, 1) + expectedVec2Lag2 = np.array([5, 6, 6, 5]).astype(np.double).reshape(4, 1) + expectedVec2Lag5 = np.array([3, 4, 4, 3]).astype(np.double).reshape(4, 1) + + np.testing.assert_array_equal(result[0], expectedColA) + np.testing.assert_array_equal(result[2], expectedColB) + np.testing.assert_array_equal(result[4], expectedHorizon) + np.testing.assert_array_equal(result[5], expectedLag1) + np.testing.assert_array_equal(result[6], expectedLead1) + np.testing.assert_array_equal(result[7], expectedLag2) + np.testing.assert_array_equal(result[8], expectedVec2Lag2) + np.testing.assert_array_equal(result[9], expectedVec2Lag5) + +if __name__ == '__main__': + unittest.main() diff --git a/src/python/tests_extended/test_tensor_invalid_input.py b/src/python/tests_extended/test_tensor_invalid_input.py new file mode 100644 index 00000000..1db6258e --- /dev/null +++ b/src/python/tests_extended/test_tensor_invalid_input.py @@ -0,0 +1,403 @@ +# -------------------------------------------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# Licensed under the MIT License. 
+# -------------------------------------------------------------------------------------------- + +import os +import sys +import io +import platform +import tempfile +import unittest + +import numpy as np +import pandas as pd +from nimbusml import Pipeline +from nimbusml.preprocessing.schema import ColumnSelector +from nimbusml.preprocessing import ToString, ToKeyImputer, DateTimeSplitter +from scipy.sparse import csr_matrix +from nimbusml.timeseries import TimeSeriesImputer, LagLeadOperator, RollingWindow, ForecastingPivot, ShortDrop +from nimbusml.preprocessing import (TensorFlowScorer, FromKey, ToKey, + DateTimeSplitter, OnnxRunner) +import onnxruntime as rt +from data_frame_tool import DataFrameTool as DFT + +TEST_CASES_FOR_INVALID_INPUT = { + 'DateTimeSplitter_Bad_Input_Data', + 'DateTimeSplitter_Bad_Input_Type', + 'DateTimeSplitter_Bad_Input_Shape', + 'ToKey_Bad_Input_Type', + 'ToKey_Bad_Input_Shape', + 'ToString_Bad_Input_Type', + 'ToString_Bad_Input_Shape', + 'TimeSeriesImputer_Bad_Input_Data', + 'TimeSeriesImputer_Bad_Input_Type', + 'TimeSeriesImputer_Bad_Input_Shape', + 'RollingWindow_Bad_Input_Type', + 'RollingWindow_Bad_Input_Shape', + 'LagLead_Bad_Input_Type', + 'LagLead_Bad_Input_Shape', + 'ShortDrop_Bad_Input_Type', + 'ShortDrop_Bad_Input_Shape', + 'ShortDrop_Drop_All' +} + +INSTANCES_FOR_INVALID_INPUT = { + 'DateTimeSplitter_Bad_Input_Data': Pipeline([ + DateTimeSplitter(prefix='dt') << 'tokens1', + ColumnSelector(drop_columns=[ + 'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter', + 'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear', + 'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel', + 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff','dtHolidayName' + ]) + ]), + 'DateTimeSplitter_Bad_Input_Type': Pipeline([ + DateTimeSplitter(prefix='dt') << 'tokens1', + ColumnSelector(drop_columns=[ + 'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter', + 'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear', + 'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel', + 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff','dtHolidayName' + ]) + ]), + 'DateTimeSplitter_Bad_Input_Shape': Pipeline([ + DateTimeSplitter(prefix='dt') << 'tokens1', + ColumnSelector(drop_columns=[ + 'dtHour12', 'dtDayOfWeek', 'dtDayOfQuarter', + 'dtDayOfYear', 'dtWeekOfMonth', 'dtQuarterOfYear', + 'dtHalfOfYear', 'dtWeekIso', 'dtYearIso', 'dtMonthLabel', + 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff','dtHolidayName' + ]) + ]), + 'ToKey_Bad_Input_Type': ToKeyImputer(), + 'ToKey_Bad_Input_Shape': ToKeyImputer(), + 'ToString_Bad_Input_Type': ToString(columns={'f0.out': 'f0', + 'f1.out': 'f1', + 'f2.out': 'f2'}), + 'ToString_Bad_Input_Shape': ToString(columns={'f0.out': 'f0', + 'f1.out': 'f1', + 'f2.out': 'f2'}), + 'TimeSeriesImputer_Bad_Input_Data': TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include'), + 'TimeSeriesImputer_Bad_Input_Type': TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include'), + 'TimeSeriesImputer_Bad_Input_Shape': TimeSeriesImputer(time_series_column='ts', + filter_columns=['c'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include'), + 'RollingWindow_Bad_Input_Type': RollingWindow(columns={'colA1': 'colA'}, + grain_column=['grainA'], + window_calculation='Mean', + max_window_size=2, + horizon=2), + 'RollingWindow_Bad_Input_Shape': RollingWindow(columns={'colA1': 'colA'}, + 
grain_column=['grainA'], + window_calculation='Mean', + max_window_size=2, + horizon=2), + 'LagLead_Bad_Input_Type': LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-1], + horizon=1), + 'LagLead_Bad_Input_Shape': LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-1], + horizon=1), + 'ShortDrop_Bad_Input_Type': ShortDrop(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + min_rows=2), + 'ShortDrop_Bad_Input_Shape': ShortDrop(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + min_rows=2), + 'ShortDrop_Drop_All': ShortDrop(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + min_rows=15) +} + +TRAINING_DATASETS_FOR_INVALID_INPUT = { + 'DateTimeSplitter_Bad_Input_Data': pd.DataFrame(data=dict( + tokens1=[1, 2, 3, 157161600] + )), + 'DateTimeSplitter_Bad_Input_Type': pd.DataFrame(data=dict( + tokens1=[1, 2, 3, 157161600] + )), + 'DateTimeSplitter_Bad_Input_Shape': pd.DataFrame(data=dict( + tokens1=[1, 2, 3, 157161600] + )), + 'ToKey_Bad_Input_Type': pd.DataFrame(data=dict( + target=[1.0, 1.0, 1.0, 2.0] + )).astype({'target': np.float64}), + 'ToKey_Bad_Input_Shape': pd.DataFrame(data=dict( + target=[1.0, 1.0, 1.0, 2.0] + )).astype({'target': np.float64}), + 'ToString_Bad_Input_Type': pd.DataFrame(data=dict( + f0= [4, 4, -1, 9], + f1= [5, 5, 3.1, -0.23], + f2= [6, 6.7, np.nan, np.nan] + )), + 'ToString_Bad_Input_Shape': pd.DataFrame(data=dict( + f0= [4, 4, -1, 9], + f1= [5, 5, 3.1, -0.23], + f2= [6, 6.7, np.nan, np.nan] + )), + 'TimeSeriesImputer_Bad_Input_Data': pd.DataFrame(data=dict( + ts=[1, 2, 3, 5, 7], + grain=[1970, 1970, 1970, 1970, 1970], + c=[10, 11, 12, 13, 14] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}), + 'TimeSeriesImputer_Bad_Input_Type': pd.DataFrame(data=dict( + ts=[1, 2, 3, 5, 7], + grain=[1970, 1970, 1970, 1970, 1970], + c=[10, 11, 12, 13, 14] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}), + 'TimeSeriesImputer_Bad_Input_Shape': pd.DataFrame(data=dict( + ts=[1, 2, 3, 5, 7], + grain=[1970, 1970, 1970, 1970, 1970], + c=[10, 11, 12, 13, 14] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.int32}), + 'RollingWindow_Bad_Input_Type': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )), + 'RollingWindow_Bad_Input_Shape': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )), + 'LagLead_Bad_Input_Type':pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )), + 'LagLead_Bad_Input_Shape': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "one"] + )), + 'ShortDrop_Bad_Input_Type': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "two"] + )), + 'ShortDrop_Bad_Input_Shape': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "two"] + )), + 'ShortDrop_Drop_All': pd.DataFrame(data=dict( + colA=[1.0, 2.0, 3.0, 4.0], + grainA=["one", "one", "one", "two"] + )) +} + +INFERENCE_DATASETS_FOR_INVALID_INPUT = { + 'DateTimeSplitter_Bad_Input_Data': {"tokens1": np.array([1, 2, 3, -3]).reshape(4,1)}, + 'DateTimeSplitter_Bad_Input_Type': {"tokens1": np.array([1, 2, 3, "3"]).reshape(4,1)}, + 'DateTimeSplitter_Bad_Input_Shape': {"tokens1": np.array([[1, 2, 3, 3], [1, 2, 3, 4]]).reshape(4,2)}, + 'ToKey_Bad_Input_Type': {"target": np.array([1, float("NaN"), "", 7, float("NaN")]).reshape(5,1)}, + 'ToKey_Bad_Input_Shape': {"target": np.array([[1, float("NaN")], [1, 
float("NaN")]]).reshape(2,2)}, + 'ToString_Bad_Input_Type': {"f0": np.array([4, 4, -1, 9]).astype(np.int32).reshape(4,1), + "f1": np.array([5, 5, 3.1, -0.23]).astype(np.float32).reshape(4,1), + "f2": np.array([6, "6.7", float("NaN"), float("NaN")]).reshape(4,1)}, + 'ToString_Bad_Input_Shape': {"f0": np.array([[4, 4, -1, 9],[4, 4, -1, 9]]).astype(np.int32).reshape(4,2), + "f1": np.array([5, 5, 3.1, -0.23]).astype(np.float32).reshape(4,1), + "f2": np.array([6, 6.7, float("NaN"), float("NaN")]).reshape(4,1)}, + 'TimeSeriesImputer_Bad_Input_Data': {"ts": np.array([1, 2, 3, -5, 7]).astype(np.int64).reshape(5,1), + "grain": np.array([1970, 1970, 1970, 1970, 1970]).reshape(5,1), + "c": np.array([10, 11, 12, 13, 14]).astype(np.int32).reshape(5,1)}, + 'TimeSeriesImputer_Bad_Input_Type': {"ts": np.array([1, 2, 3, 5, 7]).astype(np.int64).reshape(5,1), + "grain": np.array([1970, "1970", 1970, 1970, 1970]).reshape(5,1), + "c": np.array([10, 11, 12, 13, 14]).astype(np.int32).reshape(5,1)}, + 'TimeSeriesImputer_Bad_Input_Shape': {"ts": np.array([[1, 2, 3, 5, 7], [1, 2, 3, 5, 7]]).astype(np.int64).reshape(5,2), + "grain": np.array([1970, 1970, 1970, 1970, 1970]).reshape(5,1), + "c": np.array([10, 11, 12, 13, 14]).astype(np.int32).reshape(5,1)}, + 'RollingWindow_Bad_Input_Type': {"grainA": np.array(["one", "one", "one", "one"]).reshape(4,1), + "colA": np.array([1.0, 2.0, 3.0, "4.0"]).reshape(4,1)}, + 'RollingWindow_Bad_Input_Shape': {"grainA": np.array(["one", "one", "one", "one"]).reshape(4,1), + "colA": np.array([[1.0, 2.0, 3.0, 4.0],[1.0, 2.0, 3.0, 4.0]]).reshape(4,2)}, + 'LagLead_Bad_Input_Type': {"grainA": np.array(["one", "one", "one", "one"]).reshape(4,1), + "colA": np.array([1, 2, 3, "4"]).reshape(4,1)}, + 'LagLead_Bad_Input_Shape': {"grainA": np.array(["one", "one", "one", "one"]).reshape(4,1), + "colA": np.array([[1.0, 2.0, 3.0, 4.0],[1.0, 2.0, 3.0, 4.0]]).reshape(4,2)}, + 'ShortDrop_Bad_Input_Type': {"grainA": np.array(["one", "one", "one", "two"]).reshape(4,1), + "colA": np.array([1, 2, 3, "4"]).reshape(4,1)}, + 'ShortDrop_Bad_Input_Shape': {"grainA": np.array(["one", "one", "one", "two"]).reshape(4,1), + "colA": np.array([[1.0, 2.0, 3.0, 4.0],[1.0, 2.0, 3.0, 4.0]]).reshape(4,2)}, + 'ShortDrop_Drop_All': {"grainA": np.array(["one", "one", "one", "two"]).reshape(4,1), + "colA": np.array([[1.0, 2.0, 3.0, 4.0],[1.0, 2.0, 3.0, 4.0]]).reshape(4,2)} +} + +def get_file_size(file_path): + file_size = 0 + try: + file_size = os.path.getsize(file_path) + except: + pass + return file_size + +def get_tmp_file(suffix=None): + fd, file_name = tempfile.mkstemp(suffix=suffix) + fl = os.fdopen(fd, 'w') + fl.close() + return file_name + +class CaptureOutputContext(): + """ + Context which can be used for + capturing stdout and stderr. 
+ """ + def __enter__(self): + self.orig_stdout = sys.stdout + self.orig_stderr = sys.stderr + self.stdout_capturer = io.StringIO() + self.stderr_capturer = io.StringIO() + sys.stdout = self.stdout_capturer + sys.stderr = self.stderr_capturer + return self + + def __exit__(self, *args): + sys.stdout = self.orig_stdout + sys.stderr = self.orig_stderr + self.stdout = self.stdout_capturer.getvalue() + self.stderr = self.stderr_capturer.getvalue() + + if self.stdout: + print(self.stdout) + + if self.stderr: + print(self.stderr) + + # free up some memory + del self.stdout_capturer + del self.stderr_capturer + +def validate_bad_input(self, estimator, test_case): + onnx_path = get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + + exported = False + throw_expected_error = False + try: + dataset = TRAINING_DATASETS_FOR_INVALID_INPUT.get(test_case) + + estimator.fit(dataset) + + with CaptureOutputContext() as output: + estimator.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + except Exception as e: + print(e) + + onnx_file_size = get_file_size(onnx_path) + onnx_json_file_size = get_file_size(onnx_json_path) + + if (output and + (onnx_file_size != 0) and + (onnx_json_file_size != 0) and + (not 'cannot save itself as ONNX' in output.stdout) and + (not 'Warning: We do not know how to save the predictor as ONNX' in output.stdout)): + + exported = True + + sess = rt.InferenceSession(onnx_path) + + with self.assertRaisesRegex(Exception, "ONNXRuntimeError"): + invalid_data = INFERENCE_DATASETS_FOR_INVALID_INPUT.get(test_case) + pred = sess.run(None, invalid_data) + + throw_expected_error = True + + os.remove(onnx_path) + os.remove(onnx_json_path) + return {'exported': exported, 'throw_expected_error': throw_expected_error} + +class TestOnnxExport(unittest.TestCase): + # This method is a static method of the class + # because there were pytest fixture related + # issues when the method was in the global scope. 
+ @staticmethod + def generate_test_method_for_bad(test_case): + def method(self): + estimator = INSTANCES_FOR_INVALID_INPUT[test_case] + + result = validate_bad_input(self, estimator, test_case) + assert result['exported'] + assert result['throw_expected_error'] + + return method + + def test_pivot_bad_input_type(self): + + df = pd.DataFrame(data=dict( + colA=[1.0], + grainA=["one"] + )) + + xf0 = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1, 1], + horizon=4) + binarydata = xf0.fit_transform(df, as_binary_data_stream=True) + + xf1 = ForecastingPivot(columns_to_pivot=['colA1']) + + xf1.fit(binarydata) + onnx_path = get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + xf1.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + sess = rt.InferenceSession(onnx_path) + + with self.assertRaisesRegex(Exception, "ONNXRuntimeError"): + grainA = np.array(["one"]).reshape(1,1) + colA = np.array([1]).astype(np.double).reshape(1,1) + colA1 = np.array([1, 4, "6", float("NaN"), 2, 5, float("NaN"), float("NaN"), 3, float("NaN"), float("NaN"), 7]).reshape(1,3,4) + pred = sess.run(None, {"grainA":grainA,"colA":colA, "colA1":colA1 }) + + def test_pivot_bad_shape(self): + + df = pd.DataFrame(data=dict( + colA=[1.0], + grainA=["one"] + )) + + xf0 = LagLeadOperator(columns={'colA1': 'colA'}, + grain_columns=['grainA'], + offsets=[-2, -1, 1], + horizon=4) + binarydata = xf0.fit_transform(df, as_binary_data_stream=True) + + xf1 = ForecastingPivot(columns_to_pivot=['colA1']) + + xf1.fit(binarydata) + onnx_path = get_tmp_file('.onnx') + onnx_json_path = get_tmp_file('.onnx.json') + xf1.export_to_onnx(onnx_path, + 'com.microsoft.ml', + dst_json=onnx_json_path, + onnx_version='Stable') + sess = rt.InferenceSession(onnx_path) + + with self.assertRaisesRegex(Exception, "ONNXRuntimeError"): + grainA = np.array(["one"]).reshape(1,1) + colA = np.array([1]).astype(np.double).reshape(1,1) + colA1 = np.array([1, 4, 6, float("NaN"), 2, 5, float("NaN"), float("NaN"), 3, float("NaN"), float("NaN"), 7]).reshape(1,2,6) + pred = sess.run(None, {"grainA":grainA,"colA":colA, "colA1":colA1 }) + + + +for test_case_invalid_input in TEST_CASES_FOR_INVALID_INPUT: + test_name = 'test_%s' % test_case_invalid_input.replace('(', '_').replace(')', '').lower() + + method = TestOnnxExport.generate_test_method_for_bad(test_case_invalid_input) + setattr(TestOnnxExport, test_name, method) + +if __name__ == '__main__': + unittest.main() From ac5ce115d190c78b92301385eeadf8f7810944b2 Mon Sep 17 00:00:00 2001 From: Jin Yan Date: Mon, 27 Apr 2020 16:23:25 -0700 Subject: [PATCH 15/34] Add tests for DateTimeSplitter with country (#486) * Add callstack field to BrdigeRuntime exception (#483) * Add exception stack to the error message * Add callstack field Co-authored-by: Gani Nazirov * Add callstack field to BrdigeRuntime exception (#483) * Add exception stack to the error message * Add callstack field Co-authored-by: Gani Nazirov * revert "Add callstack field to BrdigeRuntime exception (#483)" This reverts commit 569ea7bcf02de6bc23da2a255f16d75d53230c05. 
* add in DateTimeSplitter tests for country * add in big tests for more featurizers Co-authored-by: Gani Nazirov Co-authored-by: Gani Nazirov --- src/python/tests_extended/test_dft_based.py | 52 ++++++++++++++++++++- 1 file changed, 51 insertions(+), 1 deletion(-) diff --git a/src/python/tests_extended/test_dft_based.py b/src/python/tests_extended/test_dft_based.py index 96d0193c..b6436fb1 100644 --- a/src/python/tests_extended/test_dft_based.py +++ b/src/python/tests_extended/test_dft_based.py @@ -25,6 +25,8 @@ TEST_CASES = { 'DateTimeSplitter_Simple', 'DateTimeSplitter_Complex', + 'DateTimeSplitter_Canada_1day_before_christmas', + 'DateTimeSplitter_Czech_non_english_holiday', 'ToKey_SimpleFloat', 'ToKey_SimpleDouble', 'ToKey_SimpleString', @@ -41,6 +43,8 @@ 'ShortGrainDropper', 'RollingWin_Pivot_Integration', 'Laglead_Pivot_Integration', + 'Big_Test1', + 'Big_Test2' } INSTANCES = { @@ -62,6 +66,8 @@ 'dtAmPmLabel', 'dtDayOfWeekLabel', 'dtIsPaidTimeOff','dtHolidayName' ]) ]), + 'DateTimeSplitter_Canada_1day_before_christmas' : DateTimeSplitter(prefix='dt', country='Canada') << 'tokens1', + 'DateTimeSplitter_Czech_non_english_holiday' : DateTimeSplitter(prefix='dt', country='Czech') << 'tokens1', 'ToKey_SimpleFloat': ToKeyImputer(), 'ToKey_SimpleDouble': ToKeyImputer(), 'ToKey_SimpleString': ToKeyImputer(), @@ -122,6 +128,34 @@ horizon=2), ForecastingPivot(columns_to_pivot=['colA1']) ]), + 'Big_Test1': Pipeline([ + TimeSeriesImputer(time_series_column='ts', + filter_columns=['c', 'grain'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include'), + DateTimeSplitter(prefix='dt') << 'ts', + LagLeadOperator(columns={'c1': 'c'}, + grain_columns=['dtMonthLabel'], + offsets=[-2, -1], + horizon=1), + ForecastingPivot(columns_to_pivot=['c1']), + ColumnSelector(drop_columns=['dtHolidayName']) + ]), + 'Big_Test2': Pipeline([ + TimeSeriesImputer(time_series_column='ts', + filter_columns=['c', 'grain'], + grain_columns=['grain'], + impute_mode='ForwardFill', + filter_mode='Include'), + DateTimeSplitter(prefix='dt', country = 'Canada') << 'ts', + RollingWindow(columns={'c1': 'c'}, + grain_column=['grain'], + window_calculation='Mean', + max_window_size=2, + horizon=2), + ForecastingPivot(columns_to_pivot=['c1']) + ]) } DATASETS = { @@ -131,6 +165,12 @@ 'DateTimeSplitter_Complex': pd.DataFrame(data=dict( tokens1=[217081624, 1751241600, 217081625, 32445842582] )), + 'DateTimeSplitter_Canada_1day_before_christmas': pd.DataFrame(data=dict( + tokens1=[157161599] + )), + 'DateTimeSplitter_Czech_non_english_holiday': pd.DataFrame(data=dict( + tokens1=[3911760000, 3834432000, 3985200000] + )), 'ToKey_SimpleFloat': pd.DataFrame(data=dict( target=[1.0, 1.0, 1.0, 2.0] )).astype({'target': np.float64}), @@ -196,7 +236,17 @@ 'Laglead_Pivot_Integration': pd.DataFrame(data=dict( colA=[1.0, 2.0, 3.0, 4.0], grainA=["one", "one", "one", "one"] - )) + )), + 'Big_Test1': pd.DataFrame(data=dict( + ts=[217081624, 217081625, 217081627, 217081629], + grain=[1970, 1970, 1970, 1970], + c=[10, 11, 12, 13] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.double}), + 'Big_Test2': pd.DataFrame(data=dict( + ts=[0, 86400, 172800], + grain=[1970, 1970, 1970], + c=[10, 11, 12] + )).astype({'ts': np.int64, 'grain': np.int32, 'c': np.double}) } def get_file_size(file_path): From 0d5e594904175186e2cfc6f1d9f537dd90e91c74 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Mon, 27 Apr 2020 17:39:00 -0700 Subject: [PATCH 16/34] install ort-featurizers --- build.cmd | 2 +- build.sh | 2 +- 2 files changed, 2 
insertions(+), 2 deletions(-) diff --git a/build.cmd b/build.cmd index fe4d97a3..1cf885aa 100644 --- a/build.cmd +++ b/build.cmd @@ -399,7 +399,7 @@ if "%InstallPythonPackages%" == "True" ( call "%PythonExe%" -m pip install --upgrade pyzmq ) else ( call "%PythonExe%" -m pip install --upgrade "azureml-dataprep>=1.1.33" - call "%PythonExe%" -m pip install --upgrade -i https://test.pypi.org/simple/ ort-nightly-featurizer + call "%PythonExe%" -m pip install --upgrade --extra-index-url https://test.pypi.org/simple/ ort-nightly-featurizer ) call "%PythonExe%" -m pip install --upgrade "%__currentScriptDir%target\%WheelFile%" diff --git a/build.sh b/build.sh index 149be72e..203a333a 100755 --- a/build.sh +++ b/build.sh @@ -293,7 +293,7 @@ then fi "${PythonExe}" -m pip install --upgrade "azureml-dataprep>=1.1.33" - "${PythonExe}" -m pip install --upgrade onnxruntime + "${PythonExe}" -m pip install --upgrade --extra-index-url https://test.pypi.org/simple/ ort-nightly-featurizer fi "${PythonExe}" -m pip install --upgrade "${Wheel}" "${PythonExe}" -m pip install "scikit-learn==0.19.2" From 634597d4e610a200508bbe9f789fddc591a3f0c1 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 28 Apr 2020 11:00:26 -0700 Subject: [PATCH 17/34] fix feed --- nuget.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nuget.config b/nuget.config index 5bf65c94..63e7a3be 100644 --- a/nuget.config +++ b/nuget.config @@ -5,6 +5,6 @@ - + From f2236715eb41c499735323d6531a7ff28f68b60d Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 28 Apr 2020 12:33:59 -0700 Subject: [PATCH 18/34] update version for ort-featurizers --- src/DotNetBridge/DotNetBridge.csproj | 26 +++++++++++++------------- src/Platforms/build.csproj | 26 +++++++++++++------------- src/python/nimbusml.pyproj | 3 +++ 3 files changed, 29 insertions(+), 26 deletions(-) diff --git a/src/DotNetBridge/DotNetBridge.csproj b/src/DotNetBridge/DotNetBridge.csproj index 0bb24a04..f609ddd5 100644 --- a/src/DotNetBridge/DotNetBridge.csproj +++ b/src/DotNetBridge/DotNetBridge.csproj @@ -32,20 +32,20 @@ all runtime; build; native; contentfiles; analyzers - - - - - - - - + + + + + + + + - - - - - + + + + + diff --git a/src/Platforms/build.csproj b/src/Platforms/build.csproj index 3149c6f3..ac10b48d 100644 --- a/src/Platforms/build.csproj +++ b/src/Platforms/build.csproj @@ -21,20 +21,20 @@ - - - - - - - + + + + + + + - - - - - - + + + + + + diff --git a/src/python/nimbusml.pyproj b/src/python/nimbusml.pyproj index 61a2528a..3433a902 100644 --- a/src/python/nimbusml.pyproj +++ b/src/python/nimbusml.pyproj @@ -776,6 +776,9 @@ + + + From ca0eaa80cf1716dcb7a74fb2de0705b43d64c585 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 28 Apr 2020 13:21:48 -0700 Subject: [PATCH 19/34] fix tests --- .../nimbusml/tests/timeseries/test_rollingwindow.py | 8 ++++---- src/python/tests_extended/test_export_to_onnx.py | 8 ++++++++ 2 files changed, 12 insertions(+), 4 deletions(-) diff --git a/src/python/nimbusml/tests/timeseries/test_rollingwindow.py b/src/python/nimbusml/tests/timeseries/test_rollingwindow.py index b6ccdc8c..fc473a7f 100644 --- a/src/python/nimbusml/tests/timeseries/test_rollingwindow.py +++ b/src/python/nimbusml/tests/timeseries/test_rollingwindow.py @@ -32,10 +32,10 @@ def test_simple_rolling_window(self): horizon=2) result = rw.fit_transform(df) - self.assertTrue(math.isnan(result.loc[0, 'ts_r'])) - self.assertEqual(result.loc[1, 'ts_r'], 1) - self.assertEqual(result.loc[2, 'ts_r'], 3) - self.assertEqual(result.loc[3, 'ts_r'], 5) + 
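# The rolling-window output is now vector-valued, so the flattened output column + # picks up a positional suffix (one slot per horizon step), hence 'ts_r.1' below. +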
self.assertTrue(math.isnan(result.loc[0, 'ts_r.1'])) + self.assertEqual(result.loc[1, 'ts_r.1'], 1) + self.assertEqual(result.loc[2, 'ts_r.1'], 3) + self.assertEqual(result.loc[3, 'ts_r.1'], 5) def test_simple_rolling_window2(self): diff --git a/src/python/tests_extended/test_export_to_onnx.py b/src/python/tests_extended/test_export_to_onnx.py index 74454cb8..54967fe2 100644 --- a/src/python/tests_extended/test_export_to_onnx.py +++ b/src/python/tests_extended/test_export_to_onnx.py @@ -118,10 +118,12 @@ 'OnnxRunner', 'Sentiment', 'TensorFlowScorer', + 'TimeSeriesImputer', 'TreeFeaturizer', 'WordEmbedding', 'Binner', 'BootstrapSampler', + 'DateTimeSplitter', 'EnsembleClassifier', 'EnsembleRegressor', 'FactorizationMachineBinaryClassifier', @@ -138,12 +140,18 @@ 'RangeFilter', 'Resizer', 'RobustScaler', + 'RollingWindow', + 'ForecastingPivot', + 'LagLeadOperator', + 'ShortDrop', 'SkipFilter', 'SsaChangePointDetector', 'SsaForecaster', 'SsaSpikeDetector', 'SymSgdBinaryClassifier', 'TakeFilter', + 'ToKeyImputer', + 'ToString', 'EnsembleClassifier', 'EnsembleRegressor', 'CharTokenizer', From f234b7c5349409fe553f7204e4e3ae0f0694eee1 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 28 Apr 2020 14:02:06 -0700 Subject: [PATCH 20/34] skip ts checks --- src/python/tests/test_estimator_checks.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/src/python/tests/test_estimator_checks.py b/src/python/tests/test_estimator_checks.py index a9372ad3..91541a52 100644 --- a/src/python/tests/test_estimator_checks.py +++ b/src/python/tests/test_estimator_checks.py @@ -201,6 +201,12 @@ 'check_estimators_pickle') OMITTED_CHECKS_ALWAYS = 'check_estimators_nan_inf' +OMITTED_CHECKS_CLASS_ALWAYS = [ + 'RobustScaler', + 'LagLeadOperator', + 'ForecastingPivot', + 'RollingWindow', + 'ShortDrop'] NOBINARY_CHECKS = [ 'check_estimator_sparse_data', @@ -344,6 +350,8 @@ def method(self): hasattr(estimator, 'decision_function')): continue + if class_name in OMITTED_CHECKS_CLASS_ALWAYS: + continue if check.__name__ in OMITTED_CHECKS_ALWAYS: continue if 'Binary' in class_name and check.__name__ in NOBINARY_CHECKS: From 9a0bec93d9c7aa9468cd623a4bdb75e22ec0ebc2 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 28 Apr 2020 14:43:00 -0700 Subject: [PATCH 21/34] fix tests --- src/python/nimbusml/examples/ForecastingPivot.py | 2 +- src/python/nimbusml/examples/RollingWindow.py | 2 +- .../internal/core/timeseries/rollingwindow.py | 8 ++++---- .../internal/entrypoints/transforms_rollingwindow.py | 10 +++++----- .../tests/timeseries/test_forecastingpivot.py | 2 +- .../nimbusml/tests/timeseries/test_rollingwindow.py | 4 ++-- src/python/nimbusml/timeseries/rollingwindow.py | 6 +++--- src/python/tests/test_estimator_checks.py | 5 +++-- src/python/tests_extended/test_dft_based.py | 4 ++-- src/python/tests_extended/test_tensor_based.py | 12 ++++++------ .../tests_extended/test_tensor_invalid_input.py | 4 ++-- src/python/tests_extended/test_timeseries_automl.py | 4 ++-- src/python/tools/manifest.json | 2 +- 13 files changed, 33 insertions(+), 32 deletions(-) diff --git a/src/python/nimbusml/examples/ForecastingPivot.py b/src/python/nimbusml/examples/ForecastingPivot.py index 98d41871..b1592fbf 100644 --- a/src/python/nimbusml/examples/ForecastingPivot.py +++ b/src/python/nimbusml/examples/ForecastingPivot.py @@ -12,7 +12,7 @@ # transform usage xf = RollingWindow(columns={'age_1': 'age'}, - grain_column=['education'], + grain_columns=['education'], window_calculation='Mean', max_window_size=1, horizon=1) diff --git 
a/src/python/nimbusml/examples/RollingWindow.py b/src/python/nimbusml/examples/RollingWindow.py index 086f5a7a..8fe9100e 100644 --- a/src/python/nimbusml/examples/RollingWindow.py +++ b/src/python/nimbusml/examples/RollingWindow.py @@ -12,7 +12,7 @@ # transform usage xf = RollingWindow(columns={'age_1': 'age'}, - grain_column=['education'], + grain_columns=['education'], window_calculation='Mean', max_window_size=2, horizon=2) diff --git a/src/python/nimbusml/internal/core/timeseries/rollingwindow.py b/src/python/nimbusml/internal/core/timeseries/rollingwindow.py index 4a67f54d..3240bf6a 100644 --- a/src/python/nimbusml/internal/core/timeseries/rollingwindow.py +++ b/src/python/nimbusml/internal/core/timeseries/rollingwindow.py @@ -20,7 +20,7 @@ class RollingWindow(BasePipelineItem, DefaultSignature): **Description** Performs a calculation over a rolling timeseries window - :param grain_column: List of grain columns. + :param grain_columns: List of grain columns. :param horizon: Maximum horizon value. @@ -37,7 +37,7 @@ class RollingWindow(BasePipelineItem, DefaultSignature): @trace def __init__( self, - grain_column, + grain_columns, horizon=0, max_window_size=0, min_window_size=1, @@ -46,7 +46,7 @@ def __init__( BasePipelineItem.__init__( self, type='transform', **params) - self.grain_column = grain_column + self.grain_columns = grain_columns self.horizon = horizon self.max_window_size = max_window_size self.min_window_size = min_window_size @@ -98,7 +98,7 @@ def _get_node(self, **all_args): o in zip( input_columns, output_columns)] if input_columns else None, - grain_column=self.grain_column, + grain_columns=self.grain_columns, horizon=self.horizon, max_window_size=self.max_window_size, min_window_size=self.min_window_size, diff --git a/src/python/nimbusml/internal/entrypoints/transforms_rollingwindow.py b/src/python/nimbusml/internal/entrypoints/transforms_rollingwindow.py index 0bd8823c..fb1eec3a 100644 --- a/src/python/nimbusml/internal/entrypoints/transforms_rollingwindow.py +++ b/src/python/nimbusml/internal/entrypoints/transforms_rollingwindow.py @@ -10,7 +10,7 @@ def transforms_rollingwindow( - grain_column, + grain_columns, column, data, output_data=None, @@ -24,7 +24,7 @@ def transforms_rollingwindow( **Description** Performs a calculation over a rolling timeseries window - :param grain_column: List of grain columns (inputs). + :param grain_columns: List of grain columns (inputs). :param column: New column definition (optional form: name:src) (inputs). :param data: Input dataset (inputs). 
@@ -41,9 +41,9 @@ def transforms_rollingwindow( inputs = {} outputs = {} - if grain_column is not None: - inputs['GrainColumn'] = try_set( - obj=grain_column, + if grain_columns is not None: + inputs['GrainColumns'] = try_set( + obj=grain_columns, none_acceptable=False, is_of_type=list, is_column=True) diff --git a/src/python/nimbusml/tests/timeseries/test_forecastingpivot.py b/src/python/nimbusml/tests/timeseries/test_forecastingpivot.py index 8077754d..cde9f3ce 100644 --- a/src/python/nimbusml/tests/timeseries/test_forecastingpivot.py +++ b/src/python/nimbusml/tests/timeseries/test_forecastingpivot.py @@ -24,7 +24,7 @@ def test_simple_pivot(self): )) rw = RollingWindow(columns={'ts_r': 'ts'}, - grain_column=['grain'], + grain_columns=['grain'], window_calculation='Mean', max_window_size=1, horizon=1) diff --git a/src/python/nimbusml/tests/timeseries/test_rollingwindow.py b/src/python/nimbusml/tests/timeseries/test_rollingwindow.py index fc473a7f..c64962f1 100644 --- a/src/python/nimbusml/tests/timeseries/test_rollingwindow.py +++ b/src/python/nimbusml/tests/timeseries/test_rollingwindow.py @@ -26,7 +26,7 @@ def test_simple_rolling_window(self): )) rw = RollingWindow(columns={'ts_r': 'ts'}, - grain_column=['grain'], + grain_columns=['grain'], window_calculation='Mean', max_window_size=1, horizon=2) @@ -45,7 +45,7 @@ def test_simple_rolling_window2(self): )) rw = RollingWindow(columns={'ts_r': 'ts'}, - grain_column=['grain'], + grain_columns=['grain'], window_calculation='Mean', max_window_size=2, horizon=2) diff --git a/src/python/nimbusml/timeseries/rollingwindow.py b/src/python/nimbusml/timeseries/rollingwindow.py index 703e4324..d1f228f6 100644 --- a/src/python/nimbusml/timeseries/rollingwindow.py +++ b/src/python/nimbusml/timeseries/rollingwindow.py @@ -24,7 +24,7 @@ class RollingWindow(core, BaseTransform, TransformerMixin): :param columns: see `Columns `_. - :param grain_column: List of grain columns. + :param grain_columns: List of grain columns. :param horizon: Maximum horizon value. @@ -41,7 +41,7 @@ class RollingWindow(core, BaseTransform, TransformerMixin): @trace def __init__( self, - grain_column, + grain_columns, horizon=0, max_window_size=0, min_window_size=1, @@ -54,7 +54,7 @@ def __init__( BaseTransform.__init__(self, **params) core.__init__( self, - grain_column=grain_column, + grain_columns=grain_columns, horizon=horizon, max_window_size=max_window_size, min_window_size=min_window_size, diff --git a/src/python/tests/test_estimator_checks.py b/src/python/tests/test_estimator_checks.py index 91541a52..3c7f25b6 100644 --- a/src/python/tests/test_estimator_checks.py +++ b/src/python/tests/test_estimator_checks.py @@ -330,6 +330,9 @@ def method(self): passed_checks = set() class_name = epoint[1] print("\n======== now Estimator is %s =========== " % class_name) + + if class_name in OMITTED_CHECKS_CLASS_ALWAYS: + continue mod = __import__('nimbusml.' 
+ epoint[0], fromlist=[str(class_name)]) the_class = getattr(mod, class_name) @@ -350,8 +353,6 @@ def method(self): hasattr(estimator, 'decision_function')): continue - if class_name in OMITTED_CHECKS_CLASS_ALWAYS: - continue if check.__name__ in OMITTED_CHECKS_ALWAYS: continue if 'Binary' in class_name and check.__name__ in NOBINARY_CHECKS: diff --git a/src/python/tests_extended/test_dft_based.py b/src/python/tests_extended/test_dft_based.py index b6436fb1..f0fb0763 100644 --- a/src/python/tests_extended/test_dft_based.py +++ b/src/python/tests_extended/test_dft_based.py @@ -111,7 +111,7 @@ # forecasting pivot will spread this 2d vector out and drop rows that have NaNs in it 'RollingWin_Pivot_Integration': Pipeline([ RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Mean', max_window_size=2, horizon=2), @@ -150,7 +150,7 @@ filter_mode='Include'), DateTimeSplitter(prefix='dt', country = 'Canada') << 'ts', RollingWindow(columns={'c1': 'c'}, - grain_column=['grain'], + grain_columns=['grain'], window_calculation='Mean', max_window_size=2, horizon=2), diff --git a/src/python/tests_extended/test_tensor_based.py b/src/python/tests_extended/test_tensor_based.py index ea6e5edc..b7dfe98c 100644 --- a/src/python/tests_extended/test_tensor_based.py +++ b/src/python/tests_extended/test_tensor_based.py @@ -464,7 +464,7 @@ def test_rolling_window_simple_mean_wo_dft(self): )) xf = RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Mean', max_window_size=2, horizon=2) @@ -489,7 +489,7 @@ def test_rolling_window_simple_max_wo_dft(self): )) xf = RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Max', max_window_size=1, horizon=1) @@ -514,7 +514,7 @@ def test_rolling_window_simple_min_wo_dft(self): )) xf = RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Min', max_window_size=1, horizon=1) @@ -539,7 +539,7 @@ def test_rolling_window_multiple_grains_wo_dft(self): )) xf = RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Mean', max_window_size=1, horizon=1) @@ -564,7 +564,7 @@ def test_rolling_window_non_string_grain_wo_dft(self): )) xf = RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Mean', max_window_size=1, horizon=1) @@ -695,7 +695,7 @@ def test_integration_rollwin_pivot(self): )) xf0 = RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Mean', max_window_size=2, horizon=2) diff --git a/src/python/tests_extended/test_tensor_invalid_input.py b/src/python/tests_extended/test_tensor_invalid_input.py index 1db6258e..6126f7ce 100644 --- a/src/python/tests_extended/test_tensor_invalid_input.py +++ b/src/python/tests_extended/test_tensor_invalid_input.py @@ -94,12 +94,12 @@ impute_mode='ForwardFill', filter_mode='Include'), 'RollingWindow_Bad_Input_Type': RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Mean', max_window_size=2, horizon=2), 'RollingWindow_Bad_Input_Shape': RollingWindow(columns={'colA1': 'colA'}, - grain_column=['grainA'], + grain_columns=['grainA'], window_calculation='Mean', max_window_size=2, horizon=2), diff --git a/src/python/tests_extended/test_timeseries_automl.py 
b/src/python/tests_extended/test_timeseries_automl.py index 1e85f418..f6d32035 100644 --- a/src/python/tests_extended/test_timeseries_automl.py +++ b/src/python/tests_extended/test_timeseries_automl.py @@ -139,7 +139,7 @@ def test_rolling_window(self): )) xf = RollingWindow(columns={'ts_r': 'ts'}, - grain_column=['grain'], + grain_columns=['grain'], window_calculation='Mean', max_window_size=1, horizon=2) @@ -160,7 +160,7 @@ def test_pivot(self): )) xf0 = RollingWindow(columns={'ts_r': 'ts'}, - grain_column=['grain'], + grain_columns=['grain'], window_calculation='Mean', max_window_size=1, horizon=1) diff --git a/src/python/tools/manifest.json b/src/python/tools/manifest.json index 5be33996..48947d1a 100644 --- a/src/python/tools/manifest.json +++ b/src/python/tools/manifest.json @@ -23023,7 +23023,7 @@ "ShortName": "RollingWindow", "Inputs": [ { - "Name": "GrainColumn", + "Name": "GrainColumns", "Type": { "Kind": "Array", "ItemType": "String" From 82f831bfd0d85fe2982b1f7a78f9f2df78e96d3d Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 28 Apr 2020 15:53:48 -0700 Subject: [PATCH 22/34] fix test --- src/python/tests/test_estimator_checks.py | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/src/python/tests/test_estimator_checks.py b/src/python/tests/test_estimator_checks.py index 3c7f25b6..3b0070af 100644 --- a/src/python/tests/test_estimator_checks.py +++ b/src/python/tests/test_estimator_checks.py @@ -329,11 +329,10 @@ def method(self): failed_checks = set() passed_checks = set() class_name = epoint[1] - print("\n======== now Estimator is %s =========== " % class_name) - if class_name in OMITTED_CHECKS_CLASS_ALWAYS: - continue + return + print("\n======== now Estimator is %s =========== " % class_name) mod = __import__('nimbusml.' 
+ epoint[0], fromlist=[str(class_name)]) the_class = getattr(mod, class_name) if class_name in INSTANCES: From 2b7accb203566caf64d5b2ac2dc481cef2155b1e Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Tue, 28 Apr 2020 16:56:25 -0700 Subject: [PATCH 23/34] ML Featurizers version --- src/DotNetBridge/DotNetBridge.csproj | 2 +- src/Platforms/build.csproj | 2 +- src/python/tests_extended/test_timeseries_automl.py | 1 + 3 files changed, 3 insertions(+), 2 deletions(-) diff --git a/src/DotNetBridge/DotNetBridge.csproj b/src/DotNetBridge/DotNetBridge.csproj index f609ddd5..21121c02 100644 --- a/src/DotNetBridge/DotNetBridge.csproj +++ b/src/DotNetBridge/DotNetBridge.csproj @@ -46,7 +46,7 @@ - + diff --git a/src/Platforms/build.csproj b/src/Platforms/build.csproj index ac10b48d..d4c3dcb1 100644 --- a/src/Platforms/build.csproj +++ b/src/Platforms/build.csproj @@ -35,7 +35,7 @@ - + diff --git a/src/python/tests_extended/test_timeseries_automl.py b/src/python/tests_extended/test_timeseries_automl.py index f6d32035..a6f6d73c 100644 --- a/src/python/tests_extended/test_timeseries_automl.py +++ b/src/python/tests_extended/test_timeseries_automl.py @@ -12,6 +12,7 @@ import pandas as pd from nimbusml import Pipeline from nimbusml.preprocessing import ToString, ToKeyImputer, DateTimeSplitter +from nimbusml.preprocessing.schema import ColumnSelector from nimbusml.timeseries import TimeSeriesImputer, LagLeadOperator, RollingWindow, ForecastingPivot, ShortDrop from data_frame_tool import DataFrameTool as DFT From 7a7bef73a02a6dc08f05bb7e8ac8722922ad1d95 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 10:18:47 -0700 Subject: [PATCH 24/34] exclude test for Mac --- src/python/tests_extended/test_tensor_invalid_input.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/python/tests_extended/test_tensor_invalid_input.py b/src/python/tests_extended/test_tensor_invalid_input.py index 6126f7ce..07135d30 100644 --- a/src/python/tests_extended/test_tensor_invalid_input.py +++ b/src/python/tests_extended/test_tensor_invalid_input.py @@ -396,6 +396,11 @@ def test_pivot_bad_shape(self): for test_case_invalid_input in TEST_CASES_FOR_INVALID_INPUT: test_name = 'test_%s' % test_case_invalid_input.replace('(', '_').replace(')', '').lower() + # The following test for negative timepoints. On Linux and Windows it throws as expected. + # On Mac negative timepoints are a valid input. + if test_name in 'test_datetimesplitter_bad_input_data' and platform.system() == "Darwin": + continue + method = TestOnnxExport.generate_test_method_for_bad(test_case_invalid_input) setattr(TestOnnxExport, test_name, method) From 1315d4dd7a08cdaa209c5d60a958adf62263e2e1 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 12:12:31 -0700 Subject: [PATCH 25/34] do mv to save space --- build.sh | 24 ++++++++++++------------ 1 file changed, 12 insertions(+), 12 deletions(-) diff --git a/build.sh b/build.sh index 203a333a..4a730061 100755 --- a/build.sh +++ b/build.sh @@ -203,27 +203,27 @@ then touch "${__currentScriptDir}/src/python/nimbusml/internal/libs/__init__.py" echo "Placing binaries in libs dir for wheel packaging ... 
" - cp "${BuildOutputDir}/${__configuration}"/DotNetBridge.dll "${__currentScriptDir}/src/python/nimbusml/internal/libs/" - cp "${BuildOutputDir}/${__configuration}"/pybridge.so "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}"/DotNetBridge.dll "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}"/pybridge.so "${__currentScriptDir}/src/python/nimbusml/internal/libs/" # ls -l "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/ if [ ${PythonVersion} = 2.7 ] then - cp "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/*.dll "${__currentScriptDir}/src/python/nimbusml/internal/libs/" - cp "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/System.Native.a "${__currentScriptDir}/src/python/nimbusml/internal/libs/" - cp "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/createdump "${__currentScriptDir}/src/python/nimbusml/internal/libs/" || : - cp "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/sosdocsunix.txt "${__currentScriptDir}/src/python/nimbusml/internal/libs/" - cp -r "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/Data "${__currentScriptDir}/src/python/nimbusml/internal/libs/." + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/*.dll "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/System.Native.a "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/createdump "${__currentScriptDir}/src/python/nimbusml/internal/libs/" || : + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/sosdocsunix.txt "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/Data "${__currentScriptDir}/src/python/nimbusml/internal/libs/." ext=*.so if [ "$(uname -s)" = "Darwin" ] then ext=*.dylib fi - cp "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/${ext} "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/${ext} "${__currentScriptDir}/src/python/nimbusml/internal/libs/" # Obtain "libtensorflow_framework.so.1", which is the upgraded version of "libtensorflow.so". This is required for tests TensorFlowScorer.py to pass in Linux distros with Python 2.7 if [ ! 
"$(uname -s)" = "Darwin" ] then - cp "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/libtensorflow_framework.so.1 "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/libtensorflow_framework.so.1 "${__currentScriptDir}/src/python/nimbusml/internal/libs/" fi # remove dataprep dlls as its not supported in python 2.7 rm -f "${__currentScriptDir}/src/python/nimbusml/internal/libs/Microsoft.DPrep.*" @@ -240,14 +240,14 @@ then libs_txt=libs_mac.txt fi cat build/${libs_txt} | while read i; do - cp "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/$i "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/$i "${__currentScriptDir}/src/python/nimbusml/internal/libs/" done - cp -r "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/Data "${__currentScriptDir}/src/python/nimbusml/internal/libs/." + mv "${BuildOutputDir}/${__configuration}/Platform/${PublishDir}"/publish/Data "${__currentScriptDir}/src/python/nimbusml/internal/libs/." fi if [[ $__configuration = Dbg* ]] then - cp "${BuildOutputDir}/${__configuration}"/DotNetBridge.pdb "${__currentScriptDir}/src/python/nimbusml/internal/libs/" + mv "${BuildOutputDir}/${__configuration}"/DotNetBridge.pdb "${__currentScriptDir}/src/python/nimbusml/internal/libs/" fi "${PythonExe}" -m pip install --upgrade "wheel>=0.31.0" From 99b0e71c4582b592ee2fa5be7a085fea7adb8e46 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 20:44:51 -0700 Subject: [PATCH 26/34] Make more space for build --- build.sh | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/build.sh b/build.sh index 4a730061..c63e1c2d 100755 --- a/build.sh +++ b/build.sh @@ -250,6 +250,10 @@ then mv "${BuildOutputDir}/${__configuration}"/DotNetBridge.pdb "${__currentScriptDir}/src/python/nimbusml/internal/libs/" fi + # Clean out space for building wheel + rm -rf "${BuildOutputDir}" + rm -rf "${BoostRoot}" + "${PythonExe}" -m pip install --upgrade "wheel>=0.31.0" cd "${__currentScriptDir}/src/python" From 787898216b62e5de03de1989acaed4c6b0cd342c Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 20:58:35 -0700 Subject: [PATCH 27/34] more space --- build.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/build.sh b/build.sh index c63e1c2d..816d6385 100755 --- a/build.sh +++ b/build.sh @@ -253,6 +253,7 @@ then # Clean out space for building wheel rm -rf "${BuildOutputDir}" rm -rf "${BoostRoot}" + rm -rf "${__currentScriptDir}/cli" "${PythonExe}" -m pip install --upgrade "wheel>=0.31.0" cd "${__currentScriptDir}/src/python" From b3797e260cbef2be4f0c954b4fcd1b3d69547292 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 21:04:23 -0700 Subject: [PATCH 28/34] more space --- build.sh | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/build.sh b/build.sh index 816d6385..dd923bb8 100755 --- a/build.sh +++ b/build.sh @@ -280,6 +280,12 @@ then echo "#################################" echo "Installing Python packages ... " echo "#################################" + + # Make more space, remove not needed folders + rm -rf "${build}" + rm -rf "${dist}" + rm -rf "${libs}" + Wheel=${__currentScriptDir}/target/nimbusml-${ProductVersion}-${PythonTag}-none-${PlatName}.whl if [ ! 
-f ${Wheel} ] then From f2e81d38d7c29e2fc90d8c04bf650a41c70518f5 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 21:28:28 -0700 Subject: [PATCH 29/34] more space --- build.sh | 23 ++++++++++++----------- 1 file changed, 12 insertions(+), 11 deletions(-) diff --git a/build.sh b/build.sh index dd923bb8..ae16036e 100755 --- a/build.sh +++ b/build.sh @@ -154,19 +154,20 @@ then fi PythonExe="${PythonRoot}/bin/python" echo "Python executable: ${PythonExe}" -# Download & unzip Boost -if [ ! -e "${BoostRoot}/.done" ] -then - mkdir -p "${BoostRoot}" - echo "Downloading and extracting Boost archive ... " - curl "${BoostUrl}" | tar xz -C "${BoostRoot}" - touch "${BoostRoot}/.done" -fi if [ ${__buildNativeBridge} = true ] then echo "Building Native Bridge ... " + # Download & unzip Boost + if [ ! -e "${BoostRoot}/.done" ] + then + mkdir -p "${BoostRoot}" + echo "Downloading and extracting Boost archive ... " + curl "${BoostUrl}" | tar xz -C "${BoostRoot}" + touch "${BoostRoot}/.done" + fi bash "${__currentScriptDir}/src/NativeBridge/build.sh" --configuration $__configuration --pythonver "${PythonVersion}" --pythonpath "${PythonRoot}" --boostpath "${BoostRoot}" + rm -rf "${BoostRoot}" fi if [ ${__buildDotNetBridge} = true ] @@ -251,9 +252,8 @@ then fi # Clean out space for building wheel - rm -rf "${BuildOutputDir}" - rm -rf "${BoostRoot}" - rm -rf "${__currentScriptDir}/cli" + rm -rf "${BuildOutputDir}" + rm -rf "${__currentScriptDir}/cli" "${PythonExe}" -m pip install --upgrade "wheel>=0.31.0" cd "${__currentScriptDir}/src/python" @@ -282,6 +282,7 @@ then echo "#################################" # Make more space, remove not needed folders + echo "Deleting ${build} ${dist} ${libs} ... " rm -rf "${build}" rm -rf "${dist}" rm -rf "${libs}" From 9252d1e1d3757e29c945a7dd84ffb1b05adaa7bf Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 22:02:32 -0700 Subject: [PATCH 30/34] more space --- build.sh | 61 ++++++++++++++++++++++++++------------------------------ 1 file changed, 28 insertions(+), 33 deletions(-) diff --git a/build.sh b/build.sh index ae16036e..90f177c4 100755 --- a/build.sh +++ b/build.sh @@ -7,6 +7,14 @@ ProductVersion=$(=0.31.0" cd "${__currentScriptDir}/src/python" @@ -272,6 +269,10 @@ then mkdir -p "${__currentScriptDir}/target" mv "${__currentScriptDir}/src/python/dist/${WheelFile}" "${__currentScriptDir}/target/" echo Python package successfully created: ${__currentScriptDir}/target/${WheelFile} + echo "Deleting ${build} ${dist} ${libs} ... " + rm -rf "${build}" + rm -rf "${dist}" + rm -rf "${libs}" fi if [ ${__installPythonPackages} = true ] @@ -281,12 +282,6 @@ then echo "Installing Python packages ... " echo "#################################" - # Make more space, remove not needed folders - echo "Deleting ${build} ${dist} ${libs} ... " - rm -rf "${build}" - rm -rf "${dist}" - rm -rf "${libs}" - Wheel=${__currentScriptDir}/target/nimbusml-${ProductVersion}-${PythonTag}-none-${PlatName}.whl if [ ! -f ${Wheel} ] then From b0882773492769af90bd7eb156c1e35817027477 Mon Sep 17 00:00:00 2001 From: Gani Nazirov Date: Wed, 29 Apr 2020 22:06:56 -0700 Subject: [PATCH 31/34] fix build --- build.sh | 28 ++++++++++++++-------------- 1 file changed, 14 insertions(+), 14 deletions(-) diff --git a/build.sh b/build.sh index 90f177c4..2293a252 100755 --- a/build.sh +++ b/build.sh @@ -137,6 +137,20 @@ case $__configuration in echo "Unknown configuration '$__configuration'"; usage; exit 1 esac +echo "Downloading Python Dependencies " +# Download & unzip Python +if [ ! 
From b0882773492769af90bd7eb156c1e35817027477 Mon Sep 17 00:00:00 2001
From: Gani Nazirov
Date: Wed, 29 Apr 2020 22:06:56 -0700
Subject: [PATCH 31/34] fix build

---
 build.sh | 28 ++++++++++++--------------
 1 file changed, 14 insertions(+), 14 deletions(-)

diff --git a/build.sh b/build.sh
index 90f177c4..2293a252 100755
--- a/build.sh
+++ b/build.sh
@@ -137,6 +137,20 @@ case $__configuration in
         echo "Unknown configuration '$__configuration'"; usage; exit 1
 esac

+echo "Downloading Python Dependencies "
+# Download & unzip Python
+if [ ! -e "${PythonRoot}/.done" ]
+then
+    mkdir -p "${PythonRoot}"
+    echo "Downloading and extracting Python archive ... "
+    curl "${PythonUrl}" | tar xz -C "${PythonRoot}"
+    # Move all binaries out of "anaconda3", "anaconda2", or "anaconda", depending on naming convention for version
+    mv "${PythonRoot}/anaconda"*/* "${PythonRoot}/"
+    touch "${PythonRoot}/.done"
+fi
+PythonExe="${PythonRoot}/bin/python"
+echo "Python executable: ${PythonExe}"
+
 if [ ${__buildNativeBridge} = true ]
 then
     echo "Building Native Bridge ... "
@@ -238,20 +252,6 @@ then
     rm -rf "${BuildOutputDir}"
     rm -rf "${__currentScriptDir}/cli"

-    echo "Downloading Python Dependencies "
-    # Download & unzip Python
-    if [ ! -e "${PythonRoot}/.done" ]
-    then
-        mkdir -p "${PythonRoot}"
-        echo "Downloading and extracting Python archive ... "
-        curl "${PythonUrl}" | tar xz -C "${PythonRoot}"
-        # Move all binaries out of "anaconda3", "anaconda2", or "anaconda", depending on naming convention for version
-        mv "${PythonRoot}/anaconda"*/* "${PythonRoot}/"
-        touch "${PythonRoot}/.done"
-    fi
-    PythonExe="${PythonRoot}/bin/python"
-    echo "Python executable: ${PythonExe}"
-
 "${PythonExe}" -m pip install --upgrade "wheel>=0.31.0"

 cd "${__currentScriptDir}/src/python"

From 2fc6a1f3237cfc8903f4a1a1fcc37dd8c9440336 Mon Sep 17 00:00:00 2001
From: Gani Nazirov
Date: Wed, 29 Apr 2020 23:17:41 -0700
Subject: [PATCH 32/34] more space

---
 build.sh | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/build.sh b/build.sh
index 2293a252..97764b5a 100755
--- a/build.sh
+++ b/build.sh
@@ -163,7 +163,9 @@ then
         touch "${BoostRoot}/.done"
     fi
     bash "${__currentScriptDir}/src/NativeBridge/build.sh" --configuration $__configuration --pythonver "${PythonVersion}" --pythonpath "${PythonRoot}" --boostpath "${BoostRoot}"
+    echo "Deleting ${BoostRoot} ${__currentScriptDir}/src/NativeBridge/x64"
     rm -rf "${BoostRoot}"
+    rm -rf "${__currentScriptDir}/src/NativeBridge/x64"
 fi
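PATCH 32 echoes what it is about to delete before removing the Boost sources and the NativeBridge x64 output. To confirm such deletions reclaim meaningful space, one could measure the tree first; a small sketch, assuming the relative path named in the patch:

    import os

    def tree_bytes(root):
        # walk the tree and sum regular-file sizes, skipping symlinks
        total = 0
        for dirpath, _, filenames in os.walk(root):
            for name in filenames:
                path = os.path.join(dirpath, name)
                if not os.path.islink(path):
                    total += os.path.getsize(path)
        return total

    print("%.1f MB" % (tree_bytes("src/NativeBridge/x64") / 2**20))
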
From bea3ec30bee23a20c21fa3e686eba6aaf16da90c Mon Sep 17 00:00:00 2001
From: Jin Yan
Date: Fri, 1 May 2020 09:56:46 -0700
Subject: [PATCH 33/34] check in (#487)

---
 src/python/tests_extended/test_dft_based.py |  7 +++++++
 .../tests_extended/test_tensor_based.py     | 20 +++++++++----------
 .../test_tensor_invalid_input.py            |  6 +++---
 3 files changed, 20 insertions(+), 13 deletions(-)

diff --git a/src/python/tests_extended/test_dft_based.py b/src/python/tests_extended/test_dft_based.py
index f0fb0763..5cc5d59d 100644
--- a/src/python/tests_extended/test_dft_based.py
+++ b/src/python/tests_extended/test_dft_based.py
@@ -381,6 +381,13 @@ def method(self):

 for test_case in TEST_CASES:
     test_name = 'test_%s' % test_case.replace('(', '_').replace(')', '').lower()
+
+    # The following test is for a far-future time point. On Windows it's treated correctly as expected,
+    # but on other OSes system_clock::time_point is defined as nanoseconds (64-bit),
+    # which rolls over somewhere around 2260.
+    if test_name == 'test_datetimesplitter_complex' and (platform.system() == "Darwin" or platform.system() == "Linux"):
+        continue
+
     method = TestOnnxExport.generate_test_method(test_case)
     setattr(TestOnnxExport, test_name, method)

diff --git a/src/python/tests_extended/test_tensor_based.py b/src/python/tests_extended/test_tensor_based.py
index b7dfe98c..437bb3be 100644
--- a/src/python/tests_extended/test_tensor_based.py
+++ b/src/python/tests_extended/test_tensor_based.py
@@ -76,7 +76,7 @@ def test_datetimesplitter(self):

     def test_datetimesplitter_complex(self):
         training_data = pd.DataFrame(data=dict(
-            tokens1=[217081624, 1751241600, 217081625, 32445842582]
+            tokens1=[217081624, 1751241600, 217081625]
         ))

         cols_to_drop = [
@@ -91,17 +91,17 @@ def test_datetimesplitter_complex(self):

         sess = set_up_onnx_model(xf, training_data)

-        inferencing_data = np.array([217081624, 1751241600, 217081625, 32445842582]).astype(np.int64).reshape(4,1)
+        inferencing_data = np.array([217081624, 1751241600, 217081625]).astype(np.int64).reshape(4,1)
         result = sess.run(None, {"tokens1": inferencing_data})

-        expected_years = np.array([1976, 2025, 1976, 2998]).reshape(4, 1)
-        expected_month = np.array([11, 6, 11, 3]).reshape(4, 1)
-        expected_day = np.array([17, 30, 17, 2]).reshape(4, 1)
-        expected_hour = np.array([12, 0, 12, 14]).reshape(4, 1)
-        expected_minute = np.array([27, 0, 27, 3]).reshape(4, 1)
-        expected_second = np.array([4, 0, 5, 2]).reshape(4, 1)
-        expected_ampm = np.array([1, 0, 1, 1]).reshape(4, 1)
-        expected_holidayname = np.array(["", "", "", ""]).reshape(4, 1)
+        expected_years = np.array([1976, 2025, 1976]).reshape(4, 1)
+        expected_month = np.array([11, 6, 11]).reshape(4, 1)
+        expected_day = np.array([17, 30, 17]).reshape(4, 1)
+        expected_hour = np.array([12, 0, 12]).reshape(4, 1)
+        expected_minute = np.array([27, 0, 27]).reshape(4, 1)
+        expected_second = np.array([4, 0, 5]).reshape(4, 1)
+        expected_ampm = np.array([1, 0, 1]).reshape(4, 1)
+        expected_holidayname = np.array(["", "", ""]).reshape(4, 1)

         np.testing.assert_array_equal(result[1],expected_years)
         np.testing.assert_array_equal(result[2],expected_month)

diff --git a/src/python/tests_extended/test_tensor_invalid_input.py b/src/python/tests_extended/test_tensor_invalid_input.py
index 07135d30..d015b107 100644
--- a/src/python/tests_extended/test_tensor_invalid_input.py
+++ b/src/python/tests_extended/test_tensor_invalid_input.py
@@ -396,9 +396,9 @@ def test_pivot_bad_shape(self):
 for test_case_invalid_input in TEST_CASES_FOR_INVALID_INPUT:
     test_name = 'test_%s' % test_case_invalid_input.replace('(', '_').replace(')', '').lower()

-    # The following test for negative timepoints. On Linux and Windows it throws as expected.
-    # On Mac negative timepoints are a valid input.
-    if test_name in 'test_datetimesplitter_bad_input_data' and platform.system() == "Darwin":
+    # The following test is for negative timepoints. On Windows it throws as expected.
+    # On Mac and Linux negative timepoints are a valid input.
+    if test_name == 'test_datetimesplitter_bad_input_data' and (platform.system() == "Darwin" or platform.system() == "Linux"):
         continue

     method = TestOnnxExport.generate_test_method_for_bad(test_case_invalid_input)
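The rollover mentioned in the new test_dft_based.py comment is easy to check: a signed 64-bit nanosecond counter anchored at the Unix epoch overflows after 2**63 ns, a little before the year 2262, and the timestamp PATCH 33 drops (32445842582 seconds, the year-2998 row) lies far past that limit. A quick arithmetic check:

    # 2**63 nanoseconds expressed as years past 1970
    SECONDS_PER_YEAR = 365.2425 * 24 * 3600

    print(1970 + 2**63 / 1e9 / SECONDS_PER_YEAR)   # ~2262.3, the rollover year
    print(1970 + 32445842582 / SECONDS_PER_YEAR)   # ~2998.2, the dropped test value
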
From ba376b9bb84ca4bdac4a0c0364c827716a01dbcd Mon Sep 17 00:00:00 2001
From: Jin Yan
Date: Fri, 1 May 2020 13:02:15 -0700
Subject: [PATCH 34/34] Fix shape (#488)

* check in

* fix shape

* fix shape
---
 src/python/tests_extended/test_tensor_based.py | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/src/python/tests_extended/test_tensor_based.py b/src/python/tests_extended/test_tensor_based.py
index 437bb3be..3300a7e8 100644
--- a/src/python/tests_extended/test_tensor_based.py
+++ b/src/python/tests_extended/test_tensor_based.py
@@ -91,17 +91,17 @@ def test_datetimesplitter_complex(self):

         sess = set_up_onnx_model(xf, training_data)

-        inferencing_data = np.array([217081624, 1751241600, 217081625]).astype(np.int64).reshape(4,1)
+        inferencing_data = np.array([217081624, 1751241600, 217081625]).astype(np.int64).reshape(3,1)
         result = sess.run(None, {"tokens1": inferencing_data})

-        expected_years = np.array([1976, 2025, 1976]).reshape(4, 1)
-        expected_month = np.array([11, 6, 11]).reshape(4, 1)
-        expected_day = np.array([17, 30, 17]).reshape(4, 1)
-        expected_hour = np.array([12, 0, 12]).reshape(4, 1)
-        expected_minute = np.array([27, 0, 27]).reshape(4, 1)
-        expected_second = np.array([4, 0, 5]).reshape(4, 1)
-        expected_ampm = np.array([1, 0, 1]).reshape(4, 1)
-        expected_holidayname = np.array(["", "", ""]).reshape(4, 1)
+        expected_years = np.array([1976, 2025, 1976]).reshape(3, 1)
+        expected_month = np.array([11, 6, 11]).reshape(3, 1)
+        expected_day = np.array([17, 30, 17]).reshape(3, 1)
+        expected_hour = np.array([12, 0, 12]).reshape(3, 1)
+        expected_minute = np.array([27, 0, 27]).reshape(3, 1)
+        expected_second = np.array([4, 0, 5]).reshape(3, 1)
+        expected_ampm = np.array([1, 0, 1]).reshape(3, 1)
+        expected_holidayname = np.array(["", "", ""]).reshape(3, 1)

         np.testing.assert_array_equal(result[1],expected_years)
         np.testing.assert_array_equal(result[2],expected_month)
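PATCH 34 exists because PATCH 33 trimmed the test data from four values to three but left the reshape calls at (4, 1), which NumPy rejects at runtime. A short demonstration of the failure and the fix:

    import numpy as np

    data = np.array([217081624, 1751241600, 217081625]).astype(np.int64)
    try:
        data.reshape(4, 1)            # the stale shape left over from PATCH 33
    except ValueError as err:
        print(err)                    # cannot reshape array of size 3 into shape (4,1)
    print(data.reshape(3, 1).shape)   # (3, 1), the corrected shape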