krishna412
diff --git a/‎how-to-use-azureml/automated-machine-learning/automl_env.yml‎
Lines changed: 1 addition & 0 deletions b/‎how-to-use-azureml/automated-machine-learning/automl_env.yml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎how-to-use-azureml/automated-machine-learning/forecasting-backtest-many-models/auto-ml-forecasting-backtest-many-models.ipynb‎
Lines changed: 10 additions & 3 deletions b/‎how-to-use-azureml/automated-machine-learning/forecasting-backtest-many-models/auto-ml-forecasting-backtest-many-models.ipynb‎
Lines changed: 10 additions & 3 deletions
diff --git a/‎how-to-use-azureml/automated-machine-learning/forecasting-backtest-single-model/auto-ml-forecasting-backtest-single-model.ipynb‎
Lines changed: 10 additions & 3 deletions b/‎how-to-use-azureml/automated-machine-learning/forecasting-backtest-single-model/auto-ml-forecasting-backtest-single-model.ipynb‎
Lines changed: 10 additions & 3 deletions
diff --git a/‎how-to-use-azureml/automated-machine-learning/forecasting-bike-share/auto-ml-forecasting-bike-share.ipynb‎
Lines changed: 12 additions & 5 deletions b/‎how-to-use-azureml/automated-machine-learning/forecasting-bike-share/auto-ml-forecasting-bike-share.ipynb‎
Lines changed: 12 additions & 5 deletions
diff --git a/‎how-to-use-azureml/automated-machine-learning/forecasting-energy-demand/auto-ml-forecasting-energy-demand.ipynb‎
Lines changed: 13 additions & 5 deletions b/‎how-to-use-azureml/automated-machine-learning/forecasting-energy-demand/auto-ml-forecasting-energy-demand.ipynb‎
Lines changed: 13 additions & 5 deletions
diff --git a/‎how-to-use-azureml/automated-machine-learning/forecasting-forecast-function/auto-ml-forecasting-function.ipynb‎
Lines changed: 10 additions & 4 deletions b/‎how-to-use-azureml/automated-machine-learning/forecasting-forecast-function/auto-ml-forecasting-function.ipynb‎
Lines changed: 10 additions & 4 deletions
diff --git a/‎how-to-use-azureml/automated-machine-learning/forecasting-hierarchical-timeseries/auto-ml-forecasting-hierarchical-timeseries.ipynb‎
Lines changed: 4 additions & 2 deletions b/‎how-to-use-azureml/automated-machine-learning/forecasting-hierarchical-timeseries/auto-ml-forecasting-hierarchical-timeseries.ipynb‎
Lines changed: 4 additions & 2 deletions
@@ -18,6 +18,7 @@ dependencies:
 - pywin32==227
 - PySocks==1.7.1
 - conda-forge::pyqt==5.12.3
+- jsonschema==4.15.0
 - jinja2<=2.11.2
 - markupsafe<2.1.0
 - tqdm==4.64.0
 
@@ -324,7 +324,8 @@
         "| **experiment_timeout_hours**       | Maximum amount of time in hours that the experiment can take before it terminates. This is optional but provides customers with greater control on exit criteria. |\n",
         "| **label_column_name**              | The name of the label column. |\n",
         "| **forecast_horizon**               | The forecast horizon is how many periods forward you would like to forecast. This integer horizon is in units of the timeseries frequency (e.g. daily, weekly). Periods are inferred from your data. |\n",
-        "| **n_cross_validations**            | Number of cross validation splits. Rolling Origin Validation is used to split time-series in a temporally consistent way. |\n",
+        "| **n_cross_validations**            | Number of cross validation splits. The default value is \"auto\", in which case AutoML determines the number of cross-validations automatically if a validation set is not provided. Alternatively, users can specify an integer value. Rolling Origin Validation is used to split time-series in a temporally consistent way. |\n",
+        "| **cv_step_size**                   | Number of periods between two consecutive cross-validation folds. The default value is \"auto\", in which case AutoML determines the cross-validation step size automatically if a validation set is not provided. Alternatively, users can specify an integer value. |\n",
         "| **time_column_name**               | The name of your time column. |\n",
         "| **time_series_id_column_names**     | The column names used to uniquely identify timeseries in data that has multiple rows with the same timestamp. |\n",
         "| **track_child_runs**               | Flag to disable tracking of child runs. Only best run is tracked if the flag is set to False (this includes the model and metrics of the run). |\n",
@@ -353,7 +354,8 @@
         "    \"iterations\": 15,\n",
         "    \"experiment_timeout_hours\": 0.25,  # This also needs to be changed based on the dataset. For larger data set this number needs to be bigger.\n",
         "    \"label_column_name\": TARGET_COLNAME,\n",
-        "    \"n_cross_validations\": 3,\n",
+        "    \"n_cross_validations\": \"auto\",  # Feel free to set to a small integer (>=2) if runtime is an issue.\n",
+        "    \"cv_step_size\": \"auto\",\n",
         "    \"time_column_name\": TIME_COLNAME,\n",
         "    \"forecast_horizon\": 6,\n",
         "    \"time_series_id_column_names\": partition_column_names,\n",
@@ -718,7 +720,12 @@
       "name": "python",
       "nbconvert_exporter": "python",
       "pygments_lexer": "ipython3",
-      "version": "3.6.9"
+      "version": "3.8.5"
+    },
+    "vscode": {
+      "interpreter": {
+        "hash": "6bd77c88278e012ef31757c15997a7bea8c943977c43d6909403c00ae11d43ca"
+      }
     }
   },
   "nbformat": 4,
 
@@ -283,7 +283,8 @@
         "| **experiment_timeout_hours**       | Maximum amount of time in hours that the experiment can take before it terminates. This is optional but provides customers with greater control on exit criteria. |\n",
         "| **label_column_name**              | The name of the label column. |\n",
         "| **max_horizon**               | The forecast horizon is how many periods forward you would like to forecast. This integer horizon is in units of the timeseries frequency (e.g. daily, weekly). Periods are inferred from your data. |\n",
-        "| **n_cross_validations**            | Number of cross validation splits. Rolling Origin Validation is used to split time-series in a temporally consistent way. |\n",
+        "| **n_cross_validations**            | Number of cross validation splits. The default value is \"auto\", in which case AutoML determines the number of cross-validations automatically if a validation set is not provided. Alternatively, users can specify an integer value. Rolling Origin Validation is used to split time-series in a temporally consistent way. |\n",
+        "| **cv_step_size**                   | Number of periods between two consecutive cross-validation folds. The default value is \"auto\", in which case AutoML determines the cross-validation step size automatically if a validation set is not provided. Alternatively, users can specify an integer value. |\n",
         "| **time_column_name**               | The name of your time column. |\n",
         "| **grain_column_names**     | The column names used to uniquely identify timeseries in data that has multiple rows with the same timestamp. |"
       ]
@@ -301,7 +302,8 @@
         "    \"iterations\": 15,\n",
         "    \"experiment_timeout_hours\": 1,  # This also needs to be changed based on the dataset. For larger data set this number needs to be bigger.\n",
         "    \"label_column_name\": LABEL_COLUMN_NAME,\n",
-        "    \"n_cross_validations\": 3,\n",
+        "    \"n_cross_validations\": \"auto\",  # Feel free to set to a small integer (>=2) if runtime is an issue.\n",
+        "    \"cv_step_size\": \"auto\",\n",
         "    \"time_column_name\": TIME_COLUMN_NAME,\n",
         "    \"max_horizon\": FORECAST_HORIZON,\n",
         "    \"track_child_runs\": False,\n",
@@ -712,7 +714,12 @@
       "name": "python",
       "nbconvert_exporter": "python",
       "pygments_lexer": "ipython3",
-      "version": "3.6.9"
+      "version": "3.8.5"
+    },
+    "vscode": {
+      "interpreter": {
+        "hash": "6bd77c88278e012ef31757c15997a7bea8c943977c43d6909403c00ae11d43ca"
+      }
     }
   },
   "nbformat": 4,
 
@@ -265,7 +265,8 @@
         "|**forecast_horizon**|The forecast horizon is how many periods forward you would like to forecast. This integer horizon is in units of the timeseries frequency (e.g. daily, weekly).|\n",
         "|**country_or_region_for_holidays**|The country/region used to generate holiday features. These should be ISO 3166 two-letter country/region codes (i.e. 'US', 'GB').|\n",
         "|**target_lags**|The target_lags specifies how far back we will construct the lags of the target variable.|\n",
-        "|**freq**|Forecast frequency. This optional parameter represents the period with which the forecast is desired, for example, daily, weekly, yearly, etc. Use this parameter for the correction of time series containing irregular data points or for padding of short time series. The frequency needs to be a pandas offset alias. Please refer to [pandas documentation](https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#dateoffset-objects) for more information."
+        "|**freq**|Forecast frequency. This optional parameter represents the period with which the forecast is desired, for example, daily, weekly, yearly, etc. Use this parameter for the correction of time series containing irregular data points or for padding of short time series. The frequency needs to be a pandas offset alias. Please refer to [pandas documentation](https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#dateoffset-objects) for more information.\n",
+        "|**cv_step_size**|Number of periods between two consecutive cross-validation folds. The default value is \"auto\", in which case AutoML determines the cross-validation step size automatically if a validation set is not provided. Alternatively, users can specify an integer value.|"
       ]
     },
     {
@@ -285,7 +286,7 @@
         "|**training_data**|Input dataset, containing both features and label column.|\n",
         "|**label_column_name**|The name of the label column.|\n",
         "|**compute_target**|The remote compute for training.|\n",
-        "|**n_cross_validations**|Number of cross validation splits.|\n",
+        "|**n_cross_validations**|Number of cross-validation folds to use for model/pipeline selection. The default value is \"auto\", in which case AutoML determines the number of cross-validations automatically if a validation set is not provided. Alternatively, users can specify an integer value.|\n",
         "|**enable_early_stopping**|If early stopping is on, training will stop when the primary metric is no longer improving.|\n",
         "|**forecasting_parameters**|A class that holds all the forecasting related parameters.|\n",
         "\n",
@@ -350,6 +351,7 @@
         "    country_or_region_for_holidays=\"US\",  # set country_or_region will trigger holiday featurizer\n",
         "    target_lags=\"auto\",  # use heuristic based lag setting\n",
         "    freq=\"D\",  # Set the forecast frequency to be daily\n",
+        "    cv_step_size=\"auto\",\n",
         ")\n",
         "\n",
         "automl_config = AutoMLConfig(\n",
@@ -362,7 +364,7 @@
         "    label_column_name=target_column_name,\n",
         "    compute_target=compute_target,\n",
         "    enable_early_stopping=True,\n",
-        "    n_cross_validations=3,\n",
+        "    n_cross_validations=\"auto\",  # Feel free to set to a small integer (>=2) if runtime is an issue.\n",
         "    max_concurrent_iterations=4,\n",
         "    max_cores_per_iteration=-1,\n",
         "    verbosity=logging.INFO,\n",
@@ -709,7 +711,7 @@
       "name": "python",
       "nbconvert_exporter": "python",
       "pygments_lexer": "ipython3",
-      "version": "3.6.7"
+      "version": "3.8.5"
     },
     "mimetype": "text/x-python",
     "name": "python",
@@ -719,7 +721,12 @@
       "Forecasting"
     ],
     "task": "Forecasting",
-    "version": 3
+    "version": 3,
+    "vscode": {
+      "interpreter": {
+        "hash": "6bd77c88278e012ef31757c15997a7bea8c943977c43d6909403c00ae11d43ca"
+      }
+    }
   },
   "nbformat": 4,
   "nbformat_minor": 4
 
@@ -308,7 +308,8 @@
         "|-|-|\n",
         "|**time_column_name**|The name of your time column.|\n",
         "|**forecast_horizon**|The forecast horizon is how many periods forward you would like to forecast. This integer horizon is in units of the timeseries frequency (e.g. daily, weekly).|\n",
-        "|**freq**|Forecast frequency. This optional parameter represents the period with which the forecast is desired, for example, daily, weekly, yearly, etc. Use this parameter for the correction of time series containing irregular data points or for padding of short time series. The frequency needs to be a pandas offset alias. Please refer to [pandas documentation](https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#dateoffset-objects) for more information."
+        "|**freq**|Forecast frequency. This optional parameter represents the period with which the forecast is desired, for example, daily, weekly, yearly, etc. Use this parameter for the correction of time series containing irregular data points or for padding of short time series. The frequency needs to be a pandas offset alias. Please refer to [pandas documentation](https://pandas.pydata.org/pandas-docs/stable/user_guide/timeseries.html#dateoffset-objects) for more information.\n",
+        "|**cv_step_size**|Number of periods between two consecutive cross-validation folds. The default value is \"auto\", in which case AutoML determines the cross-validation step size automatically if a validation set is not provided. Alternatively, users can specify an integer value.|"
       ]
     },
     {
@@ -328,7 +329,7 @@
         "|**training_data**|The training data to be used within the experiment.|\n",
         "|**label_column_name**|The name of the label column.|\n",
         "|**compute_target**|The remote compute for training.|\n",
-        "|**n_cross_validations**|Number of cross validation splits. Rolling Origin Validation is used to split time-series in a temporally consistent way.|\n",
+        "|**n_cross_validations**|Number of cross-validation folds to use for model/pipeline selection. The default value is \"auto\", in which case AutoML determines the number of cross-validations automatically if a validation set is not provided. Alternatively, users can specify an integer value.|\n",
         "|**enable_early_stopping**|Flag to enable early termination if the score is not improving in the short term.|\n",
         "|**forecasting_parameters**|A class holds all the forecasting related parameters.|\n"
       ]
@@ -352,6 +353,7 @@
         "    time_column_name=time_column_name,\n",
         "    forecast_horizon=forecast_horizon,\n",
         "    freq=\"H\",  # Set the forecast frequency to be hourly\n",
+        "    cv_step_size=\"auto\",\n",
         ")\n",
         "\n",
         "automl_config = AutoMLConfig(\n",
@@ -363,7 +365,7 @@
         "    label_column_name=target_column_name,\n",
         "    compute_target=compute_target,\n",
         "    enable_early_stopping=True,\n",
-        "    n_cross_validations=3,\n",
+        "    n_cross_validations=\"auto\",  # Feel free to set to a small integer (>=2) if runtime is an issue.\n",
         "    verbosity=logging.INFO,\n",
         "    forecasting_parameters=forecasting_parameters,\n",
         ")"
@@ -609,6 +611,7 @@
         "    forecast_horizon=forecast_horizon,\n",
         "    target_lags=12,\n",
         "    target_rolling_window_size=4,\n",
+        "    cv_step_size=\"auto\",\n",
         ")\n",
         "\n",
         "automl_config = AutoMLConfig(\n",
@@ -628,7 +631,7 @@
         "    label_column_name=target_column_name,\n",
         "    compute_target=compute_target,\n",
         "    enable_early_stopping=True,\n",
-        "    n_cross_validations=3,\n",
+        "    n_cross_validations=\"auto\",  # Feel free to set to a small integer (>=2) if runtime is an issue.\n",
         "    verbosity=logging.INFO,\n",
         "    forecasting_parameters=advanced_forecasting_parameters,\n",
         ")"
@@ -778,7 +781,12 @@
       "name": "python",
       "nbconvert_exporter": "python",
       "pygments_lexer": "ipython3",
-      "version": "3.6.9"
+      "version": "3.8.5"
+    },
+    "vscode": {
+      "interpreter": {
+        "hash": "6bd77c88278e012ef31757c15997a7bea8c943977c43d6909403c00ae11d43ca"
+      }
     }
   },
   "nbformat": 4,
 
@@ -335,7 +335,8 @@
         "    forecast_horizon=forecast_horizon,\n",
         "    time_series_id_column_names=[TIME_SERIES_ID_COLUMN_NAME],\n",
         "    target_lags=lags,\n",
-        "    freq=\"H\",  # Set the forecast frequency to be hourly\n",
+        "    freq=\"H\",  # Set the forecast frequency to be hourly\n",
+        "    cv_step_size=\"auto\",\n",
         ")"
       ]
     },
@@ -365,7 +366,7 @@
         "    enable_early_stopping=True,\n",
         "    training_data=train_data,\n",
         "    compute_target=compute_target,\n",
-        "    n_cross_validations=3,\n",
+        "    n_cross_validations=\"auto\",  # Feel free to set to a small integer (>=2) if runtime is an issue.\n",
         "    verbosity=logging.INFO,\n",
         "    max_concurrent_iterations=4,\n",
         "    max_cores_per_iteration=-1,\n",
@@ -879,13 +880,18 @@
       "name": "python",
       "nbconvert_exporter": "python",
       "pygments_lexer": "ipython3",
-      "version": "3.6.8"
+      "version": "3.8.5"
     },
     "tags": [
       "Forecasting",
       "Confidence Intervals"
     ],
-    "task": "Forecasting"
+    "task": "Forecasting",
+    "vscode": {
+      "interpreter": {
+        "hash": "6bd77c88278e012ef31757c15997a7bea8c943977c43d6909403c00ae11d43ca"
+      }
+    }
   },
   "nbformat": 4,
   "nbformat_minor": 2
 
@@ -263,7 +263,8 @@
         "| **experiment_timeout_hours**       | Maximum amount of time in hours that the experiment can take before it terminates. This is optional but provides customers with greater control on exit criteria. |\n",
         "| **label_column_name**              | The name of the label column. |\n",
         "| **forecast_horizon**               | The forecast horizon is how many periods forward you would like to forecast. This integer horizon is in units of the timeseries frequency (e.g. daily, weekly). Periods are inferred from your data. |\n",
-        "| **n_cross_validations**            | Number of cross validation splits. Rolling Origin Validation is used to split time-series in a temporally consistent way. |\n",
+        "| **n_cross_validations**            | Number of cross-validation folds to use for model/pipeline selection. The default value is \"auto\", in which case AutoML determines the number of cross-validations automatically if a validation set is not provided. Alternatively, users can specify an integer value. |\n",
+        "| **cv_step_size**                   | Number of periods between two consecutive cross-validation folds. The default value is \"auto\", in which case AutoML determines the cross-validation step size automatically if a validation set is not provided. Alternatively, users can specify an integer value. |\n",
         "| **enable_early_stopping**          | Flag to enable early termination if the score is not improving in the short term. |\n",
         "| **time_column_name**               | The name of your time column. |\n",
         "| **hierarchy_column_names**         | The names of columns that define the hierarchical structure of the data from highest level to most granular. |\n",
@@ -311,10 +312,11 @@
         "    \"track_child_runs\": False,\n",
         "    \"pipeline_fetch_max_batch_size\": 15,\n",
         "    \"model_explainability\": model_explainability,\n",
+        "    \"n_cross_validations\": \"auto\",  # Feel free to set to a small integer (>=2) if runtime is an issue.\n",
+        "    \"cv_step_size\": \"auto\",\n",
         "    # The following settings are specific to this sample and should be adjusted according to your own needs.\n",
         "    \"iteration_timeout_minutes\": 10,\n",
         "    \"iterations\": 10,\n",
-        "    \"n_cross_validations\": 2,\n",
         "}\n",
         "\n",
         "hts_parameters = HTSTrainParameters(\n",