%matplotlib inline
%load_ext autoreload
%autoreload 2


import datetime
import time

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

try:
    from sktime.forecasting.model_selection import temporal_train_test_split
except ImportError:
    try:
        from sktime.split import TemporalTrainTestSplitter as temporal_train_test_split
    except ImportError as e:
        raise ImportError("Failed to import Splitters from sktime. "
                          "Please ensure you have the correct version of sktime installed.") from e

plt.rcParams["figure.figsize"] = [15, 5]
plt.rcParams["font.size"] = 15

import automlx
from automlx import init


! wget https://github.com/Mcompetitions/M4-methods/raw/master/Dataset/Train/Weekly-train.csv -q
! wget https://github.com/Mcompetitions/M4-methods/raw/master/Dataset/M4-info.csv -q


all_series = pd.read_csv("Weekly-train.csv", index_col=0)  # consists of thousands of series
metadata_csv = pd.read_csv("M4-info.csv", index_col=0)  # describes their datetime index


series_id = "W142"
series_metadata = metadata_csv.loc[series_id]
series_values = all_series.loc[series_id]

# drop NaNs for the time period where data wasn't recorded
series_values.dropna(inplace=True)

# retrieve starting date of recording and series length to generate the datetime index
start_date = pd.to_datetime(series_metadata.StartingDate)
future_dates = pd.date_range(start=start_date, periods=len(series_values), freq="W")
y = pd.DataFrame(
    series_values.to_numpy(),
    index=future_dates,
    columns=[(series_metadata.category + "_" + series_id)],
)


y = y.tail(n=200)  # approximately 4 years of data
y.plot(ylabel="Weekly Series " + series_id, grid=True)

<Axes: ylabel='Weekly Series W142'>


print(y.index)
print("Time Index is", "" if y.index.is_monotonic_increasing else "NOT", "monotonic.")
print("Train datatype", type(y))

DatetimeIndex(['2012-12-09 12:00:00', '2012-12-16 12:00:00',
               '2012-12-23 12:00:00', '2012-12-30 12:00:00',
               '2013-01-06 12:00:00', '2013-01-13 12:00:00',
               '2013-01-20 12:00:00', '2013-01-27 12:00:00',
               '2013-02-03 12:00:00', '2013-02-10 12:00:00',
               ...
               '2016-07-31 12:00:00', '2016-08-07 12:00:00',
               '2016-08-14 12:00:00', '2016-08-21 12:00:00',
               '2016-08-28 12:00:00', '2016-09-04 12:00:00',
               '2016-09-11 12:00:00', '2016-09-18 12:00:00',
               '2016-09-25 12:00:00', '2016-10-02 12:00:00'],
              dtype='datetime64[ns]', length=200, freq='W-SUN')
Time Index is  monotonic.
Train datatype <class 'pandas.core.frame.DataFrame'>


y_train, y_test = temporal_train_test_split(y, test_size=26)
print("Training length: ", len(y_train), " Testing length: ", len(y_test))

Training length:  174  Testing length:  26


print("y_train", y_train)
print("\ny_test", y_test)

y_train                      Finance_W142
2012-12-09 12:00:00      4793.269
2012-12-16 12:00:00      4818.969
2012-12-23 12:00:00      4863.783
2012-12-30 12:00:00      4926.357
2013-01-06 12:00:00      4916.616
...                           ...
2016-03-06 12:00:00      5024.759
2016-03-13 12:00:00      5021.153
2016-03-20 12:00:00      4996.524
2016-03-27 12:00:00      5004.032
2016-04-03 12:00:00      5053.536

[174 rows x 1 columns]

y_test                      Finance_W142
2016-04-10 12:00:00      5039.544
2016-04-17 12:00:00      5053.420
2016-04-24 12:00:00      5066.860
2016-05-01 12:00:00      5099.887
2016-05-08 12:00:00      5082.291
2016-05-15 12:00:00      5084.340
2016-05-22 12:00:00      5081.651
2016-05-29 12:00:00      5106.797
2016-06-05 12:00:00      5147.906
2016-06-12 12:00:00      5140.993
2016-06-19 12:00:00      5153.210
2016-06-26 12:00:00      5258.369
2016-07-03 12:00:00      5307.455
2016-07-10 12:00:00      5295.631
2016-07-17 12:00:00      5300.088
2016-07-24 12:00:00      5295.456
2016-07-31 12:00:00      5333.739
2016-08-07 12:00:00      5338.803
2016-08-14 12:00:00      5339.390
2016-08-21 12:00:00      5345.043
2016-08-28 12:00:00      5369.168
2016-09-04 12:00:00      5401.186
2016-09-11 12:00:00      5395.298
2016-09-18 12:00:00      5386.552
2016-09-25 12:00:00      5377.376
2016-10-02 12:00:00      5406.685


init(engine="ray")

[2025-05-22 05:16:38,343] [automlx.backend] Overwriting ray session directory to /tmp/z9fyq_g2/ray, which will be deleted at engine shutdown. If you wish to retain ray logs, provide _temp_dir in ray_setup dict of engine_opts when initializing the AutoMLx engine.


est1 = automlx.Pipeline(task="forecasting", n_algos_tuned=2)
est1.fit(X=None, y=y_train)

print("Selected model: {}".format(est1.selected_model_))
print("Selected model params: {}".format(est1.selected_model_params_))

[2025-05-22 05:16:43,535] [automlx.data_transform] Number of simple differencing orders required: d = 1
[2025-05-22 05:16:43,538] [automlx.data_transform] Seasonal Periodicities; from decomposed/adjusted: [52, 35, 1]
[2025-05-22 05:16:43,603] [automlx.interface] Dataset shape: (174,2)
[2025-05-22 05:16:46,294] [sanerec.autotuning.parameter] Hyperparameter epsilon autotune range is set to its validation range. This could lead to long training times
[2025-05-22 05:16:46,611] [sanerec.autotuning.parameter] Hyperparameter repeat_quality_threshold autotune range is set to its validation range. This could lead to long training times
[2025-05-22 05:16:46,617] [sanerec.autotuning.parameter] Hyperparameter scope autotune range is set to its validation range. This could lead to long training times
[2025-05-22 05:16:46,714] [automlx.data_transform] Running preprocessing. Number of features: 3
[2025-05-22 05:16:46,800] [automlx.data_transform] Preprocessing completed. Took 0.087 secs
[2025-05-22 05:16:46,810] [automlx.process] Running Model Generation
[2025-05-22 05:16:46,860] [automlx] Provided model (VARMAXForecaster) is not supported.Supported models are: ['LGBMForecaster', 'ExtraTreesForecaster', 'ExpSmoothForecaster', 'NaiveForecaster', 'SARIMAXForecaster', 'STLwARIMAForecaster', 'ThetaForecaster', 'ProphetForecaster', 'ETSForecaster', 'STLwESForecaster', 'XGBForecaster']
[2025-05-22 05:16:46,860] [automlx] Provided model (DynFactorForecaster) is not supported.Supported models are: ['LGBMForecaster', 'ExtraTreesForecaster', 'ExpSmoothForecaster', 'NaiveForecaster', 'SARIMAXForecaster', 'STLwARIMAForecaster', 'ThetaForecaster', 'ProphetForecaster', 'ETSForecaster', 'STLwESForecaster', 'XGBForecaster']
[2025-05-22 05:16:46,861] [automlx.process] Model Generation completed.
[2025-05-22 05:16:46,930] [automlx.model_selection] Running Model Selection
[2025-05-22 05:16:50,911] [automlx.dataset] Forecast horizon set to 13 for validation sets.
[2025-05-22 05:17:05,408] [automlx.model_selection] Model Selection completed - Took 18.478 sec - Selected models: [['ETSForecaster', 'STLwARIMAForecaster']]
[2025-05-22 05:17:05,494] [automlx.trials] Running Model Tuning for ['ETSForecaster']
[2025-05-22 05:17:05,566] [automlx.dataset] Forecast horizon set to 13 for validation sets.
[2025-05-22 05:17:13,983] [automlx.trials] Best parameters for ETSForecaster: {'error': 'add', 'trend': 'add', 'damped_trend': True, 'seasonal': 'add', 'seasonal_periods': 52, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}
[2025-05-22 05:17:13,985] [automlx.trials] Model Tuning completed. Took: 8.490 secs
[2025-05-22 05:17:14,202] [automlx.trials] Running Model Tuning for ['STLwARIMAForecaster']
[2025-05-22 05:17:14,287] [automlx.dataset] Forecast horizon set to 13 for validation sets.
[2025-05-22 05:17:17,083] [automlx.trials] Best parameters for STLwARIMAForecaster: {'seasonal_deg': 1, 'trend_deg': 1, 'low_pass_deg': 1, 'period': 52, 'arima_p': 2, 'arima_d': 1, 'arima_q': 2, 'arima_trend': 'n', 'concentrate_scale': True}
[2025-05-22 05:17:17,084] [automlx.trials] Model Tuning completed. Took: 2.881 secs
[2025-05-22 05:17:18,994] [automlx.interface] Re-fitting pipeline
[2025-05-22 05:17:19,016] [automlx.final_fit] Skipping updating parameter seed, already fixed by FinalFit_5439e7f1-c
[2025-05-22 05:17:20,802] [automlx.interface] AutoMLx completed.
Selected model: ETSForecaster
Selected model params: {'error': 'add', 'trend': 'add', 'damped_trend': True, 'seasonal': 'add', 'seasonal_periods': 52, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}


predictions = est1.forecast(periods=len(y_test), alpha=0.05)

[2025-05-22 05:17:22,400] [automlx.model] Forecast called on ETSForecaster that's not been fitted.


future_index = y_train.index[-5:].union(y_test.index[:5])
print(future_index)

DatetimeIndex(['2016-03-06 12:00:00', '2016-03-13 12:00:00',
               '2016-03-20 12:00:00', '2016-03-27 12:00:00',
               '2016-04-03 12:00:00', '2016-04-10 12:00:00',
               '2016-04-17 12:00:00', '2016-04-24 12:00:00',
               '2016-05-01 12:00:00', '2016-05-08 12:00:00'],
              dtype='datetime64[ns]', freq='W-SUN')


est1.predict(X=pd.DataFrame(index=future_index))

[2025-05-22 05:17:22,523] [automlx.model] Predict called on ETSForecaster that's not been fitted.


est1.plot_forecast(predictions=predictions, additional_frames=dict(y_test=y_test))


est1.print_summary()


# Each trial is a tuple of
# (algorithm, no. samples, no. features, mean CV score, hyperparameters,
# all CV scores, total CV time (s), memory usage (Gb))
trials = est1.completed_trials_summary_[
    est1.completed_trials_summary_["Step"].str.contains("Model Selection")
]
name_of_score_column = f"Score ({est1._inferred_score_metric[0].name})"
trials.replace([np.inf, -np.inf], np.nan, inplace=True)
trials.dropna(subset=[name_of_score_column], inplace=True)
scores = trials[name_of_score_column].tolist()
models = trials["Algorithm"].tolist()
colors = []

y_margin = 0.10 * (max(scores) - min(scores))
s = pd.Series(scores, index=models).sort_values(ascending=False)
s = s.dropna()
for f in s.keys():
    if f.strip() == est1.selected_model_.strip():
        colors.append("orange")
    elif s[f] >= s.mean():
        colors.append("teal")
    else:
        colors.append("turquoise")


fig, ax = plt.subplots(1)
ax.set_title("Algorithm Selection Trials")
ax.set_ylim(min(scores) - y_margin, max(scores) + y_margin)
ax.set_ylabel(est1._inferred_score_metric[0].name)
s.plot.bar(ax=ax, color=colors, edgecolor="black")
ax.axhline(y=s.mean(), color="black", linewidth=0.5)
plt.show()


# Each trial is a row in a dataframe that contains
# Algorithm, Number of Samples, Number of Features, Hyperparameters, Score, Runtime, Memory Usage, Step as features
trials = est1.completed_trials_summary_[
    est1.completed_trials_summary_["Step"].str.contains("Model Tuning")
]
trials.replace([np.inf, -np.inf], np.nan, inplace=True)
trials.dropna(subset=[name_of_score_column], inplace=True)
trials.drop(trials[trials["Finished"] == -1].index, inplace=True)
trials["Finished"] = trials["Finished"].apply(
    lambda x: time.mktime(datetime.datetime.strptime(x, "%a %b %d %H:%M:%S %Y").timetuple())
)
trials.sort_values(by=["Finished"], ascending=True, inplace=True)
scores = trials[name_of_score_column].tolist()
score = []
score.append(scores[0])
for i in range(1, len(scores)):
    if scores[i] >= score[i - 1]:
        score.append(scores[i])
    else:
        score.append(score[i - 1])
y_margin = 0.10 * (max(score) - min(score))

fig, ax = plt.subplots(1)
ax.set_title("Hyperparameter Tuning Trials")
ax.set_xlabel("Iteration $n$")
ax.set_ylabel(est1._inferred_score_metric[0].name)
ax.grid(color="g", linestyle="-", linewidth=0.1)
ax.set_ylim(min(score) - y_margin, max(score) + y_margin)
ax.plot(range(1, len(trials) + 1), score, "k:", marker="s", color="teal", markersize=3)
plt.show()


print(f"### Plotting is enabled for total models tuned = {len(est1.pipelines_)}.")
print("### Model_name\t\t Val_score ")

for pipeline in est1.pipelines_:
    print(
        pipeline.selected_model_,
        " \t",
        "%.4f"
        % est1.completed_trials_summary_[est1.completed_trials_summary_["Algorithm"] == pipeline.selected_model_].iloc[0][name_of_score_column],
        "\t",  # validation_score
    )
    predictions = pipeline.forecast(periods=len(y_test), alpha=0.05)  # out-of-sample forecast
    predictions.index = y_test.index
    fig = pipeline.plot_forecast(predictions=predictions, additional_frames=dict(y_test=y_test))
    fig.show()

### Plotting is enabled for total models tuned = 2.
### Model_name		 Val_score 
ETSForecaster  	 -0.0361 	
[2025-05-22 05:17:23,818] [automlx.model] Forecast called on ETSForecaster that's not been fitted.

STLwARIMAForecaster  	 -0.0855


series_ids = ["W142", "W143"]
series_values = all_series.loc[series_ids].T

# drop NaNs for the time period where data wasn't recorded
series_values.dropna(inplace=True)

# we will take the first 100 elements of the series
series_values = series_values[:100]

# retrieve starting date of recording and series length to generate the datetime index
start_date = "28-06-00 12:00"
future_dates = pd.date_range(start=start_date, periods=len(series_values), freq="W")
data = pd.DataFrame(series_values.to_numpy(), index=future_dates, columns=series_ids)
data.index = np.arange(0, len(data))

y = pd.DataFrame(data["W142"])
X = pd.DataFrame(data["W143"])


X_train_df, X_test_df = temporal_train_test_split(X, train_size=0.9)
y_train_df, y_test_df = temporal_train_test_split(y, train_size=0.9)


est2 = automlx.Pipeline(
    task="forecasting",
    model_list=[
        "LGBMForecaster",
        "ExtraTreesForecaster",
        "XGBForecaster",
        "SARIMAXForecaster",
        "ProphetForecaster",
    ],
)
est2.fit(X=X_train_df, y=y_train_df)

print("Selected model: {}".format(est2.selected_model_))
print("Selected model params: {}".format(est2.selected_model_params_))

[2025-05-22 05:17:24,162] [automlx.data_transform] Number of simple differencing orders required: d = 0
[2025-05-22 05:17:24,164] [automlx.data_transform] Seasonal Periodicities; from decomposed/adjusted: [1]
[2025-05-22 05:17:24,235] [automlx.interface] Dataset shape: (90,3)
[2025-05-22 05:17:24,342] [automlx.data_transform] Running preprocessing. Number of features: 4
[2025-05-22 05:17:24,449] [automlx.data_transform] Preprocessing completed. Took 0.107 secs
[2025-05-22 05:17:24,490] [automlx.process] Running Model Generation
[2025-05-22 05:17:24,536] [automlx] Provided model (SARIMAXForecaster) is not supported.Supported models are: ['LGBMForecaster', 'ExtraTreesForecaster', 'ExpSmoothForecaster', 'NaiveForecaster', 'ThetaForecaster', 'ETSForecaster', 'XGBForecaster']
[2025-05-22 05:17:24,536] [automlx] Provided model (ProphetForecaster) is not supported.Supported models are: ['LGBMForecaster', 'ExtraTreesForecaster', 'ExpSmoothForecaster', 'NaiveForecaster', 'ThetaForecaster', 'ETSForecaster', 'XGBForecaster']
[2025-05-22 05:17:24,538] [automlx.process] Model Generation completed.
[2025-05-22 05:17:24,590] [automlx.model_selection] Running Model Selection
[2025-05-22 05:17:30,685] [automlx.model_selection] Model Selection completed - Took 6.095 sec - Selected models: [['XGBForecaster']]
[2025-05-22 05:17:30,758] [automlx.trials] Running Model Tuning for ['XGBForecaster']
[2025-05-22 05:17:45,375] [automlx.trials] Best parameters for XGBForecaster: {'differencing_order': 1, 'acf_local_maxima': '[4, 9, 18, 22, 14, 31, 26, 12, 1]', 'use_X': True, 'n_estimators': 16, 'max_depth': 2}
[2025-05-22 05:17:45,376] [automlx.trials] Model Tuning completed. Took: 14.618 secs
[2025-05-22 05:17:45,790] [automlx.interface] Re-fitting pipeline
[2025-05-22 05:17:45,801] [automlx.final_fit] Skipping updating parameter seed, already fixed by FinalFit_3b050512-1
[2025-05-22 05:17:48,871] [automlx.interface] AutoMLx completed.
Selected model: XGBForecaster
Selected model params: {'differencing_order': 1, 'acf_local_maxima': '[4, 9, 18, 22, 14, 31, 26, 12, 1]', 'use_X': True, 'n_estimators': 16, 'max_depth': 2}


series_ids = ["W141", "W142", "W143"]
series_values = all_series.loc[series_ids].T

# drop NaNs for the time period where data wasn't recorded
series_values.dropna(inplace=True)
# we will take the first 100 elements of the series
series_values = series_values[:100]


# retrieve starting date of recording and series length to generate the datetime index
start_date = "28-06-00 12:00"
future_dates = pd.date_range(start=start_date, periods=len(series_values), freq="W")
data = pd.DataFrame(series_values.to_numpy(), index=future_dates, columns=series_ids)
data.index = np.arange(0, len(data))

y = data[["W142", "W143"]]
X = pd.DataFrame(data["W141"])
# adding the constant variable
X["const"] = 1

X_train_df, X_test_df = temporal_train_test_split(X, train_size=0.9)
y_train_df, y_test_df = temporal_train_test_split(y, train_size=0.9)


custom_pipeline = automlx.Pipeline(
    task="forecasting",  # Supports 'classification', regression', 'anomaly_detection' and 'forecasting'
    model_list=[  # Specify the models you want the AutoMLx to consider
        "DynFactorForecaster",
        "VARMAXForecaster",
    ],
    n_algos_tuned=2,  # Choose how many models to tune
    preprocessing=True,  # Disable or enable Preprocessing step. Default to `True`
    search_space={},  # You can specify the hyper-parameters and ranges we search
    max_tuning_trials=2,  # The maximum number of tuning trials. Can be integer or Dict (max number for each model)
    score_metric="neg_sym_mean_abs_percent_error",  # Any scikit-learn metric or a custom function
    time_series_period=None,  # The period of time series
)


custom_pipeline.fit(X=X_train_df, y=y_train_df, cv=8)

[2025-05-22 05:17:49,513] [automlx.data_transform] Number of simple differencing orders required: d = 0
[2025-05-22 05:17:49,515] [automlx.data_transform] Seasonal Periodicities; from decomposed/adjusted: [1]
[2025-05-22 05:17:49,600] [automlx.interface] Dataset shape: (90,5)
[2025-05-22 05:17:49,641] [automlx.interface] Model Tune disabled.
[2025-05-22 05:17:49,711] [automlx.data_transform] Running preprocessing. Number of features: 6
[2025-05-22 05:17:49,823] [automlx.data_transform] Preprocessing completed. Took 0.111 secs
[2025-05-22 05:17:49,873] [automlx.process] Running Model Generation
[2025-05-22 05:17:49,913] [automlx.process] Model Generation completed.
[2025-05-22 05:17:49,972] [automlx.model_selection] Running Model Selection
[2025-05-22 05:17:49,972] [automlx.trials] Fewer models (2) than top_k (2) provided, skipping...
[2025-05-22 05:17:50,044] [automlx.interface] Re-fitting pipeline
[2025-05-22 05:17:50,061] [automlx.final_fit] Skipping updating parameter seed, already fixed by FinalFit_fa016e40-2
[2025-05-22 05:17:51,918] [automlx.interface] AutoMLx completed.

<automlx._interface.forecaster.AutoForecaster at 0x14a81890dfa0>


test_score = custom_pipeline.score(X=X_test_df, y=y_test_df)

print("Ranked models: {}".format(custom_pipeline.ranked_models_))
print("Selected model: {}".format(custom_pipeline.selected_model_))
print("Selected model params: {}".format(custom_pipeline.selected_model_params_))
print(f"Score on test data : {test_score}")

[2025-05-22 05:17:52,159] [automlx.model] Predict called on DynFactorForecaster that's not been fitted.
Ranked models: ['DynFactorForecaster', 'VARMAXForecaster']
Selected model: DynFactorForecaster
Selected model params: {'k_factors': 1, 'error_order': 2, 'factor_order': 2, 'error_cov_type': 'diagonal', 'use_X': True, 'error_var': False, 'enforce_stationarity': True}
Score on test data : -0.45821993166134833


y_pred = custom_pipeline.predict(pd.concat([X_train_df[-5:0], X_test_df], axis=0))
y_forecast = custom_pipeline.forecast(
    len(y_test_df), alpha=0.8, X=X_test_df
)  # out-of-sample forecast

[2025-05-22 05:17:52,258] [automlx.model] Predict called on DynFactorForecaster that's not been fitted.
[2025-05-22 05:17:52,279] [automlx.model] Forecast called on DynFactorForecaster that's not been fitted.


y_forecast


print(
    "Tuned model testing score (negative sMAPE): ", custom_pipeline.score(X=X_test_df, y=y_test_df)
)

[2025-05-22 05:17:52,439] [automlx.model] Predict called on DynFactorForecaster that's not been fitted.
Tuned model testing score (negative sMAPE):  -0.45821993166134833


custom_pipeline.plot_forecast(predictions=y_forecast, additional_frames=dict(test=y_test_df))


explainer = automlx.MLExplainer(est1,
                                None,
                                y_train,
                                task="forecasting")

[2025-05-22 05:17:52,834] [automlx.model] Predict called on ETSForecaster that's not been fitted.


exp = explainer.explain_prediction(forecast_timepoints=[10])

[2025-05-22 05:17:53,040] [automlx.model] Forecast called on ETSForecaster that's not been fitted.
[2025-05-22 05:17:53,648] [automlx.model] Forecast called on ETSForecaster that's not been fitted.


exp[0].to_dataframe(n_features=10)

[2025-05-22 05:17:56,724] [automlx.mlx] Displaying only non-zero attributions.


exp[0].show_in_notebook()


advanced_exp = explainer.explain_prediction(forecast_timepoints=[10], reference_timepoint=-13)
advanced_exp[0].show_in_notebook()

[2025-05-22 05:17:57,467] [automlx.model] Forecast called on ETSForecaster that's not been fitted.
[2025-05-22 05:17:58,072] [automlx.model] Forecast called on ETSForecaster that's not been fitted.

Step	# Samples	# Features	Algorithm	Hyperparameters	Score (neg_sym_mean_abs_percent_error)	Runtime (Seconds)	Memory Usage (GB)	Finished
Model Selection	161	2	ETSForecaster	{'error': 'add', 'trend': 'add', 'damped_trend': False, 'seasonal': 'add', 'seasonal_periods': 52, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}	-0.0361	5.5539	0.3021	Thu May 22 05:16:57 2025
Model Selection	161	2	STLwARIMAForecaster	{'seasonal_deg': 1, 'trend_deg': 1, 'low_pass_deg': 0, 'period': 52, 'arima_p': 2, 'arima_d': 1, 'arima_q': 2, 'arima_trend': 'n', 'concentrate_scale': True}	-0.0855	1.5110	0.3125	Thu May 22 05:16:56 2025
Model Selection	161	2	XGBForecaster	{'differencing_order': 1, 'acf_local_maxima': '[52, 35, 17, 26, 22, 4, 48, 30, 13, 56, 39, 61, 44, 9, 65, 1]', 'use_X': True, 'n_estimators': 50, 'max_depth': 5}	-0.0951	19.0194	0.7352	Thu May 22 05:17:04 2025
Model Selection	148	2	ExtraTreesForecaster	{'differencing_order': 1, 'acf_local_maxima': '[52, 35, 17, 26, 22, 4, 48, 30, 13, 56, 39, 61, 44, 9, 65, 1]', 'use_X': True, 'n_estimators': 40, 'min_samples_leaf': 0.030458}	-0.1252	23.8061	0.7191	Thu May 22 05:17:01 2025
Model Selection	135	2	LGBMForecaster	{'differencing_order': 1, 'acf_local_maxima': '[52, 35, 17, 26, 22, 4, 48, 30, 13, 56, 39, 61, 44, 9, 65, 1]', 'use_X': True, 'max_depth': 4, 'n_estimators': 37}	-0.13	10.1164	0.7386	Thu May 22 05:17:05 2025
Model Selection	148	2	ThetaForecaster	{'sp': 52, 'deseasonalize': False, 'initial_level': None}	-0.2091	10.4193	0.3012	Thu May 22 05:16:56 2025
Model Selection	161	2	ExpSmoothForecaster	{'trend': 'add', 'damped_trend': True, 'seasonal': None, 'sp': 52, 'use_boxcox': False}	-0.2475	7.6202	0.2963	Thu May 22 05:16:56 2025
Model Selection	109	2	NaiveForecaster	{'strategy': 'last', 'sp': 52, 'window_length': None}	-0.4494	9.1389	0.2845	Thu May 22 05:16:55 2025
Model Selection	161	2	STLwESForecaster	{'seasonal_deg': 1, 'trend_deg': 1, 'low_pass_deg': 1, 'period': 52, 'es_trend': 'add', 'es_damped_trend': True, 'concentrate_scale': True}	-inf	1.5751	0.3132	Thu May 22 05:16:56 2025
Model Selection	161	2	SARIMAXForecaster	{'sp': 52, 'p': 2, 'd': 1, 'q': 2, 'P': 1, 'D': 0, 'Q': 1, 'trend': 'n', 'use_X': True, 'enforce_stationarity': True, 'enforce_invertibility': True, 'method': 'lbfgs', 'disp': -1, 'concentrate_scale': False}	-inf	28.3533	0.3440	Thu May 22 05:17:02 2025
...	...	...	...	...	...	...	...	...
Model Tuning	161	2	ETSForecaster	{'error': 'add', 'trend': 'add', 'damped_trend': False, 'seasonal': 'add', 'seasonal_periods': 35, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}	-inf	5.7152	0.7399	Thu May 22 05:17:10 2025
Model Tuning	161	2	ETSForecaster	{'error': 'add', 'trend': 'add', 'damped_trend': True, 'seasonal': 'add', 'seasonal_periods': 35, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}	-inf	5.4003	0.7369	Thu May 22 05:17:13 2025
Model Tuning	161	2	ETSForecaster	{'error': 'add', 'trend': 'mul', 'damped_trend': False, 'seasonal': 'add', 'seasonal_periods': 52, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}	-inf	6.9341	0.7346	Thu May 22 05:17:11 2025
Model Tuning	148	2	ETSForecaster	{'error': 'add', 'trend': None, 'damped_trend': False, 'seasonal': 'add', 'seasonal_periods': 52, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}	-inf	5.1213	0.7399	Thu May 22 05:17:11 2025
Model Tuning	148	2	ETSForecaster	{'error': 'mul', 'trend': 'add', 'damped_trend': False, 'seasonal': 'add', 'seasonal_periods': 52, 'initialization_method': 'estimated', 'initial_level': None, 'initial_trend': None, 'initial_seasonal': None, 'bounds': None, 'dates': None, 'freq': None, 'missing': 'none', 'start_params': None, 'maxiter': 1500, 'disp': -1, 'return_params': False}	-inf	9.9058	0.7394	Thu May 22 05:17:08 2025
Model Tuning	161	2	STLwARIMAForecaster	{'seasonal_deg': 0, 'trend_deg': 0, 'low_pass_deg': 0, 'period': 52, 'arima_p': 0, 'arima_d': 1, 'arima_q': 0, 'arima_trend': 'n', 'concentrate_scale': True}	-inf	0.4764	0.7400	Thu May 22 05:17:16 2025
Model Tuning	135	2	STLwARIMAForecaster	{'seasonal_deg': 0, 'trend_deg': 1, 'low_pass_deg': 0, 'period': 52, 'arima_p': 2, 'arima_d': 1, 'arima_q': 2, 'arima_trend': 'n', 'concentrate_scale': True}	-inf	1.8820	0.7403	Thu May 22 05:17:16 2025
Model Tuning	161	2	STLwARIMAForecaster	{'seasonal_deg': 1, 'trend_deg': 1, 'low_pass_deg': 0, 'period': 1, 'arima_p': 2, 'arima_d': 1, 'arima_q': 2, 'arima_trend': 'n', 'concentrate_scale': True}	-inf	0.4002	0.7403	Thu May 22 05:17:16 2025
Model Tuning	161	2	STLwARIMAForecaster	{'seasonal_deg': 1, 'trend_deg': 1, 'low_pass_deg': 0, 'period': 52, 'arima_p': 3, 'arima_d': 1, 'arima_q': 2, 'arima_trend': 'n', 'concentrate_scale': True}	-inf	1.5363	0.7460	Thu May 22 05:17:15 2025
Model Tuning	161	2	STLwARIMAForecaster	{'seasonal_deg': 1, 'trend_deg': 1, 'low_pass_deg': 0, 'period': 52, 'arima_p': 5, 'arima_d': 1, 'arima_q': 2, 'arima_trend': 'n', 'concentrate_scale': True}	-inf	1.7382	0.7460	Thu May 22 05:17:15 2025

	W142	W143	W142_ci_lower	W142_ci_upper
90	1525.364311	4120.705204	1516.139510	1534.589111
91	1532.862846	4110.992426	1519.246154	1546.479538
92	1522.772589	4118.850533	1506.048922	1539.496256
93	1520.196238	4119.049832	1501.057987	1539.334490
94	1520.707582	4115.975299	1499.581227	1541.833938
95	1514.154962	4119.741508	1491.327947	1536.981976
96	1514.379038	4116.655394	1490.057821	1538.700255
97	1509.617328	4118.423102	1483.957322	1535.277333
98	1513.422128	4111.623366	1486.544654	1540.299602
99	1505.548897	4116.366154	1477.551476	1533.546318

	Feature	Attribution
0	Yearly periodicity of Finance_W142	67.238872
1	Trend of Finance_W142	17.761128

Building a Forecaster using AutoMLx

Overview of this Notebook¶

Prerequisites¶

Business Use¶

Table of Contents¶

Setup¶

Load the M4 Forecasting Competition dataset¶

Univariate time series (single-target forecasting)¶

Split data into train and test for the forecasting task¶

Setting the execution engine¶

Create an instance of Oracle AutoMLx¶

Train a forecasting model using Oracle AutoMLx¶

Generating and visualizing forecasts¶

Analyze the AutoML optimization process¶

Algorithm Selection¶

Hyperparameter Tuning¶

Multivariate time series¶

Single-target Forecasting with Exogenous Variables¶

Multi-target Forecasting with Exogenous Variables¶

Advanced AutoML Configuration¶

Specify the number of cross-validation (CV) folds¶

Make predictions¶

Visualization¶

Machine Learning Explainability (MLX)¶

Initializing an MLExplainer¶

Prediction Explanations (Comparative Feature Importance)¶

Visualization¶

References¶

	Finance_W142
2016-03-06 12:00:00	5015.306711
2016-03-13 12:00:00	5013.432026
2016-03-20 12:00:00	4998.150861
2016-03-27 12:00:00	5013.397612
2016-04-03 12:00:00	5028.193875
2016-04-10 12:00:00	5052.535771
2016-04-17 12:00:00	5066.283916
2016-04-24 12:00:00	5079.054044
2016-05-01 12:00:00	5102.910187
2016-05-08 12:00:00	5088.244409