Forecasting Paediatric Emergency Department Attendances¶

HPDM097 – Making a Difference with Health Data

Executive Summary¶

This project helps an NHS trust forecast the daily number of paediatric emergency department attendances over the next 28 days.

Analysis of historical attendance data showed patterns of higher attendances on certain days of the week and at certain times of the year. There was substantial day-to-day variability in attendances, but no evidence of a sustained long-term trend.

The following forecasting approaches were evaluated.

  1. Simple naïve methods, assessed first to establish a baseline for comparison.

  2. SARIMAX, which captures autocorrelation and seasonal structure through autoregressive and moving-average components.

  3. Prophet, an additive regression model that sums trend, seasonality, and changepoint effects.

Forecast accuracy was assessed using standard error metrics across the full 28-day forecast horizon, using rolling-origin cross-validation.

Prophet consistently outperformed both the naïve benchmarks and the SARIMAX model. On this basis, Prophet was selected for final forecasting.

A final 28-day forecast with prediction intervals was produced to support staffing decisions over the next four weeks. This forecast predicts rising demand over the four-week period, and recommendations are made on this basis.

1.1 Introduction¶

Paediatric emergency attendances are influenced by factors which can make demand variable and difficult to predict: seasonal patterns over the months of the year, patterns over the week, and variation driven by the school term calendar. Demand forecasting supports service delivery by producing short-term forecasts that help hospitals plan staffing levels and manage operational pressures.

1.2 Objectives¶

The objectives of this project are to:

  • Explore patterns in paediatric emergency department attendances
  • Evaluate naïve and statistical forecasting methods for short-term demand
  • Select a suitable forecasting approach
  • Produce a reproducible 28-day forecast of paediatric ED attendances

2 Setup¶

This analysis was conducted in Python using the HDS_forecast environment provided by Exeter University for this module. All results are fully reproducible by running the notebook from top to bottom, within the HDS_forecast environment.

Alternatively, a matching environment can be created using the provided demand_forecast.yml file:

conda env create -f demand_forecast.yml

conda activate demand_forecast

The historical attendance data is included in the file paediatrics_train.csv.

In [23]:
# ------------------------------------------------------------
# 2. Import libraries and data path
# ------------------------------------------------------------

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from prophet import Prophet
from pmdarima import auto_arima
from statsmodels.tsa.statespace.sarimax import SARIMAX
import warnings
import logging
from IPython.display import display

# Path to data file
DATA_FILE = "paediatrics_train.csv"

# Silence warnings and logs to keep the notebook clean
warnings.filterwarnings("ignore")
logging.disable(logging.CRITICAL)

3. Data Description and Initial Analysis¶

The dataset consists of counts of paediatric emergency department attendances between April 2014 and February 2017. Observations are recorded at daily frequency.

In [24]:
# ------------------------------------------------------------
# 3.1 Load and inspect data
# ------------------------------------------------------------

df = pd.read_csv(DATA_FILE, parse_dates=["date"], index_col="date")
df = df.asfreq("D")

print(df.head(), "\n")
print(df.info())
            paed_ed_attends
date                       
2014-04-01               47
2014-04-02               46
2014-04-03               47
2014-04-04               48
2014-04-05               52 

<class 'pandas.core.frame.DataFrame'>
DatetimeIndex: 1056 entries, 2014-04-01 to 2017-02-19
Freq: D
Data columns (total 1 columns):
 #   Column           Non-Null Count  Dtype
---  ------           --------------  -----
 0   paed_ed_attends  1056 non-null   int64
dtypes: int64(1)
memory usage: 16.5 KB
None

3.2 Data Quality Checks¶

The data was checked for missing values, duplicate or missing dates, and negative or non-integer counts. None were identified.

In [25]:
# ------------------------------------------------------------
# 3.2 Data Quality Checks
# ------------------------------------------------------------

# Missing values
missing_values = df.isna().sum()

# Duplicate dates
duplicate_dates = df.index.duplicated().sum()

# Check for continuous daily frequency
full_date_range = pd.date_range(start=df.index.min(), end=df.index.max(), freq="D")
missing_dates = full_date_range.difference(df.index)

# Validity of attendance counts
negative_counts = (df["paed_ed_attends"] < 0).sum()
non_integer_counts = (df["paed_ed_attends"] % 1 != 0).sum()

# Display results
print("Missing values per column:")
print(missing_values, "\n")

print(f"Number of duplicate dates: {duplicate_dates}")
print(f"Number of missing dates in daily sequence: {len(missing_dates)}")
print(f"Negative attendance values: {negative_counts}")
print(f"Non-integer attendance values: {non_integer_counts}")
Missing values per column:
paed_ed_attends    0
dtype: int64 

Number of duplicate dates: 0
Number of missing dates in daily sequence: 0
Negative attendance values: 0
Non-integer attendance values: 0

3.3 Train Test Split¶

The final 28 days of the available time series were reserved as a hold-out test set. This test set represents the future period for which staffing decisions would need to be made in practice.

The test data were not used during exploratory analysis, model fitting, or model selection. All model development and comparison were carried out using the remaining historical data (the training set), ensuring that forecast performance is evaluated on genuinely unseen observations.

In [26]:
# ------------------------------------------------------------
# 3.3 Train-Test split
# ------------------------------------------------------------

HORIZON = 28

ts_full = df["paed_ed_attends"].astype(float)
ts_train = ts_full.iloc[:-HORIZON]
ts_test = ts_full.iloc[-HORIZON:]

# Print summary
print(f"Total observations: {len(ts_full)}")
print(f"Training observations: {len(ts_train)}")
print(f"Test observations: {len(ts_test)}")

print("\nTraining period:")
print(f"  {ts_train.index.min().date()} to {ts_train.index.max().date()}")

print("\nTest period (held out):")
print(f"  {ts_test.index.min().date()} to {ts_test.index.max().date()}")
Total observations: 1056
Training observations: 1028
Test observations: 28

Training period:
  2014-04-01 to 2017-01-22

Test period (held out):
  2017-01-23 to 2017-02-19

3.4 Overview of Time Series Behaviour¶

Attendances show day-to-day variability with no strong long-term trend, but with periodic peaks that may reflect winter respiratory illness.

In [27]:
# ------------------------------------------------------------
# 3.4 Visualise the data
# ------------------------------------------------------------

# Line plot of training data only
plt.figure(figsize=(12, 4))
plt.plot(ts_train.index, ts_train.values)
plt.xlabel("Date")
plt.ylabel("Daily paediatric ED attendances")
plt.title("Daily paediatric ED attendances over time (training data only)")
plt.tight_layout()
plt.show()
[Figure: Daily paediatric ED attendances over time (training data only)]

3.5 Seasonal effects¶

To explore longer-term seasonal effects, mean daily attendances per month were aggregated across years. Peaks in November and March suggest seasonal effects consistent with winter respiratory illness.

In [28]:
# ------------------------------------------------------------
# 3.5.1 Visualise seasonality by calendar month
# ------------------------------------------------------------

# Convert series to DataFrame for feature engineering
train_month = ts_train.to_frame(name="paed_ed_attends")

# Add month information
train_month["month"] = train_month.index.month
train_month["month_name"] = train_month.index.month_name()

# Calculate mean daily attendances per calendar month
monthly_mean = (
    train_month.groupby(["month", "month_name"])["paed_ed_attends"]
    .mean()
    .reset_index()
    .sort_values("month")
)

# Plot mean daily attendances by month
plt.figure(figsize=(8, 4))
plt.plot(monthly_mean["month_name"], monthly_mean["paed_ed_attends"], marker="o")
plt.xlabel("Month")
plt.ylabel("Mean daily attendances")
plt.title("Mean daily paediatric ED attendances by month (training data)")
plt.xticks(rotation=45)
plt.tight_layout()
plt.show()
[Figure: Mean daily paediatric ED attendances by month (training data)]

3.5.2 Short term effects¶

To examine within-week variation, attendances were grouped by day of week and summarised using a boxplot. A weekly pattern is suggested, with higher attendances on Sundays and Mondays.

In [29]:
# ------------------------------------------------------------
# 3.5.2 Visualise seasonality by day of week
# ------------------------------------------------------------

# Convert series to DataFrame
train_dayofweek = ts_train.to_frame(name="paed_ed_attends")

# Add day-of-week
train_dayofweek["day_name"] = train_dayofweek.index.day_name()

# Order for days of the week
weekday_order = [
    "Monday",
    "Tuesday",
    "Wednesday",
    "Thursday",
    "Friday",
    "Saturday",
    "Sunday",
]

train_dayofweek["day_name"] = pd.Categorical(
    train_dayofweek["day_name"], categories=weekday_order, ordered=True
)

# Boxplot by day of week (pandas boxplot with `by` creates its own figure,
# so pass figsize here rather than calling plt.figure first, which would
# leave an empty figure behind)
train_dayofweek.boxplot(
    column="paed_ed_attends", by="day_name", grid=False, showfliers=False,
    figsize=(8, 4),
)
plt.suptitle("")
plt.title("Paediatric ED attendances by day of week (training data)")
plt.xlabel("Day of week")
plt.ylabel("Daily attendances")
plt.tight_layout()
plt.show()
[Figure: Paediatric ED attendances by day of week (training data)]

3.6 Distribution and variability¶

The distribution of daily attendances was examined. Observations cluster around a central range. There are occasional higher-demand days. There are no extreme outliers. Inspection of rolling statistics suggests variability is broadly stable over time.

These characteristics support the use of absolute-error-based evaluation metrics such as mean absolute error (MAE).

In [30]:
# ------------------------------------------------------------
# 3.6.1 Visualise distribution of daily attendances
# ------------------------------------------------------------

# Histogram of daily attendances (distribution)
plt.figure(figsize=(8, 4))
plt.hist(ts_train, bins=30)
plt.xlabel("Daily attendances")
plt.ylabel("Frequency")
plt.title("Distribution of daily paediatric ED attendances (training data)")
plt.tight_layout()
plt.show()
[Figure: Distribution of daily paediatric ED attendances (training data)]
In [31]:
# ------------------------------------------------------------
# 3.6.2 Visualise rolling mean and variability
# ------------------------------------------------------------

# Rolling mean and variability of daily attendances (line plot)
rolling_mean = ts_train.rolling(30).mean()
rolling_std = ts_train.rolling(30).std()

plt.figure(figsize=(12, 4))
plt.plot(rolling_mean, label="30-day rolling mean")
plt.plot(rolling_std, label="30-day rolling std")
plt.legend()
plt.title("Rolling mean and variability (training data)")
plt.tight_layout()
plt.show()
[Figure: Rolling mean and variability (training data)]

3.7 Implications for Forecasting¶

In summary, daily paediatric emergency department attendances show clear seasonal patterns. Winter months tend to be busier than summer months, and across the week attendances are highest on Sundays and Mondays. Day-to-day attendance numbers vary considerably, but this variability appears broadly stable over time. There is no clear evidence of a sustained long-term increase or decrease in attendances over the study period. Taken together, these findings suggest a forecasting approach that makes use of recent observations and seasonally similar days.
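The idea of borrowing from seasonally similar days can be sketched as a simple baseline: forecast each future day as the average of the last few observations on the same weekday. A minimal standalone sketch with invented values (an illustration of the idea, not one of the models evaluated below):

```python
import pandas as pd
import numpy as np

# Toy history with a repeating weekly pattern; values are invented.
idx = pd.date_range("2016-01-04", periods=35, freq="D")  # starts on a Monday
values = np.tile([60, 45, 44, 46, 48, 50, 58], 5).astype(float)
history = pd.Series(values, index=idx)


def seasonal_mean_forecast(history: pd.Series, horizon: int, n_weeks: int = 4) -> pd.Series:
    """Forecast each future day as the mean of the last `n_weeks` same-weekday values."""
    future_idx = pd.date_range(
        history.index[-1] + pd.Timedelta(days=1), periods=horizon, freq="D"
    )
    preds = []
    for d in future_idx:
        same_weekday = history[history.index.dayofweek == d.dayofweek]
        preds.append(same_weekday.iloc[-n_weeks:].mean())
    return pd.Series(preds, index=future_idx)


print(seasonal_mean_forecast(history, horizon=7))
```

With a purely repeating weekly pattern this baseline reproduces the pattern exactly; on real data it smooths out day-level noise while retaining the weekly shape.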

4. Forecasting Framework¶

This section outlines the approach used to evaluate forecasting models.

4.1 Forecasting Task Definition¶

The forecasting task is to predict daily paediatric emergency department attendances over a 28-day horizon. This horizon reflects the Trust’s operational need to plan staffing levels several weeks in advance, balancing rota preparation with the inherent uncertainty of emergency care demand.

The primary objective of the forecasting exercise is therefore short-term accuracy, rather than long-term trend estimation. Forecasts are required at a daily resolution, and performance is assessed in terms of how closely predicted attendances match observed values over the forecast horizon.

4.2 Error Metrics¶

Forecast accuracy was evaluated using three error metrics. Mean Absolute Error (MAE) measures the average absolute difference between observed and forecast values, providing a direct and easily interpretable measure of typical forecast error in the original units of the data.

Root Mean Squared Error (RMSE) also measures forecast error in the original units, but squares errors before averaging, penalising larger errors more heavily. This makes RMSE sensitive to large deviations and useful when large forecast errors are undesirable, such as during periods of peak demand.

Symmetric Mean Absolute Percentage Error (sMAPE) expresses forecast error as a percentage of the average of observed and forecast values, allowing performance to be compared across different scales.

Considering these metrics together allows selection of a model that performs well across different aspects of forecast accuracy.

In [32]:
# ------------------------------------------------------------
# 4.2 Error metric functions
# ------------------------------------------------------------


def mae(y_true, y_pred):
    """
    Compute Mean Absolute Error (MAE).

    MAE measures the average absolute difference between observed
    and predicted values, expressed in the original units of the data.
    """
    return float(np.mean(np.abs(y_true - y_pred)))


def rmse(y_true, y_pred):
    """
    Compute Root Mean Squared Error (RMSE).

    RMSE penalises larger errors more heavily than MAE and is sensitive
    to occasional large forecast deviations.
    """
    return float(np.sqrt(np.mean((y_true - y_pred) ** 2)))


def smape(y_true, y_pred):
    """
    Compute Symmetric Mean Absolute Percentage Error (sMAPE).

    sMAPE provides a scale-free measure of forecast accuracy by expressing
    errors as a percentage of the average magnitude of observed and
    predicted values.
    """
    denom = (np.abs(y_true) + np.abs(y_pred)) / 2.0
    denom = np.where(denom == 0, 1e-8, denom)
    return float(np.mean(np.abs(y_true - y_pred) / denom) * 100)
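As a quick sanity check on these definitions, the three metrics can be computed by hand on a toy example (values invented for illustration; the arithmetic mirrors the functions defined above):

```python
import numpy as np

# Three days of observed vs forecast attendances (invented values).
y_true = np.array([50.0, 40.0, 60.0])
y_pred = np.array([45.0, 45.0, 55.0])

# MAE: every forecast is 5 patients off, so the MAE is 5.
mae_val = np.mean(np.abs(y_true - y_pred))

# RMSE: with identical absolute errors, RMSE equals MAE here.
rmse_val = np.sqrt(np.mean((y_true - y_pred) ** 2))

# sMAPE: each error is divided by the average of the observed and
# forecast values for that day, then the ratios are averaged.
denom = (np.abs(y_true) + np.abs(y_pred)) / 2.0
smape_val = np.mean(np.abs(y_true - y_pred) / denom) * 100

print(mae_val, rmse_val, round(smape_val, 2))  # 5.0 5.0 10.33
```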

4.3 Cross-Validation Strategy¶

Model performance was evaluated using rolling-origin cross-validation with an expanding training window. An initial training window of two years (730 days) was used to ensure that models were exposed to multiple seasonal cycles. At each forecast origin, models were trained on all available observations up to that date and used to generate a 28-day multi-step forecast.

The forecast origin was advanced forward by one day at each iteration (step = 1), producing a sequence of overlapping forecast evaluations. Although adjacent folds are highly correlated, this approach provides a smooth and comprehensive assessment of model performance over time and across all seasonal positions.

Cross-validation results were stored in long format, with one row per forecast origin and per forecast horizon step. This structure allows analysis of how accuracy evolves with increasing lead time.

Aggregate accuracy metrics (MAE, RMSE, and sMAPE) were subsequently derived from the long-format output by averaging errors across forecast horizons within each origin. This allowed both horizon-level and origin-level performance to be examined without repeated model refitting.

In [33]:
# ------------------------------------------------------------
# 4.3 Cross-Validation
# ------------------------------------------------------------

INITIAL_WINDOW = 365 * 2
STEP = 1


def rolling_origin_cv(
    series, horizon=28, initial_window=365 * 2, step=1, forecaster=None
):
    """
    Perform rolling-origin cross-validation using an expanding training window.

    At each forecast origin, the model is trained on all observations up to
    that origin and used to generate a multi-step forecast of length
    `horizon`. The forecast origin is then advanced forward by `step`
    observations and the process is repeated until the end of the series
    is reached.

    This function returns results in "long format", with one row per
    forecast origin and per forecast horizon step. This structure enables
    flexible analysis, including horizon-specific error evaluation
    and aggregation into summary metrics.

    Parameters
    ----------
    series : pd.Series
        Univariate time series indexed by datetime.
    horizon : int, default=28
        Number of future time steps to forecast at each origin.
    initial_window : int, default=365*2
        Number of observations used in the initial training window.
        The training window expands at each iteration.
    step : int, default=1
        Number of observations by which the forecast origin is advanced
        between successive folds.
    forecaster : callable
        Function of the form:
            forecaster(train_series, horizon) -> array-like
        Must return a forecast of length `horizon`.

    Returns
    -------
    pd.DataFrame
        Long-format cross-validation results with columns:
        - origin_date : first timestamp of the test window
        - h           : forecast lead time (1 to horizon)
        - y_true      : observed value
        - y_pred      : forecast value
        - abs_error   : absolute error at that horizon
        - sq_error    : squared error at that horizon
    """

    series = series.dropna()
    n = len(series)
    if initial_window + horizon > n:
        raise ValueError("initial_window + horizon > series length")

    results = []
    last_origin_start = n - horizon

    for origin_end in range(initial_window, last_origin_start + 1, step):
        train_series = series.iloc[:origin_end]
        test_slice = series.iloc[origin_end : origin_end + horizon]

        y_pred = np.asarray(forecaster(train_series, horizon), dtype=float)
        y_true = test_slice.values.astype(float)

        origin_date = test_slice.index[0]
        abs_err = np.abs(y_true - y_pred)
        sq_err = (y_true - y_pred) ** 2

        for h in range(1, horizon + 1):
            results.append(
                {
                    "origin_date": origin_date,
                    "h": h,
                    "y_true": y_true[h - 1],
                    "y_pred": y_pred[h - 1],
                    "abs_error": abs_err[h - 1],
                    "sq_error": sq_err[h - 1],
                }
            )

    return pd.DataFrame(results)


def cv_summarise(cv_long: pd.DataFrame) -> pd.DataFrame:
    """
    Create summary metrics from long-format cross-validation results.

    This function computes forecast accuracy metrics by
    averaging errors across all forecast horizons within each origin.
    It derives MAE, RMSE, and sMAPE from the error terms stored
    in the long-format output.

    Parameters
    ----------
    cv_long : pd.DataFrame
        Long-format cross-validation output generated by
        `rolling_origin_cv`.

    Returns
    -------
    pd.DataFrame
        Short summary with one row per forecast origin containing:
        - MAE   : mean absolute error across all horizons
        - RMSE  : root mean squared error across all horizons
        - sMAPE : symmetric mean absolute percentage error (%)
    """
    # Define sMAPE at the per-row level then average per origin.
    denom = np.abs(cv_long["y_true"]) + np.abs(cv_long["y_pred"])
    smape_row = np.where(
        denom == 0, 0.0, 200.0 * np.abs(cv_long["y_true"] - cv_long["y_pred"]) / denom
    )
    tmp = cv_long.assign(smape_row=smape_row)

    short = tmp.groupby("origin_date", as_index=False).agg(
        MAE=("abs_error", "mean"),
        RMSE=("sq_error", lambda x: float(np.sqrt(np.mean(x)))),
        sMAPE=("smape_row", "mean"),
    )
    return short
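To make the fold geometry concrete, here is a standalone toy sketch of the same expanding-window logic (deliberately small numbers, independent of the functions above):

```python
# Expanding-window rolling-origin folds for a 12-observation series:
# first train on observations 0..5, test on 6..8; then advance the
# origin by `step` and train on 0..7, test on 8..10.
n, initial_window, horizon, step = 12, 6, 3, 2

folds = []
last_origin_start = n - horizon
for origin_end in range(initial_window, last_origin_start + 1, step):
    train_idx = list(range(0, origin_end))
    test_idx = list(range(origin_end, origin_end + horizon))
    folds.append((train_idx, test_idx))

for train_idx, test_idx in folds:
    print(f"train 0..{train_idx[-1]}  ->  test {test_idx[0]}..{test_idx[-1]}")
```

In the notebook's actual configuration (`initial_window=730`, `step=1`, `horizon=28`) the same loop produces one fold per day from day 730 onwards.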

5. Benchmark Models (Naïve Methods)¶

5.1 Rationale for Benchmark Models¶

In time series forecasting, naïve methods often perform well, particularly when strong seasonal patterns are present. These methods provide a useful reference point for evaluating whether more complex models offer meaningful improvement.

5.2.1 Naïve (Last Observation) Forecast¶

The naïve forecast assumes that future attendances will be equal to the most recently observed value.

5.2.2 Seasonal Naïve (Weekly) Forecast¶

The seasonal naïve forecast accounts for the observed weekly pattern in attendances. Forecasts are generated by repeating the values observed in the most recent week, so that, for example, a future Monday is forecast using the most recent Monday’s attendance.

5.3 Benchmark Model Implementation¶

This code defines the naïve and seasonal naïve forecasting functions, which take historical attendance data as input and return a 28-day forecast.

In [34]:
# ------------------------------------------------------------
# 5.3 Benchmark forecasters
# ------------------------------------------------------------


def forecast_naive1(train_series: pd.Series, horizon: int) -> np.ndarray:
    """
    Naive benchmark forecaster (NF1).

    Forecasts all future time steps as the last observed value in the
    training series.
    """
    last_val = float(train_series.iloc[-1])
    return np.repeat(last_val, horizon)


def forecast_snaive_weekly(train_series: pd.Series, horizon: int) -> np.ndarray:
    """
    Seasonal naive benchmark forecaster (weekly).

    Forecasts future values by repeating the most recent observed
    weekly pattern (last 7 days).
    """
    season_length = 7
    last_week = train_series.iloc[-season_length:].to_numpy(dtype=float)
    reps = int(np.ceil(horizon / season_length))
    return np.tile(last_week, reps)[:horizon]
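The tiling step in forecast_snaive_weekly can be seen in isolation. A standalone sketch with invented values, showing how np.tile plus slicing also handles horizons that are not a multiple of seven:

```python
import numpy as np

# Last observed week (invented values, one per weekday).
last_week = np.array([58.0, 60.0, 45.0, 44.0, 46.0, 48.0, 50.0])

horizon = 10  # deliberately not a multiple of 7
reps = int(np.ceil(horizon / 7))       # enough full-week repeats to cover the horizon
forecast = np.tile(last_week, reps)[:horizon]  # then truncate to the horizon

print(forecast)  # the 7-day pattern, then the first 3 values repeated
```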

5.4 Benchmark Model Evaluation¶

Benchmark models were evaluated using rolling-origin cross-validation, with accuracy assessed using mean absolute error (MAE) across the 28-day forecast horizon. The naïve and weekly seasonal naïve benchmarks performed almost identically, with very similar overall MAE (9.31 vs 9.33). The seasonal naïve model produced slightly smoother forecasts and narrower prediction intervals across lead times, and was adopted as the benchmark for comparison.

In [35]:
# ------------------------------------------------------------
# 5.4.1 Benchmark Model Evaluation (Rolling origin CV on training data)
# ------------------------------------------------------------
y_train = ts_train

cv_naive1 = rolling_origin_cv(
    series=y_train,
    initial_window=INITIAL_WINDOW,
    step=STEP,
    forecaster=forecast_naive1,
)

cv_snaive = rolling_origin_cv(
    series=y_train,
    initial_window=INITIAL_WINDOW,
    step=STEP, 
    forecaster=forecast_snaive_weekly,
)


# Overall MAE across all origins and horizons
summary = pd.DataFrame(
    {
        "Model": ["Naive1 (last value)", "Seasonal Naive (weekly)"],
        "Mean MAE (h=1..28)": [
            cv_naive1["abs_error"].mean(),
            cv_snaive["abs_error"].mean(),
        ],
    }
).sort_values("Mean MAE (h=1..28)")

display(summary)
   Model                     Mean MAE (h=1..28)
0  Naive1 (last value)                 9.308777
1  Seasonal Naive (weekly)             9.329863
In [36]:
# ------------------------------------------------------------
# 5.4.2 visualise horizon-wise accuracy
# ------------------------------------------------------------

# Horizon-wise MAE
mae_by_h_naive1 = cv_naive1.groupby("h")["abs_error"].mean().reset_index(name="MAE")
mae_by_h_snaive = cv_snaive.groupby("h")["abs_error"].mean().reset_index(name="MAE")

# Plot horizon-wise MAE
plt.figure(figsize=(8, 4))
plt.plot(mae_by_h_naive1["h"], mae_by_h_naive1["MAE"], label="Naive1")
plt.plot(
    mae_by_h_snaive["h"],
    mae_by_h_snaive["MAE"],
    label="Seasonal Naive (weekly)",
)
plt.xlabel("Forecast lead time (days ahead)")
plt.ylabel("Mean Absolute Error (MAE)")
plt.xticks(range(1, 29, 3))
plt.title("Benchmark accuracy by forecast horizon")
plt.legend()
plt.tight_layout()
plt.show()
[Figure: Benchmark accuracy by forecast horizon]

6. Candidate Forecasting Model¶

6.1 Choice of model¶

Three advanced forecasting approaches were initially considered. SARIMAX models temporal dependence and seasonality within a statistical time-series framework. Prophet is an additive regression model designed for operational forecasting, combining trend, seasonality, and changepoint detection. A neural network model was also explored, using lagged observations and calendar features to capture non-linear patterns.

The neural network was excluded after preliminary evaluation, as it showed poor and unstable out-of-sample performance, probably due to error accumulation in recursive multi-step forecasting. The analysis therefore focused on SARIMAX and Prophet.
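The error-accumulation problem arises because recursive multi-step forecasts feed each prediction back in as the input for the next step. A minimal sketch with a fixed AR(1) coefficient (phi = 0.8 is illustrative, not estimated from the data):

```python
# Recursive multi-step forecasting with a hand-picked AR(1) coefficient.
# Each step uses the previous *prediction* rather than an observation,
# so any error made early on propagates through the rest of the horizon.
phi = 0.8
last_observed = 10.0  # deviation from the series mean, toy value

preds = []
prev = last_observed
for _ in range(5):
    prev = phi * prev  # step h depends on the prediction at step h-1
    preds.append(prev)

print([round(p, 2) for p in preds])  # [8.0, 6.4, 5.12, 4.1, 3.28]
```

The same mechanism explains why, for SARIMAX too, uncertainty grows with lead time: beyond the first few steps the model is extrapolating from its own output.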

6.2 SARIMAX¶

6.2.1 SARIMAX order selection¶

Model orders were selected using auto_arima, which identifies optimal non-seasonal and seasonal parameters by minimising an information criterion (AIC). This approach specifies the autoregressive (AR), differencing (I), and moving-average (MA) components while avoiding overfitting.

The selected specification was SARIMAX(1,1,2)(0,0,2)[7].

The non-seasonal component (1,1,2) indicates:

  • d = 1: First-order differencing was applied to remove non-stationarity in the level of the series.

  • p = 1: A first-order autoregressive term captures short-term persistence in daily observations.

  • q = 2: Two moving-average terms account for short-term dependence on recent forecast errors.

The seasonal component (0,0,2)[7] introduces a weekly seasonal moving-average structure with period 7 days, capturing within-week patterns in demand.
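To make the d = 1 component concrete, first-order differencing replaces each value with its change from the previous day; applied to the opening values of the series from section 3.1:

```python
import pandas as pd

# First five observations of the series (from section 3.1).
s = pd.Series([47, 46, 47, 48, 52])

# First-order differencing: each value minus the previous one.
# The first element has no predecessor, so it becomes NaN.
print(s.diff().tolist())  # [nan, -1.0, 1.0, 1.0, 4.0]
```

SARIMAX fits its AR and MA terms to this differenced series, which removes a slowly drifting level without needing to model it explicitly.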

In [37]:
# ------------------------------------------------------------
# 6.2.1 SARIMAX Order Selection Using auto-ARIMA
# ------------------------------------------------------------

y = ts_train.astype(float)

y0 = y.iloc[:INITIAL_WINDOW]

auto_model = auto_arima(
    y0,
    seasonal=True,
    m=7,
    stepwise=True,
    suppress_warnings=True,
    error_action="ignore",
)

ORDER = auto_model.order
SEASONAL_ORDER = auto_model.seasonal_order

print("Selected order:", ORDER)
print("Selected seasonal_order:", SEASONAL_ORDER)
Selected order: (1, 1, 2)
Selected seasonal_order: (0, 0, 2, 7)

6.2.2 SARIMAX forecasting function¶

The forecasting function refits the selected SARIMAX model to the available training data at each forecast origin.

Multi-step forecasts are generated recursively from the fitted autoregressive and seasonal structure. As the forecast horizon increases, predictions depend progressively on prior forecasts rather than observed data, resulting in increasing uncertainty and error.

In [38]:
# ------------------------------------------------------------
# 6.2.2 SARIMAX forecasting function
# ------------------------------------------------------------


def forecast_sarimax(
    train_series: pd.Series, horizon: int, order=ORDER, seasonal_order=SEASONAL_ORDER
) -> np.ndarray:
    """
    Fit a SARIMAX model to the training series and produce a multi-step forecast.

    The model is refitted at each call using the supplied training data and
    pre-selected ARIMA and seasonal orders. This function is intended for use
    within a rolling-origin cross-validation framework, where the training
    window expands over time.

    Parameters
    ----------
    train_series : pd.Series
        Univariate time series of daily paediatric ED attendances, indexed by date.
    horizon : int
        Number of days ahead to forecast.
    order : tuple
        Non-seasonal ARIMA order (p, d, q).
    seasonal_order : tuple
        Seasonal ARIMA order (P, D, Q, m), where m is the seasonal period.

    Returns
    -------
    np.ndarray
        Array of length `horizon` containing the point forecasts.
    """
    model = SARIMAX(
        train_series.astype(float),
        order=order,
        seasonal_order=seasonal_order,
        enforce_stationarity=False,
        enforce_invertibility=False,
    )
    fit = model.fit(disp=False)
    preds = fit.forecast(steps=horizon)
    return preds.to_numpy(dtype=float)

6.3 Prophet¶

Prophet is a decomposable time series model that represents the observed series as the sum of trend, seasonal, and irregular components. The model specifies a piecewise linear trend with automatically selected changepoints and models weekly and yearly seasonality using Fourier series terms. This structure allows the model to capture gradual structural shifts and flexible cyclical patterns without requiring strict stationarity assumptions.

For cross-validation, the training data were reformatted into Prophet’s required structure (with ds and y columns), and the model was refitted at each forecast origin using an expanding training window. Multi-step forecasts were then generated directly from the estimated trend and seasonal components for the subsequent 28 days.

This approach enables Prophet to produce stable multi-step forecasts by extrapolating the estimated structural components rather than relying solely on autoregressive memory.

In [39]:
# ------------------------------------------------------------
# 6.3 Prophet functions
# ------------------------------------------------------------


def to_prophet_df(y_series: pd.Series) -> pd.DataFrame:
    """
    Convert a time series into Prophet-compatible DataFrame format.

    Parameters
    ----------
    y_series : pd.Series
        Univariate time series indexed by date.

    Returns
    -------
    pd.DataFrame
        DataFrame with columns:
        - 'ds': datestamps
        - 'y' : observed values
    """
    df = pd.DataFrame({"ds": y_series.index, "y": y_series.values})
    return df


def fit_predict_prophet(y_train: pd.Series, horizon: int):
    """
    Fit a Prophet model to the training data and generate a multi-step forecast.

    The model includes weekly and yearly seasonality and is refitted each time
    the function is called. This design supports use within a rolling-origin
    cross-validation framework.

    Parameters
    ----------
    y_train : pd.Series
        Training time series of daily paediatric ED attendances.
    horizon : int
        Number of days ahead to forecast.

    Returns
    -------
    tuple
        - np.ndarray of length `horizon` containing point forecasts
        - fitted Prophet model object
    """
    df_train = to_prophet_df(y_train)

    model = Prophet(
        weekly_seasonality=True, yearly_seasonality=True, daily_seasonality=False
    )
    model.fit(df_train)

    future = model.make_future_dataframe(periods=horizon, freq="D")
    forecast = model.predict(future)

    preds = forecast["yhat"].iloc[-horizon:].to_numpy()
    return preds, model


def forecast_prophet(train_series: pd.Series, horizon: int) -> np.ndarray:
    """
    Wrapper function to produce Prophet forecasts for rolling-origin CV.

    Parameters
    ----------
    train_series : pd.Series
        Training time series indexed by date.
    horizon : int
        Number of days ahead to forecast.

    Returns
    -------
    np.ndarray
        Array of length `horizon` containing the point forecasts.
    """
    preds, _ = fit_predict_prophet(train_series, horizon)
    return preds

6.4 Model comparison¶

Each forecasting method was evaluated using the same rolling-origin cross-validation scheme on the training data.

For every model, forecasts were generated at multiple forecast origins and summarised using MAE, RMSE, and sMAPE over the full 28-day horizon (Fig 6.5.1).
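The three metrics can be computed as below; this is a minimal sketch with illustrative function names (not the notebook's helpers), and note that sMAPE has several variants in the literature, of which one common definition is shown.

```python
import numpy as np

def mae(y_true: np.ndarray, y_pred: np.ndarray) -> float:
    """Mean absolute error."""
    return float(np.mean(np.abs(y_true - y_pred)))

def rmse(y_true: np.ndarray, y_pred: np.ndarray) -> float:
    """Root mean squared error."""
    return float(np.sqrt(np.mean((y_true - y_pred) ** 2)))

def smape(y_true: np.ndarray, y_pred: np.ndarray) -> float:
    """Symmetric MAPE in percent (one common definition)."""
    denom = (np.abs(y_true) + np.abs(y_pred)) / 2.0
    return float(np.mean(np.abs(y_true - y_pred) / denom) * 100.0)

# Example: two days, errors of ±10 around an observed value of 100
y_true = np.array([100.0, 100.0])
y_pred = np.array([90.0, 110.0])
```

Because sMAPE divides by the average of the observed and predicted values, it is scale-free, which makes it convenient for comparing models on attendance counts of varying magnitude.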

Lead-time error analysis requires horizon-wise cross-validation results and was therefore conducted using the long-format rolling-origin output (Fig 6.5.2).
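The long-format design can be sketched as follows. This is an illustration, not the notebook's `rolling_origin_cv` implementation; the column names `h` and `abs_error` are inferred from their use in the lead-time analysis below, and the toy naïve forecaster is purely for demonstration.

```python
import numpy as np
import pandas as pd

def rolling_origin_cv_sketch(y, initial_window, step, forecaster, horizon=28):
    """Walk the forecast origin forward through the series, refitting and
    scoring at each step. Returns long-format rows: one per (origin, h)."""
    rows = []
    origin = initial_window
    while origin + horizon <= len(y):
        train = y.iloc[:origin]
        preds = np.asarray(forecaster(train, horizon))
        actual = y.iloc[origin:origin + horizon].to_numpy()
        for h in range(1, horizon + 1):
            rows.append({
                "origin": origin,
                "h": h,                                    # lead time in days
                "y_true": actual[h - 1],
                "y_pred": preds[h - 1],
                "abs_error": abs(actual[h - 1] - preds[h - 1]),
            })
        origin += step
    return pd.DataFrame(rows)

# Toy example: a rising series and a "repeat the last value" forecaster
y = pd.Series(np.arange(40, dtype=float))
naive = lambda train, h: np.repeat(train.iloc[-1], h)
cv = rolling_origin_cv_sketch(y, initial_window=10, step=7,
                              forecaster=naive, horizon=7)
```

One row per origin-and-lead-time pair is what allows error to be grouped either by origin (for the summary metrics) or by `h` (for the lead-time chart).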

In [40]:
# ------------------------------------------------------------
# 6.4 Cross-Validated Model Comparison
# ------------------------------------------------------------

y = ts_train.astype(float)

# run CV once per model to get long-format results
cv_snaive = rolling_origin_cv(y, initial_window=INITIAL_WINDOW, step=STEP, forecaster=forecast_snaive_weekly)
cv_sarimax = rolling_origin_cv(y, initial_window=INITIAL_WINDOW, step=STEP, forecaster=forecast_sarimax)
cv_prophet = rolling_origin_cv(y, initial_window=INITIAL_WINDOW, step=STEP, forecaster=forecast_prophet)

# Summarise into short format (one row per origin)
cv_snaive_summary = cv_summarise(cv_snaive)
cv_sarimax_summary = cv_summarise(cv_sarimax)
cv_prophet_summary = cv_summarise(cv_prophet)

# add model labels
cv_snaive["model"] = cv_snaive_summary["model"] = "SNaive_weekly"
cv_sarimax["model"] = cv_sarimax_summary["model"] = "SARIMAX_auto"
cv_prophet["model"] = cv_prophet_summary["model"] = "Prophet"

# Combine cross-validation results from all models into single
# DataFrames to enable grouped comparison of performance metrics
cv_all = pd.concat([cv_snaive, cv_sarimax, cv_prophet], ignore_index=True)
cv_summary_all = pd.concat(
    [cv_snaive_summary, cv_sarimax_summary, cv_prophet_summary], ignore_index=True
)

# Summaries across all origins AND all horizons (h=1..28)
summary = cv_summary_all.groupby("model")[["MAE", "RMSE", "sMAPE"]].agg(["mean", "std"])
summary
Out[40]:
               MAE                  RMSE                 sMAPE
               mean      std        mean       std       mean       std
model
Prophet        6.317821  1.269248   7.853103   1.446243  12.680870  2.022300
SARIMAX_auto   7.824004  2.416947   9.628206   2.703484  15.622757  4.658216
SNaive_weekly  9.329863  2.557154  11.596437   2.884205  18.594940  4.653329
In [41]:
# ------------------------------------------------------------
# 6.5.1 Model Metrics Comparison Chart
# ------------------------------------------------------------

metrics = ["MAE", "RMSE", "sMAPE"]
order = ["SNaive_weekly", "SARIMAX_auto", "Prophet"]
colors = {
    "SNaive_weekly": "#4C72B0",   # blue
    "SARIMAX_auto": "#DD8452",    # orange
    "Prophet": "#55A868",         # green
}

# Summarise mean ± SD for each metric (named to avoid shadowing `summary` above)
metric_summary = {
    m: cv_summary_all.groupby("model")[m].agg(["mean", "std"]).reindex(order)
    for m in metrics
}

# Plot
fig, axes = plt.subplots(nrows=3, ncols=1, figsize=(8, 10))

x = np.arange(len(order))

for ax, m in zip(axes, metrics):
    s = metric_summary[m]
    bar_colors = [colors[model] for model in order]
    ax.bar(x, s["mean"].values, yerr=s["std"].values, capsize=4, color=bar_colors)
    ax.set_xticks(x)
    ax.set_xticklabels(order, rotation=0, ha="center")
    ax.set_ylabel(f"{m} (mean ± SD)")
    ax.set_title(m)

fig.suptitle("Fig 6.5.1: Rolling-origin CV forecast accuracy by model", y=0.98)
fig.tight_layout()
plt.show()
[Figure 6.5.1: Rolling-origin CV forecast accuracy (MAE, RMSE, sMAPE) by model]
In [42]:
# ------------------------------------------------------------
# 6.5.2 Model Lead Time Comparison Chart
# ------------------------------------------------------------

# Mean absolute error by lead time
mae_by_h = cv_all.groupby(["model", "h"])["abs_error"].mean().reset_index()

plt.figure(figsize=(8, 4))
for model in ["SNaive_weekly", "SARIMAX_auto", "Prophet"]:
    subset = mae_by_h[mae_by_h["model"] == model]
    plt.plot(subset["h"], subset["abs_error"], label=model, color=colors[model])

plt.xlabel("Forecast lead time (days)")
plt.ylabel("Mean absolute error")
plt.xticks(range(1, 29, 3))
plt.title("Fig 6.5.2: Forecast error by lead time")
plt.legend()
plt.tight_layout()
plt.show()
[Figure 6.5.2: Mean absolute forecast error by lead time, by model]

7. Model Selection and Forecasting Results¶

7.1 Model Selection¶

Figure 6.5.1 indicates that the Prophet model achieved the lowest mean MAE, RMSE, and sMAPE across cross-validation folds, outperforming both the Seasonal Naïve benchmark and the SARIMAX model. In addition to superior average accuracy, Prophet exhibited comparatively lower variability across folds, suggesting greater stability in performance over time.

Figure 6.5.2 further demonstrates that forecast error increases with lead time for all models, as expected in multi-step forecasting. However, the rate of degradation is substantially greater for the Seasonal Naïve and SARIMAX models, whereas Prophet maintains consistently lower error across most forecast horizons. This relative stability at longer lead times is particularly relevant for operational planning over multi-week periods.

On this basis, Prophet was selected as the preferred model for generating forecasts.

7.2 Final 28-Day Forecast¶

Following model selection, the Prophet model was refitted using the full available training dataset to maximise information used for parameter estimation. A 28-day multi-step forecast was then generated from the final fitted model.

The forecast includes point predictions for each day and associated 80% prediction intervals, derived from the model’s uncertainty estimates.

The resulting forecast is shown in Figure 7.1.

In [43]:
# ------------------------------------------------------------
# 7.2 Final 28-Day Forecast (Prophet)
# ------------------------------------------------------------

# Fit final model to full training data, not just the initial window.
y_full = ts_full.astype(float)

df_full = pd.DataFrame({"ds": pd.to_datetime(y_full.index), "y": y_full.values})


# Prophet's default interval_width of 0.80 yields the 80% prediction
# intervals reported with the forecast.
final_model = Prophet(
    weekly_seasonality=True, yearly_seasonality=True, daily_seasonality=False
)

final_model.fit(df_full)

# -------------------------------
# Forecast next 28 days
# -------------------------------
H = 28

future = final_model.make_future_dataframe(periods=H, freq="D")
forecast = final_model.predict(future)

fcst_28 = forecast.tail(H).copy()

forecast_mean = forecast["yhat"].iloc[-H:]
forecast_ci_lower = forecast["yhat_lower"].iloc[-H:]
forecast_ci_upper = forecast["yhat_upper"].iloc[-H:]

# -------------------------------
# Plot recent observations + forecast
# -------------------------------
plt.figure(figsize=(10, 4))

plt.plot(y_full.index[-90:], y_full.iloc[-90:], label="Recent observed")

plt.plot(fcst_28["ds"], fcst_28["yhat"], label=f"{H}-day forecast")

plt.fill_between(
    fcst_28["ds"],
    fcst_28["yhat_lower"],
    fcst_28["yhat_upper"],
    color="grey",
    alpha=0.3,
    label="80% Prediction interval",
)

plt.xlabel("Date")
plt.ylabel("Daily paediatric ED attendances")
plt.title(f"{H}-day forecast of paediatric ED attendances (Prophet)")
plt.legend()
plt.tight_layout()
plt.show()
[Figure 7.1: 28-day forecast of paediatric ED attendances (Prophet) with 80% prediction interval]

7.3 Interpretation of forecast¶

The forecast maintains clear weekly variation, consistent with historical seasonal patterns observed in the data. Predicted attendances fluctuate systematically across days of the week.

Demand is projected to rise over the 28-day horizon before stabilising toward the end of the period. This rise appears to be driven primarily by long-term seasonal structure rather than by an underlying trend.

The width of the 80% prediction interval remains broadly constant across the forecast horizon. While most daily attendances are expected to fall near the central estimate, occasional higher-demand days remain plausible near the upper bound of the interval. These projections may assist short-term operational planning, particularly staffing allocation on anticipated peak days.

8. Conclusions and Recommendations¶

This study evaluated short-term forecasting approaches for daily paediatric emergency department attendances to support operational planning within an NHS acute trust. Using a rolling-origin cross-validation framework, forecasting models were compared against naïve benchmarks over a 28-day horizon. The Prophet model consistently outperformed baseline methods and a SARIMAX alternative, providing lower forecast error while remaining interpretable and practical for routine use.

Based on these findings, the Trust is recommended to use the Prophet model as a short-term planning tool to inform paediatric ED staffing and escalation planning over a four-week horizon.

8.1 Strengths of this approach¶

The model’s treatment of weekly and yearly seasonality and ease of retraining make it well suited to operational NHS settings where forecasts must be updated regularly and understood by clinicians.

Prophet demonstrates superior performance across forecast horizons. This may be attributable to its flexible seasonal decomposition rather than trend modelling. By representing seasonality using Fourier terms, Prophet may produce smoother and more stable multi-step forecasts, whereas autoregressive models and seasonal naïve benchmarks accumulate error as the forecast horizon increases.
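This Fourier representation of seasonality can be illustrated directly. The sketch below is not Prophet's internal code, but shows the kind of sin/cos basis it constructs for a weekly seasonal component; the function name and order are illustrative.

```python
import numpy as np

def fourier_terms(t: np.ndarray, period: float, order: int) -> np.ndarray:
    """Sin/cos Fourier basis of the kind Prophet uses for seasonality.

    Returns an array with 2 * order columns; a fitted seasonal component
    is a learned weighted sum of these smooth periodic columns."""
    return np.column_stack([
        fn(2.0 * np.pi * k * t / period)
        for k in range(1, order + 1)
        for fn in (np.sin, np.cos)
    ])

t = np.arange(14, dtype=float)             # two weeks of daily time points
X = fourier_terms(t, period=7.0, order=3)  # weekly seasonality, order 3
```

Because every basis column repeats exactly with the period, the fitted weekly pattern is smooth and identical from one week to the next, which helps explain the stable multi-step behaviour noted above.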

8.2 Limitations¶

The main value of the forecasts is in identifying relative pressure and risk over upcoming weeks. Prediction intervals highlight substantial uncertainty in daily demand, and forecasts are best interpreted as indicative ranges of expected activity, helping services anticipate periods of elevated risk, rather than giving precise daily counts.

Rolling-origin cross-validation assumes that past performance is indicative of future behaviour under similar conditions. This assumption is reasonable for short-term operational planning but may not hold under regime change or structural disruption.

There is a risk of overfitting, as the model may capture patterns specific to the historical period that do not persist. In particular, unexpected structural shifts, policy changes, seasonal anomalies, or external shocks could reduce forecast accuracy. The absence of exogenous regressors (e.g., infectious disease outbreaks, weather variation) limits the model’s ability to respond to demand drivers not encoded in historical patterns. Consequently, forecasts should be interpreted as conditional on historical structure continuing.

8.3 Implications for staffing and operational planning¶

The 28-day forecasts are intended to support short-term staffing decisions. Forecast means can be used to anticipate relative pressure across upcoming weeks, while upper prediction bounds provide an indication of days where additional staffing flexibility or escalation capacity may be required. For example, periods where the upper prediction interval exceeds recent activity levels could trigger proactive review of rotas and contingency staffing arrangements.
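As an illustration of this trigger, the sketch below flags forecast days whose upper 80% bound exceeds a nominal capacity threshold. The `flag_escalation_days` helper, the toy forecast values, and the threshold are all hypothetical, chosen only to mirror the `ds`/`yhat`/`yhat_upper` columns of the Prophet forecast frame, not Trust policy.

```python
import pandas as pd

def flag_escalation_days(fcst: pd.DataFrame, threshold: float) -> pd.DataFrame:
    """Return forecast days whose upper 80% bound exceeds a capacity threshold."""
    mask = fcst["yhat_upper"] > threshold
    return fcst.loc[mask, ["ds", "yhat", "yhat_upper"]]

# Toy example with made-up attendance numbers
fcst = pd.DataFrame({
    "ds": pd.date_range("2024-01-01", periods=4, freq="D"),
    "yhat": [50.0, 55.0, 60.0, 52.0],
    "yhat_upper": [60.0, 72.0, 75.0, 63.0],
})
risk_days = flag_escalation_days(fcst, threshold=70.0)  # two days flagged
```

In practice the threshold would come from staffing capacity rather than a fixed number, and flagged days would prompt review of rotas and contingency cover rather than automatic escalation.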