Merge pull request #2 from ourownstory/objectify

abstract model as object
ourownstory · Nov 10, 2020 · b7cdc3d · b7cdc3d
2 parents cf0cb59 + ac60faf
commit b7cdc3d
Show file tree

Hide file tree

Showing 10 changed files with 676 additions and 249 deletions.
diff --git a/arnet/__init__.py b/arnet/__init__.py
@@ -1,6 +1,6 @@
 import logging
 
-log = logging.getLogger("AR-Net")
+log = logging.getLogger("ARNet")
 log.setLevel("INFO")
 # Create handlers
 c_handler = logging.StreamHandler()
@@ -16,8 +16,13 @@
 log.addHandler(c_handler)
 log.addHandler(f_handler)
 
-from .ar_net import init_ar_learner
-from .make_dataset import load_from_file, tabularize_univariate
-from .utils import pad_ar_params, estimate_noise, split_by_p_valid, nice_print_list
-from .utils import compute_sTPE, coeff_from_model
+# lazy imports ala fastai2 style (for nice print functionality)
+from fastai.basics import *
+from fastai.tabular.all import *
+
+from .ar_net import ARNet
+
+# from .ar_net_legacy import init_ar_learner
+from .utils_data import load_from_file, tabularize_univariate, estimate_noise, split_by_p_valid
+from .utils import pad_ar_params, nice_print_list, compute_sTPE, coeff_from_model
 from .plotting import plot_weights, plot_prediction_sample, plot_error_scatter
diff --git a/arnet/ar_net.py b/arnet/ar_net.py
@@ -1,152 +1,215 @@
+from dataclasses import dataclass, field
+import logging
 import os
-import torch
-
-## lazy imports ala fastai2 style (for nice print functionality)
-from fastai.basics import *
-from fastai.tabular.all import *
-
-## explicit imports (for reference)
-# from fastai.basics import Callback
-# from fastai.data.core import DataLoaders
-# from fastai.learner import Metric
-# from fastai.metrics import mse, mae
-# from fastai.tabular.core import TabularPandas, TabDataLoader
-# from fastai.tabular.learner import tabular_learner
-# from fastai.torch_core import to_detach
-# from fastai.data.transforms import Normalize
-
-## import arnet
-from arnet.make_dataset import load_from_file, tabularize_univariate
-from arnet.utils import pad_ar_params, estimate_noise, split_by_p_valid, nice_print_list, compute_sTPE, coeff_from_model
-from arnet.plotting import plot_weights, plot_prediction_sample, plot_error_scatter
-
-
-class SparsifyAR(Callback):
-    """Callback that adds regularization of first linear layer according to AR-Net paper"""
-
-    def __init__(self, est_sparsity, est_noise=1.0, reg_strength=0.02, **kwargs):
-        super().__init__(**kwargs)
-        self.lam = 0.0
-        if est_sparsity is not None:
-            self.lam = reg_strength * est_noise * (1.0 / est_sparsity - 1.0)
-
-    def after_loss(self):
-        if not self.training:
-            return
-        abs_weights = None
-        for layer in self.learn.model.modules():
-            if isinstance(layer, torch.nn.Linear):
-                abs_weights = torch.abs(layer.weight)
-                break
-        if abs_weights is None:
-            raise NotImplementedError("weight regualarization only implemented for model with Linear layer")
-        reg = torch.div(2.0, 1.0 + torch.exp(-3.0 * abs_weights.pow(1.0 / 3.0))) - 1.0
-        self.learn.loss += self.lam * torch.mean(reg)
-
-    _docs = dict(after_loss="Add regularization of first linear layer")
-
-
-class sTPE(Metric):
-    """ "
-    Symmetrical Total Percentage Error of learned weights compared to underlying AR coefficients.
-    Computed as the average over snapshots at each batch.
-    """
-
-    def __init__(self, ar_params, at_epoch_end=False):
-        self.ar_params = ar_params
-        self.at_epoch_end = at_epoch_end
-
-    def reset(self):
-        self.total, self.count = 0.0, 0
-        self.sTPE = None
-
-    def accumulate(self, learn):
-        self.sTPE = to_detach(
-            compute_sTPE(est=coeff_from_model(model=learn.model, reversed_weights=True), real=self.ar_params)
+import pandas as pd
+import matplotlib.pyplot as plt
+
+from fastai.data.core import DataLoaders
+from fastai.tabular.core import TabularPandas, TabDataLoader
+from fastai.tabular.learner import tabular_learner, TabularLearner
+from fastai.data.transforms import Normalize
+from fastai.learner import load_learner
+
+from arnet import utils, utils_data, plotting, fastai_mods
+
+log = logging.getLogger("ARNet")
+
+
+@dataclass
+class ARNet:
+    ar_order: int
+    sparsity: float = None
+    est_noise: float = None
+    start_reg_pct: float = 0.0
+    full_reg_pct: float = 0.5
+    n_forecasts: int = 1
+    n_epoch: int = 20
+    lr: float = None
+    loss_func: str = "huber"
+    train_bs: int = 32
+    valid_bs: int = 1024
+    valid_p: float = 0.1
+    ar_params: list = None
+    log_level: str = None
+
+    dls: DataLoaders = field(init=False)
+    learn: TabularLearner = field(init=False)
+    coeff: list = field(init=False)
+    df: pd.DataFrame = field(init=False)
+
+    def __post_init__(self):
+        if self.log_level is not None:
+            utils.set_logger_level(log, self.log_level)
+        self.loss_func = fastai_mods.get_loss_func(self.loss_func)
+        df = None
+
+    def tabularize(self, series):
+        if self.est_noise is None:
+            self.est_noise = utils_data.estimate_noise(series)
+            log.info("estimated noise of series: {}".format(self.est_noise))
+
+        df_all = utils_data.tabularize_univariate(series, self.ar_order, self.n_forecasts)
+
+        log.debug("tabularized df")
+        log.debug("df columns: {}".format(list(df_all.columns)))
+        log.debug("df shape: {}".format(df_all.shape))
+        # log.debug("df head(3): {}".format(df_all.head(3)))
+        self.df = df_all
+        return self
+
+    def make_datasets(
+        self,
+        series=None,
+        valid_p=None,
+        train_bs=None,
+        valid_bs=None,
+        normalize=False,
+    ):
+        if series is None:
+            if self.df is None:
+                raise ValueError("must pass a series.")
+        else:
+            self.tabularize(series)
+        valid_p = self.valid_p if valid_p is None else valid_p
+        train_bs = self.train_bs if train_bs is None else train_bs
+        valid_bs = self.valid_bs if valid_bs is None else valid_bs
+
+        procs = []
+        if normalize:
+            procs.append(Normalize)
+
+        df_all = self.df
+        splits = utils_data.split_by_p_valid(valid_p, len(df_all))
+        cont_names = [col for col in list(df_all.columns) if "x_" == col[:2]]
+        target_names = [col for col in list(df_all.columns) if "y_" == col[:2]]
+        tp = TabularPandas(
+            df_all,
+            procs=procs,
+            cat_names=None,
+            cont_names=cont_names,
+            y_names=target_names,
+            splits=splits,
         )
-        self.total += self.sTPE
-        self.count += 1
-
-    @property
-    def value(self):
-        if self.at_epoch_end:
-            return self.sTPE
-        return self.total / self.count if self.count != 0 else None
-
-    @property
-    def name(self):
-        return "sTPE of AR coeff"
-
-
-def init_ar_learner(
-    series,
-    ar_order,
-    n_forecasts=1,
-    valid_p=0.1,
-    sparsity=None,
-    ar_params=None,
-    train_bs=32,
-    valid_bs=128,
-    verbose=False,
-):
-    if sparsity is not None and sparsity == 1.0:
-        sparsity = None
-    df_all = tabularize_univariate(series, ar_order, n_forecasts)
-    est_noise = estimate_noise(series)
-
-    if verbose:
-        print("tabularized df")
-        print("df columns", list(df_all.columns))
-        print("df shape", df_all.shape)
-        # if nested_list: print("x_dim:", len(df_all['x'][0]), "y_dim:", len(df_all['y'][0]))
-        # print("df head(3)", df_all.head(3))
-        print("estimated noise of series", est_noise)
-
-    ## split
-    splits = split_by_p_valid(valid_p, len(df_all), verbose)
-
-    cont_names = [col for col in list(df_all.columns) if "x_" == col[:2]]
-    target_names = [col for col in list(df_all.columns) if "y_" == col[:2]]
-
-    ## preprocess?
-    # procs = [Normalize]
-    procs = []
-
-    tp = TabularPandas(df_all, procs=procs, cat_names=None, cont_names=cont_names, y_names=target_names, splits=splits)
-    if verbose:
-        print("cont var num", len(tp.cont_names), tp.cont_names)
-        # print(tp.iloc[0:5])
-
-    ### next: data loader, learner
-    trn_dl = TabDataLoader(tp.train, bs=train_bs, shuffle=True, drop_last=True)
-    val_dl = TabDataLoader(tp.valid, bs=valid_bs)
-    dls = DataLoaders(trn_dl, val_dl)
-
-    # if verbose:
-    #     print("showing batch")
-    #     print(dls.show_batch(show=False))
-
-    callbacks = []
-    if sparsity is not None:
-        callbacks.append(SparsifyAR(sparsity, est_noise))
-        if verbose:
-            print("reg lam: ", callbacks[0].lam)
-
-    metrics = [mae]
-    if ar_params is not None:
-        metrics.append(sTPE(ar_params, at_epoch_end=False))
-
-    tm_config = {"use_bn": False, "bn_final": False, "bn_cont": False}
-    learn = tabular_learner(
-        dls,
-        layers=[],  # Note: None defaults to [200, 100]
-        config=tm_config,  # None calls tabular_config()
-        n_out=len(target_names),  # None calls get_c(dls)
-        train_bn=False,  # passed to Learner
-        metrics=metrics,  # passed on to TabularLearner, to parent Learner
-        loss_func=mse,
-        cbs=callbacks,
-    )
-    if verbose:
-        print(learn.model)
-    return learn
+        log.debug("cont var num: {}, names: {}".format(len(tp.cont_names), tp.cont_names))
+
+        trn_dl = TabDataLoader(tp.train, bs=train_bs, shuffle=True, drop_last=True)
+        val_dl = TabDataLoader(tp.valid, bs=valid_bs)
+        self.dls = DataLoaders(trn_dl, val_dl)
+        log.debug("showing batch")
+        log.debug("{}".format(self.dls.show_batch(show=False)))
+        return self
+
+    def create_learner(
+        self,
+        sparsity=None,
+        ar_params=None,
+        loss_func=None,
+        start_reg_pct=None,
+        full_reg_pct=None,
+    ):
+        sparsity = self.sparsity if sparsity is None else sparsity
+        ar_params = self.ar_params if ar_params is None else ar_params
+        loss_func = self.loss_func if loss_func is None else fastai_mods.get_loss_func(loss_func)
+        start_reg_pct = self.start_reg_pct if start_reg_pct is None else start_reg_pct
+        full_reg_pct = self.full_reg_pct if full_reg_pct is None else full_reg_pct
+
+        metrics = ["MSE", "MAE"]
+        metrics = [fastai_mods.get_loss_func(m) for m in metrics]
+        if ar_params is not None:
+            metrics.append(fastai_mods.sTPE(ar_params, at_epoch_end=False))
+
+        callbacks = []
+        if sparsity is not None:
+            regularizer = fastai_mods.SparsifyAR(
+                sparsity,
+                self.est_noise,
+                start_pct=start_reg_pct,
+                full_pct=full_reg_pct,
+            )
+
+            callbacks.append(regularizer)
+            log.info("reg lam (max): {}".format(callbacks[0].lam_max))
+
+        tm_config = {"use_bn": False, "bn_final": False, "bn_cont": False}
+        self.learn = tabular_learner(
+            self.dls,
+            layers=[],  # Note: None defaults to [200, 100]
+            config=tm_config,  # None calls tabular_config()
+            n_out=self.n_forecasts,  # None calls get_c(dls)
+            train_bn=False,  # passed to Learner
+            metrics=metrics,  # passed on to TabularLearner, to parent Learner
+            loss_func=loss_func,
+            cbs=callbacks,
+        )
+        log.debug("{}".format(self.learn.model))
+        return self
+
+    def find_lr(self, plot=True):
+        if self.learn is None:
+            raise ValueError("create learner first.")
+        lr_at_min, lr_steep = self.learn.lr_find(start_lr=1e-6, end_lr=1, num_it=500, show_plot=plot)
+        if plot:
+            plt.show()
+        log.debug("lr at minimum: {}; (steepest lr: {})".format(lr_at_min, lr_steep))
+        lr = lr_at_min
+        log.info("Optimal learning rate: {}".format(lr))
+        self.lr = lr
+        return self
+
+    def fit(self, n_epoch=None, lr=None, cycles=1, plot=True):
+        n_epoch = self.n_epoch if n_epoch is None else n_epoch
+        lr = self.lr if lr is None else lr
+        if lr is None:
+            self.find_lr(plot=plot)
+            lr = self.lr
+        for i in range(0, cycles):
+            self.learn.fit_one_cycle(n_epoch=n_epoch, lr_max=lr, div=25.0, div_final=10000.0, pct_start=0.25)
+            lr = lr / 10
+            if plot:
+                self.learn.recorder.plot_loss()
+        if plot:
+            plt.show()
+        # record Coeff
+        self.coeff = utils.coeff_from_model(self.learn.model)
+        return self
+
+    def fit_with_defaults(self, series):
+        self.make_datasets(series)
+        self.create_learner()
+        self.fit(plot=False)
+        return self
+
+    def plot_weights(self, **kwargs):
+        plotting.plot_weights(
+            ar_val=self.ar_order,
+            weights=self.coeff[0],
+            ar=self.ar_params,
+            **kwargs,
+        )
+
+    def plot_fitted_obs(self, num_obs=100, **kwargs):
+        preds, y = self.learn.get_preds()
+        if num_obs is not None:
+            y = y[0:num_obs]
+            preds = preds[0:num_obs]
+        plotting.plot_prediction_sample(preds, y, **kwargs)
+
+    def plot_errors(self, **kwargs):
+        preds, y = self.learn.get_preds()
+        plotting.plot_error_scatter(preds, y, **kwargs)
+
+    def save_model(self, results_path="results", model_name=None):
+        # self.learn.freeze()
+        sparsity = 1.0 if self.sparsity is None else self.sparsity
+        if model_name is None:
+            model_name = "ar{}_sparse_{:.3f}_ahead_{}_epoch_{}.pkl".format(
+                self.ar_order, sparsity, self.n_forecasts, self.n_epoch
+            )
+        self.learn.export(fname=os.path.join(results_path, model_name))
+        return self
+
+    def load_model(self, results_path="results", model_name=None, cpu=True):
+        self.learn = load_learner(fname=os.path.join(results_path, model_name), cpu=cpu)
+        # can unfreeze the model and fine_tune
+        self.learn.unfreeze()
+        return self