Showing 7 changed files with 1,681 additions and 1,754 deletions.
@@ -0,0 +1,68 @@
import logging
import math
import os
from functools import partial
from typing import Any, Dict, List

import keras
import keras.ops as ops
from keras.callbacks import (
    Callback,
    CSVLogger,
    EarlyStopping,
    LearningRateScheduler,
    ModelCheckpoint,
    ReduceLROnPlateau,
)

logger = logging.getLogger(__name__)


def get_callbacks(config: Dict[str, Any], path_extend: str = "") -> List[Callback]:
    callbacks = []

    if "callbacks" in config:
        if path_extend:
            save_data = os.path.join(config["save_loc"], path_extend)
        else:
            save_data = config["save_loc"]
        config = config["callbacks"]
    else:
        return []

    if "ModelCheckpoint" in config:
        config["ModelCheckpoint"]["filepath"] = os.path.join(
            save_data, config["ModelCheckpoint"]["filepath"]
        )
        callbacks.append(ModelCheckpoint(**config["ModelCheckpoint"]))
        logger.info("... loaded Checkpointer")

    if "EarlyStopping" in config:
        callbacks.append(EarlyStopping(**config["EarlyStopping"]))
        logger.info("... loaded EarlyStopping")

    # LearningRateTracker() is omitted here; ReduceLROnPlateau already does
    # this, so add the tracker only when supplying a custom LR annealer.

    if "ReduceLROnPlateau" in config:
        callbacks.append(ReduceLROnPlateau(**config["ReduceLROnPlateau"]))
        logger.info("... loaded ReduceLROnPlateau")

    if "CSVLogger" in config:
        config["CSVLogger"]["filename"] = os.path.join(
            save_data, config["CSVLogger"]["filename"]
        )
        callbacks.append(CSVLogger(**config["CSVLogger"]))
        logger.info("... loaded CSVLogger")

    if "LearningRateScheduler" in config:
        drop = config["LearningRateScheduler"]["drop"]
        epochs_drop = config["LearningRateScheduler"]["epochs_drop"]
        f = partial(step_decay, drop=drop, epochs_drop=epochs_drop)
        callbacks.append(LearningRateScheduler(f))
        callbacks.append(LearningRateTracker())

    return callbacks
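
# Usage sketch (hypothetical keys; each sub-dict mirrors the keyword
# arguments of the corresponding keras.callbacks constructor, and
# "save_loc" plus the file names are made up for illustration):
#
#     config = {
#         "save_loc": "/tmp/experiment",
#         "callbacks": {
#             "ModelCheckpoint": {"filepath": "best.keras", "save_best_only": True},
#             "EarlyStopping": {"monitor": "val_loss", "patience": 5},
#             "CSVLogger": {"filename": "training.csv"},
#         },
#     }
#     callbacks = get_callbacks(config)
#     # model.fit(x, y, epochs=10, callbacks=callbacks)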


def step_decay(epoch, drop=0.2, epochs_drop=5.0, init_lr=0.001):
    """Step-wise decay: multiply the learning rate by `drop` every
    `epochs_drop` epochs."""
    return init_lr * math.pow(drop, math.floor((1 + epoch) / epochs_drop))
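
# Worked example with the defaults (init_lr=0.001, drop=0.2, epochs_drop=5):
#     epochs 0-3 -> 0.001 * 0.2**0 = 0.001
#     epochs 4-8 -> 0.001 * 0.2**1 = 0.0002
#     epoch  9   -> 0.001 * 0.2**2 = 0.00004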


class LearningRateTracker(Callback):
    def on_epoch_end(self, epoch: int, logs: Dict[str, float] = None) -> None:
        # Record the optimizer's current learning rate in the epoch logs.
        logs = logs or {}
        logs["lr"] = float(
            ops.convert_to_numpy(self.model.optimizer.learning_rate)
        )


class ReportEpoch(keras.callbacks.Callback):
    """Increment a backend variable at the start of every epoch so that
    losses with epoch-dependent annealing can read the current epoch."""

    def __init__(self, epoch_var):
        super().__init__()
        self.epoch_var = epoch_var

    def on_epoch_begin(self, epoch, logs=None):
        self.epoch_var.assign_add(1)
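
# Wiring sketch (assumes Keras 3's keras.Variable; names are illustrative):
#
#     epoch_var = keras.Variable(0.0, trainable=False, name="current_epoch")
#     callbacks = get_callbacks(config) + [ReportEpoch(epoch_var)]
#     # an annealing loss can then read `epoch_var`, e.g. via the
#     # `this_epoch_num` argument of this commit's evidential losses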
@@ -0,0 +1,182 @@
import numpy as np
import logging
import keras
import keras.ops as ops

# digamma and lgamma are not part of keras.ops, so import them from the
# active backend.
backend = keras.backend.backend()
if backend == "tensorflow":
    from tensorflow.math import digamma, lgamma
elif backend == "jax":
    from jax.scipy.special import digamma
    from jax.lax import lgamma
elif backend == "torch":
    from torch.special import digamma
    from torch import lgamma
else:
    raise ImportError(f"Unsupported Keras backend for these losses: {backend}")


class DirichletEvidentialLoss(keras.losses.Loss):
    """
    Loss function for an evidential categorical (Dirichlet) model.

    Args:
        callback: Object exposing an `annealing_coef` attribute that sets
            the number of epochs over which the KL term is annealed.
        name (str): Reference name for the loss.
        this_epoch_num: Backend variable tracking the current epoch
            (incremented by the ReportEpoch callback).
        class_weights (list): List of class weights (experimental).
    """

    def __init__(self, callback=None, name="dirichlet", this_epoch_num=None,
                 class_weights=None):
        super().__init__()
        self.callback = callback
        self.__name__ = name
        self.class_weights = class_weights
        self.this_epoch_num = this_epoch_num
        if self.class_weights:
            logging.warning(
                "The application of class weights to this loss is experimental."
            )

    def kl(self, alpha):
        # KL divergence between Dir(alpha) and the uniform Dirichlet Dir(1).
        beta = ops.ones((1, alpha.shape[1]), dtype="float32")
        S_alpha = ops.sum(alpha, axis=1, keepdims=True)
        S_beta = ops.sum(beta, axis=1, keepdims=True)
        lnB = lgamma(S_alpha) - ops.sum(lgamma(alpha), axis=1, keepdims=True)
        lnB_uni = ops.sum(lgamma(beta), axis=1, keepdims=True) - lgamma(S_beta)

        dg0 = digamma(S_alpha)
        dg1 = digamma(alpha)

        if self.class_weights:
            kl = (
                ops.sum(
                    self.class_weights * (alpha - beta) * (dg1 - dg0),
                    axis=1,
                    keepdims=True,
                )
                + lnB
                + lnB_uni
            )
        else:
            kl = (
                ops.sum((alpha - beta) * (dg1 - dg0), axis=1, keepdims=True)
                + lnB
                + lnB_uni
            )
        return kl

    def __call__(self, y, output, sample_weight=None):
        # Evidence is the non-negative network output; alpha = evidence + 1.
        evidence = ops.relu(output)
        alpha = evidence + 1

        S = ops.sum(alpha, axis=1, keepdims=True)
        m = alpha / S

        if self.class_weights:
            A = ops.sum(self.class_weights * (y - m) ** 2, axis=1, keepdims=True)
            B = ops.sum(
                self.class_weights * alpha * (S - alpha) / (S * S * (S + 1)),
                axis=1,
                keepdims=True,
            )
        else:
            A = ops.sum((y - m) ** 2, axis=1, keepdims=True)
            B = ops.sum(alpha * (S - alpha) / (S * S * (S + 1)), axis=1, keepdims=True)

        # Anneal the KL regularizer in over the first `annealing_coef` epochs.
        annealing_coef = ops.minimum(
            1.0, self.this_epoch_num / self.callback.annealing_coef
        )
        alpha_hat = y + (1 - y) * alpha
        C = annealing_coef * self.kl(alpha_hat)
        C = ops.mean(C, axis=1)

        return ops.mean(A + B + C)
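
# Usage sketch (hypothetical wiring; any object exposing `annealing_coef`
# works as the callback argument):
#
#     class Annealer:
#         annealing_coef = 10.0  # anneal the KL term in over 10 epochs
#
#     epoch_var = keras.Variable(0.0, trainable=False)
#     loss = DirichletEvidentialLoss(callback=Annealer(),
#                                    this_epoch_num=epoch_var)
#     # model.compile(optimizer="adam", loss=loss), with ReportEpoch(epoch_var)
#     # from this commit's callbacks module in the fit() callbacks so the
#     # annealing advances each epoch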


class EvidentialRegressionLoss(keras.losses.Loss):
    """
    Loss function for an evidential regression model. The total loss is the
    negative log-likelihood of the Normal-Inverse-Gamma distribution plus the
    evidence-weighted regression error, scaled by the evidential coefficient.
    The coefficient strongly influences the uncertainty predictions (less so
    the predictions themselves) and must be tuned per dataset.

    Loss = loss_nll + coeff * loss_reg

    Args:
        coeff (float): Evidential coefficient.
    """

    def __init__(self, coeff=1.0):
        super().__init__()
        self.coeff = coeff

    def nig_nll(self, y, gamma, v, alpha, beta, reduce=True):
        # Negative log-likelihood of the Normal-Inverse-Gamma distribution.
        v = ops.maximum(v, keras.backend.epsilon())
        twoBlambda = 2 * beta * (1 + v)
        nll = (
            0.5 * ops.log(np.pi / v)
            - alpha * ops.log(twoBlambda)
            + (alpha + 0.5) * ops.log(v * (y - gamma) ** 2 + twoBlambda)
            + lgamma(alpha)
            - lgamma(alpha + 0.5)
        )

        return ops.mean(nll) if reduce else nll

    def nig_reg(self, y, gamma, v, alpha, reduce=True):
        # Regularizer: absolute error weighted by the total evidence.
        error = ops.abs(y - gamma)
        evi = 2 * v + alpha
        reg = error * evi

        return ops.mean(reg) if reduce else reg

    def call(self, y_true, evidential_output):
        gamma, v, alpha, beta = ops.split(evidential_output, 4, axis=-1)
        loss_nll = self.nig_nll(y_true, gamma, v, alpha, beta)
        loss_reg = self.nig_reg(y_true, gamma, v, alpha)

        return loss_nll + self.coeff * loss_reg

    def get_config(self):
        config = super().get_config()
        config.update({"coeff": self.coeff})
        return config
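
# Usage sketch: the network's final layer must emit the four NIG parameters
# (gamma, v, alpha, beta) concatenated on the last axis. A plain Dense(4)
# head is shown for brevity; real evidential heads typically constrain
# v, alpha, beta to be positive (e.g. with softplus activations):
#
#     model = keras.Sequential([
#         keras.layers.Dense(64, activation="relu"),
#         keras.layers.Dense(4),  # -> gamma, v, alpha, beta
#     ])
#     model.compile(optimizer="adam", loss=EvidentialRegressionLoss(coeff=1.0))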


def gaussian_nll(y, y_pred, reduce=True):
    """
    Loss function for a parametric Gaussian model.

    Args:
        y: Training data targets.
        y_pred: Model predictions, [mu, sigma] stacked on the last axis.
    Returns:
        Mean negative log likelihood.
    """
    ax = list(range(1, len(y.shape)))
    mu, sigma = ops.split(y_pred, 2, axis=-1)
    logprob = (
        -ops.log(sigma)
        - 0.5 * ops.log(2 * np.pi)
        - 0.5 * ((y - mu) / sigma) ** 2
    )
    loss = ops.mean(-logprob, axis=ax)
    return ops.mean(loss) if reduce else loss
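
# Example (illustrative values; sigma must be positive):
#
#     y = ops.convert_to_tensor([[0.5], [1.2]])
#     y_pred = ops.convert_to_tensor([[0.4, 0.1], [1.0, 0.2]])
#     nll = gaussian_nll(y, y_pred)  # scalar mean negative log-likelihood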


class EvidentialRegressionCoupledLoss(keras.losses.Loss):
    def __init__(self, r=1.0, coeff=1.0):
        """
        Implementation of the loss from Meinert and Lavin, which fixes issues
        with the original evidential regression loss by coupling the virtual
        evidence values through the coefficient r. With this coupling, the
        regularizer is unnecessary.
        """
        super().__init__()
        self.coeff = coeff
        self.r = r

    def nig_nll(self, y, gamma, v, alpha, beta, reduce=True):
        # Same NIG negative log-likelihood, with the parameters coupled as
        # per Meinert and Lavin.
        twoBlambda = 2 * beta * (1 + v)
        nll = (
            0.5 * ops.log(np.pi / v)
            - alpha * ops.log(twoBlambda)
            + (alpha + 0.5) * ops.log(v * (y - gamma) ** 2 + twoBlambda)
            + lgamma(alpha)
            - lgamma(alpha + 0.5)
        )

        return ops.mean(nll) if reduce else nll

    def nig_reg(self, y, gamma, v, alpha, reduce=True):
        error = ops.abs(y - gamma)  # squared loss could be tried here to target the right minimizer
        evi = v + 2 * alpha  # per the newer paper; could be changed to just 2 * alpha
        reg = error * evi

        return ops.mean(reg) if reduce else reg

    def call(self, y_true, evidential_output):
        gamma, v, alpha, beta = ops.split(evidential_output, 4, axis=-1)
        # Couple v to alpha; deriving v this way keeps alpha from going negative.
        v = 2 * (alpha - 1) / self.r

        loss_nll = self.nig_nll(y_true, gamma, v, alpha, beta)
        loss_reg = self.nig_reg(y_true, gamma, v, alpha)

        return loss_nll + self.coeff * loss_reg

    def get_config(self):
        config = super().get_config()
        config.update({"r": self.r, "coeff": self.coeff})
        return config
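
# Usage sketch: as with EvidentialRegressionLoss, the model emits four values
# per target. Note that call() recomputes v = 2 * (alpha - 1) / r, so the
# network's own v output is effectively ignored:
#
#     loss = EvidentialRegressionCoupledLoss(r=1.0, coeff=0.5)
#     # model.compile(optimizer="adam", loss=loss)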