From a0f9e0003dee61df34c2884e9186248d353ecfaf Mon Sep 17 00:00:00 2001
From: James Fulton
Date: Thu, 20 Jun 2024 10:41:55 +0000
Subject: [PATCH] refactor flat model

---
 pvnet_summation/models/flat_model.py | 105 +++++++++++++++++++++++++++
 tests/models/test_flat_model.py      |  36 +++++++++
 2 files changed, 141 insertions(+)
 create mode 100644 pvnet_summation/models/flat_model.py
 create mode 100644 tests/models/test_flat_model.py

diff --git a/pvnet_summation/models/flat_model.py b/pvnet_summation/models/flat_model.py
new file mode 100644
index 0000000..d627adb
--- /dev/null
+++ b/pvnet_summation/models/flat_model.py
@@ -0,0 +1,105 @@
+"""Simple model which only uses outputs of PVNet for all GSPs"""
+
+from typing import Optional
+
+import numpy as np
+import pvnet
+import torch
+import torch.nn.functional as F
+from pvnet.models.multimodal.linear_networks.basic_blocks import AbstractLinearNetwork
+from pvnet.models.multimodal.linear_networks.networks import DefaultFCNet
+from pvnet.optimizers import AbstractOptimizer
+from torch import nn
+
+from pvnet_summation.models.base_model import BaseModel
+
+
+class FlatModel(BaseModel):
+    """Neural network which combines GSP predictions from PVNet naively
+
+    This model flattens all the features into a 1D vector before feeding them into the sub-network
+    """
+
+    name = "FlatModel"
+
+    def __init__(
+        self,
+        output_network: AbstractLinearNetwork,
+        model_name: str,
+        model_version: Optional[str] = None,
+        output_quantiles: Optional[list[float]] = None,
+        relative_scale_pvnet_outputs: bool = False,
+        predict_difference_from_sum: bool = False,
+        optimizer: AbstractOptimizer = pvnet.optimizers.Adam(),
+    ):
+        """Neural network which combines GSP predictions from PVNet naively
+
+        Args:
+            output_network: A partially instantiated pytorch Module class used to combine the 1D
+                features to produce the forecast.
+            model_name: Model path either locally or on huggingface.
+            model_version: Model version if using huggingface. Set to None if using local.
+            output_quantiles: A list of float (0.0, 1.0) quantiles to predict values for. If set
+                to None the output is a single value.
+            relative_scale_pvnet_outputs: If true, the PVNet predictions are scaled by a factor
+                which is proportional to their capacities.
+            predict_difference_from_sum: Whether to use the sum of GSPs as an estimate for the
+                national sum and train the model to correct this estimate. Otherwise the model
+                tries to learn the national sum from the PVNet outputs directly.
+            optimizer (AbstractOptimizer): Optimizer
+        """
+
+        super().__init__(model_name, model_version, optimizer, output_quantiles)
+
+        self.relative_scale_pvnet_outputs = relative_scale_pvnet_outputs
+        self.predict_difference_from_sum = predict_difference_from_sum
+
+        self.model = output_network(
+            in_features=np.prod(self.pvnet_output_shape),
+            out_features=self.num_output_features,
+        )
+
+        # Add linear layer if predicting difference from sum
+        # This allows the difference to be positive or negative
+        if predict_difference_from_sum:
+            self.model = nn.Sequential(
+                self.model, nn.Linear(self.num_output_features, self.num_output_features)
+            )
+
+        self.save_hyperparameters()
+
+    def forward(self, x):
+        """Run model forward"""
+
+        if "pvnet_outputs" not in x:
+            x["pvnet_outputs"] = self.predict_pvnet_batch(x["pvnet_inputs"])
+
+        if self.relative_scale_pvnet_outputs:
+            if self.pvnet_model.use_quantile_regression:
+                eff_cap = x["effective_capacity"].unsqueeze(-1)
+            else:
+                eff_cap = x["effective_capacity"]
+
+            # The effective capacities are relative fractions of the national capacity. They sum
+            # to 1 and are quite small values: even for the largest GSP the capacity is only
+            # around 0.03. We apply this scaling to make the input values a more sensible size
+            x_in = x["pvnet_outputs"] * eff_cap * 100
+        else:
+            x_in = x["pvnet_outputs"]
+
+        x_in = torch.flatten(x_in, start_dim=1)
+        out = self.model(x_in)
+
+        if self.use_quantile_regression:
+            # Reshape to (batch_size, forecast_len, num_quantiles)
+            out = out.reshape(out.shape[0], self.forecast_len, len(self.output_quantiles))
+
+        if self.predict_difference_from_sum:
+            gsp_sum = self.sum_of_gsps(x)
+
+            if self.use_quantile_regression:
+                gsp_sum = gsp_sum.unsqueeze(-1)
+
+            out = F.leaky_relu(gsp_sum + out)
+
+        return out
\ No newline at end of file
diff --git a/tests/models/test_flat_model.py b/tests/models/test_flat_model.py
new file mode 100644
index 0000000..aec06e8
--- /dev/null
+++ b/tests/models/test_flat_model.py
@@ -0,0 +1,36 @@
+from torch.optim import SGD
+import pytest
+
+
+def test_model_forward(model, sample_batch):
+    y = model.forward(sample_batch)
+
+    # check output is the correct shape
+    # batch size=2, forecast_len=16
+    assert tuple(y.shape) == (2, 16), y.shape
+
+
+def test_model_backward(model, sample_batch):
+    opt = SGD(model.parameters(), lr=0.001)
+
+    y = model(sample_batch)
+
+    # check the backwards pass runs without error
+    y.sum().backward()
+
+
+def test_quantile_model_forward(quantile_model, sample_batch):
+    y_quantiles = quantile_model(sample_batch)
+
+    # check output is the correct shape
+    # batch size=2, forecast_len=16, num_quantiles=3
+    assert tuple(y_quantiles.shape) == (2, 16, 3), y_quantiles.shape
+
+
+def test_quantile_model_backward(quantile_model, sample_batch):
+    opt = SGD(quantile_model.parameters(), lr=0.001)
+
+    y_quantiles = quantile_model(sample_batch)
+
+    # check the backwards pass runs without error
+    y_quantiles.sum().backward()
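
Reviewer note: `output_network` is passed partially instantiated, and FlatModel fills in
`in_features`/`out_features` itself when it builds the sub-network. A minimal construction
sketch, assuming a `functools.partial` wrapping of the `DefaultFCNet` class that the module
already imports; the model path and quantile values below are placeholders, not values taken
from this patch:

    from functools import partial

    from pvnet.models.multimodal.linear_networks.networks import DefaultFCNet
    from pvnet_summation.models.flat_model import FlatModel

    # FlatModel supplies in_features/out_features when it calls output_network(...)
    model = FlatModel(
        output_network=partial(DefaultFCNet),
        model_name="openclimatefix/pvnet_v2",  # placeholder model path (assumption)
        model_version=None,
        output_quantiles=[0.1, 0.5, 0.9],  # example quantiles (assumption)
        relative_scale_pvnet_outputs=True,
        predict_difference_from_sum=True,
    )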
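The `predict_difference_from_sum` branch trains the sub-network to output a residual on top
of the naive sum of the per-GSP forecasts, and the final leaky ReLU discourages negative
national estimates. A toy sketch of just that arithmetic with dummy tensors (shapes assumed:
batch_size=2, forecast_len=16, 3 quantiles):

    import torch
    import torch.nn.functional as F

    gsp_sum = torch.rand(2, 16)        # naive national estimate: sum over GSP forecasts
    residual = torch.randn(2, 16, 3)   # sub-network output after the quantile reshape

    # With quantile regression the sum is broadcast over the quantile dimension,
    # matching gsp_sum.unsqueeze(-1) in forward()
    out = F.leaky_relu(gsp_sum.unsqueeze(-1) + residual)
    print(out.shape)  # torch.Size([2, 16, 3])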