v0.6.11

bartzbeielstein · bartzbeielstein · commit 7b248c21b521 · 2023-07-26T00:14:02.000+02:00
cnn implementation
diff --git a/pyproject.toml b/pyproject.toml
@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "spotPython"
-version = "0.6.10"
+version = "0.6.11"
 authors = [
   { name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }
 ]
diff --git a/src/spotPython/budget/ocba.py b/src/spotPython/budget/ocba.py
@@ -16,10 +16,13 @@ def get_ocba(means, vars, delta) -> int32:
     variances, and incremental budget using the OCBA algorithm.
 
     References:
-        [1]: Chun-Hung Chen and Loo Hay Lee: Stochastic Simulation Optimization: An Optimal Computer Budget Allocation, pp. 49 and pp. 215
-        [2]: C.S.M Currie and T. Monks: How to choose the best setup for a system. A tutorial for the Simulation Workshop 2021, see:
-        [sw21_tutorial.ipynb](https://colab.research.google.com/github/TomMonks/sim-tools/blob/master/examples/sw21_tutorial.ipynb) and
-        [sim-tools](https://github.com/TomMonks/sim-tools)
+        [1]: Chun-Hung Chen and Loo Hay Lee: Stochastic Simulation Optimization: An Optimal Computer Budget Allocation,
+        pp. 49 and pp. 215
+        [2]: C.S.M Currie and T. Monks: How to choose the best setup for a system.
+        A tutorial for the Simulation Workshop 2021, see:
+        https://colab.research.google.com/github/TomMonks/sim-tools/blob/master/examples/sw21_tutorial.ipynb
+        and
+        https://github.com/TomMonks/sim-tools
 
     Args:
         means (numpy.array): An array of means.
diff --git a/src/spotPython/build/kriging.py b/src/spotPython/build/kriging.py
@@ -158,7 +158,8 @@ def __init__(
 
         References:
 
-            [[1](https://scikit-learn.org/stable/auto_examples/gaussian_process/plot_gpr_noisy_targets.html)] scikit-learn: Gaussian Processes regression: basic introductory example
+            [[1](https://scikit-learn.org/stable/auto_examples/gaussian_process/plot_gpr_noisy_targets.html)]
+            scikit-learn: Gaussian Processes regression: basic introductory example
 
         """
         super().__init__(name, seed, log_level)
diff --git a/src/spotPython/fun/hyperlightning.py b/src/spotPython/fun/hyperlightning.py
@@ -0,0 +1,119 @@
+import logging
+import numpy as np
+from numpy.random import default_rng
+from numpy import array
+
+# here we use train_model from spotPython.light.trainmodel
+# and not from spot.light.traintest:
+from spotPython.light.trainmodel import train_model
+from spotPython.hyperparameters.values import (
+    assign_values,
+    generate_one_config_from_var_dict,
+)
+
+logger = logging.getLogger(__name__)
+py_handler = logging.FileHandler(f"{__name__}.log", mode="w")  # mode "w" truncates an existing log file
+py_formatter = logging.Formatter("%(name)s %(asctime)s %(levelname)s %(message)s")
+py_handler.setFormatter(py_formatter)
+logger.addHandler(py_handler)  # module-level statement: the handler is attached when the module is imported
+
+
+class HyperLightning:
+    """
+    Hyperparameter Tuning for Lightning.
+    """
+
+    def __init__(self, seed: int = 126, log_level: int = 50) -> None:
+        self.seed = seed
+        self.rng = default_rng(seed=self.seed)  # numpy random Generator seeded with `seed`
+        self.fun_control = {  # default control settings; fun() merges a caller-supplied dict into this one
+            "seed": None,
+            "data": None,
+            "step": 10_000,
+            "horizon": None,
+            "grace_period": None,
+            "metric_river": None,
+            "metric_sklearn": None,
+            "weights": array([1, 0, 0]),  # multiplied with the result of train_model in fun()
+            "weight_coeff": 0.0,
+            "log_level": log_level,
+            "var_name": [],  # check_X_shape() compares X.shape[1] with len(var_name)
+            "var_type": [],
+        }
+        self.log_level = self.fun_control["log_level"]
+        logger.setLevel(self.log_level)  # the default 50 corresponds to logging.CRITICAL
+        logger.info(f"Starting the logger at level {self.log_level} for module {__name__}:")
+
+    def check_X_shape(self, X: np.ndarray) -> np.ndarray:
+        """
+        Checks the shape of the input array X and raises an exception if it is not valid.
+
+        Args:
+            X (np.ndarray):
+                input array. A 1-dim array is wrapped into a single row.
+
+        Returns:
+            np.ndarray:
+                input array with valid shape.
+
+        Raises:
+            Exception:
+                if X.shape[1] differs from len(self.fun_control["var_name"]).
+
+        Examples:
+            >>> hyper_light = HyperLightning(seed=126, log_level=50)
+            >>> hyper_light.fun_control["var_name"] = ["x0", "x1"]
+            >>> hyper_light.check_X_shape(np.array([[1, 2], [3, 4]]))
+            array([[1, 2],
+                   [3, 4]])
+        """
+        try:
+            X.shape[1]
+        except IndexError:  # a 1-dim array has no second axis: indexing the shape tuple raises IndexError
+            X = np.array([X])
+        if X.shape[1] != len(self.fun_control["var_name"]):
+            raise Exception("Invalid shape of input array X.")
+        return X
+
+    def fun(self, X: np.ndarray, fun_control: dict = None) -> np.ndarray:
+        """
+        Evaluates the function for the given input array X and control parameters.
+
+        Args:
+            X (np.ndarray):
+                input array.
+            fun_control (dict):
+                dictionary containing control parameters for the hyperparameter tuning.
+
+        Returns:
+            (np.ndarray):
+                array containing the evaluation results.
+
+        Examples:
+            >>> hyper_light = HyperLightning(seed=126, log_level=50)
+                X = np.array([[1, 2], [3, 4]])
+                fun_control = {"weights": np.array([1, 0, 0])}
+                hyper_light.fun(X, fun_control)
+                array([nan, nan])
+        """
+        z_res = np.array([], dtype=float)
+        if fun_control is not None:
+            self.fun_control.update(fun_control)
+        X = self.check_X_shape(X)  # continue with the validated array returned by check_X_shape
+        var_dict = assign_values(X, self.fun_control["var_name"])
+        # type information and transformations are considered in generate_one_config_from_var_dict:
+        for config in generate_one_config_from_var_dict(var_dict, self.fun_control):
+            logger.debug(f"\nconfig: {config}")
+            # extract parameters like epochs, batch_size, lr, etc. from config
+            # config_id = generate_config_id(config)
+            try:
+                print("fun: Calling train_model")
+                df_eval = train_model(config, self.fun_control)
+                print("fun: train_model returned")
+            except Exception as err:
+                logger.error(f"Error in fun(). Call to train_model failed. {err=}, {type(err)=}")
+                logger.error("Setting df_eval to np.nan")
+                df_eval = np.nan
+            z_val = self.fun_control["weights"] * df_eval
+            z_res = np.append(z_res, z_val)
+        return z_res
diff --git a/src/spotPython/light/cifar10/cifar10datamodule.py b/src/spotPython/light/cifar10/cifar10datamodule.py
@@ -53,9 +53,7 @@ def setup(self, stage: Optional[str] = None) -> None:
         # https://lightning.ai/docs/pytorch/latest/notebooks/course_UvA-DL/04-inception-resnet-densenet.html
         DATA_MEANS = (0.49139968, 0.48215841, 0.44653091)
         DATA_STDS = (0.24703223, 0.24348513, 0.26158784)
-        transform = transforms.Compose(
-                [transforms.ToTensor(), transforms.Normalize(DATA_MEANS, DATA_STDS)]
-            )
+        transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize(DATA_MEANS, DATA_STDS)])
         # Assign train/val datasets for use in dataloaders
         if stage == "fit" or stage is None:
             data_full = CIFAR10(root=self.data_dir, train=True, transform=transform)
@@ -75,8 +73,9 @@ def train_dataloader(self) -> DataLoader:
 
         """
         print("train_dataloader: self.batch_size", self.batch_size)
-        return DataLoader(self.data_train, batch_size=self.batch_size, shuffle=True, drop_last = True,
-                          num_workers=self.num_workers)
+        return DataLoader(
+            self.data_train, batch_size=self.batch_size, shuffle=True, drop_last=True, num_workers=self.num_workers
+        )
 
     def val_dataloader(self) -> DataLoader:
         """
@@ -88,8 +87,9 @@ def val_dataloader(self) -> DataLoader:
 
         """
         print("val_dataloader: self.batch_size", self.batch_size)
-        return DataLoader(self.data_val, batch_size=self.batch_size, shuffle=False,
-                          drop_last=False, num_workers=self.num_workers)
+        return DataLoader(
+            self.data_val, batch_size=self.batch_size, shuffle=False, drop_last=False, num_workers=self.num_workers
+        )
 
     def test_dataloader(self) -> DataLoader:
         """
@@ -101,5 +101,6 @@ def test_dataloader(self) -> DataLoader:
 
         """
         print("train_data_loader: self.batch_size", self.batch_size)
-        return DataLoader(self.data_test, batch_size=self.batch_size, shuffle=False,
-                          drop_last=False, num_workers=self.num_workers)
+        return DataLoader(
+            self.data_test, batch_size=self.batch_size, shuffle=False, drop_last=False, num_workers=self.num_workers
+        )
diff --git a/src/spotPython/light/cnn/googlenet.py b/src/spotPython/light/cnn/googlenet.py
@@ -1,35 +1,48 @@
-import os
-import urllib.request
 from types import SimpleNamespace
-from urllib.error import HTTPError
-
-import lightning as L
-import matplotlib
-import matplotlib.pyplot as plt
-import matplotlib_inline.backend_inline
-import numpy as np
-import seaborn as sns
-import tabulate
-import torch
 import torch.nn as nn
-import torch.optim as optim
-import torch.utils.data as data
-import torchvision
+from spotPython.light.cnn.inceptionblock import InceptionBlock
 
-from IPython.display import HTML, display
-from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint
-from PIL import Image
-from torchvision import transforms
-from torchvision.datasets import CIFAR10
 
-matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf")  # For export
-matplotlib.rcParams["lines.linewidth"] = 2.0
-sns.reset_orig()
+class GoogleNet(nn.Module):
+    """GoogleNet architecture
 
+    Args:
+        num_classes (int):
+            Number of classes for the classification task. Defaults to 10.
+        act_fn_name (str):
+            Name of the activation function. Defaults to "relu".
+        **kwargs:
+            Additional keyword arguments.
 
-class GoogleNet(nn.Module):
-    def __init__(self, num_classes=10, act_fn_name="relu", **kwargs):
+    Attributes:
+        hparams (SimpleNamespace):
+            Namespace containing the hyperparameters.
+        input_net (nn.Sequential):
+            Input network.
+        inception_blocks (nn.Sequential):
+            Inception blocks.
+        output_net (nn.Sequential):
+            Output network.
+
+    Returns:
+        (torch.Tensor):
+            Output tensor of the GoogleNet architecture
+
+    Examples:
+        >>> from spotPython.light.cnn.googlenet import GoogleNet
+            import torch
+            import torch.nn as nn
+            model = GoogleNet()
+            x = torch.randn(1, 3, 32, 32)
+            y = model(x)
+            y.shape
+            torch.Size([1, 10])
+    """
+
+    def __init__(self, num_classes: int = 10, act_fn_name: str = "relu", **kwargs):
         super().__init__()
+        # TODO: Replace this by act_fn handlers specified in the config file:
+        act_fn_by_name = {"tanh": nn.Tanh, "relu": nn.ReLU, "leakyrelu": nn.LeakyReLU, "gelu": nn.GELU}
         self.hparams = SimpleNamespace(
             num_classes=num_classes, act_fn_name=act_fn_name, act_fn=act_fn_by_name[act_fn_name]
         )
@@ -100,7 +113,7 @@ def _create_network(self):
         )
 
     def _init_params(self):
-        # Based on our discussion in Tutorial 4, we should initialize the
+        # We should initialize the
         # convolutions according to the activation function
         for m in self.modules():
             if isinstance(m, nn.Conv2d):
@@ -113,4 +126,4 @@ def forward(self, x):
         x = self.input_net(x)
         x = self.inception_blocks(x)
         x = self.output_net(x)
-        return x
+        return x
diff --git a/src/spotPython/light/cnn/inceptionblock.py b/src/spotPython/light/cnn/inceptionblock.py
@@ -1,42 +1,50 @@
-import os
-import urllib.request
-from types import SimpleNamespace
-from urllib.error import HTTPError
-
-import lightning as L
-import matplotlib
-import matplotlib.pyplot as plt
-import matplotlib_inline.backend_inline
-import numpy as np
-import seaborn as sns
-import tabulate
 import torch
 import torch.nn as nn
-import torch.optim as optim
-import torch.utils.data as data
-import torchvision
-
-from IPython.display import HTML, display
-from lightning.pytorch.callbacks import LearningRateMonitor, ModelCheckpoint
-from PIL import Image
-from torchvision import transforms
-from torchvision.datasets import CIFAR10
 
-matplotlib_inline.backend_inline.set_matplotlib_formats("svg", "pdf")  # For export
-matplotlib.rcParams["lines.linewidth"] = 2.0
-sns.reset_orig()
-
-# PyTorch
-# Torchvision
 
 class InceptionBlock(nn.Module):
     def __init__(self, c_in, c_red: dict, c_out: dict, act_fn):
         """
-        Inputs:
-            c_in - Number of input feature maps from the previous layers
-            c_red - Dictionary with keys "3x3" and "5x5" specifying the output of the dimensionality reducing 1x1 convolutions
-            c_out - Dictionary with keys "1x1", "3x3", "5x5", and "max"
-            act_fn - Activation class constructor (e.g. nn.ReLU)
+        Inception block as used in GoogLeNet.
+
+        Description from
+        [P. Lippe: Inception, ResNet and DenseNet](https://lightning.ai/docs/pytorch/stable/)
+        An Inception block applies four convolution blocks separately on the same feature map:
+        a 1x1, 3x3, and 5x5 convolution, and a max pool operation.
+        This allows the network to look at the same data with different receptive fields.
+        Of course, learning only 5x5 convolutions would be theoretically more powerful.
+        However, this is not only more computation- and memory-intensive but also tends to overfit much more easily.
+        The 1x1 convolutions are used to reduce the number of input channels to the 3x3 and 5x5 convolutions,
+        which reduces the number of parameters and computation.
+
+        Args:
+            c_in:
+                Number of input feature maps from the previous layers
+            c_red:
+                Dictionary with keys "3x3" and "5x5" specifying
+                the output of the dimensionality reducing 1x1 convolutions
+            c_out:
+                Dictionary with keys "1x1", "3x3", "5x5", and "max"
+            act_fn:
+                Activation class constructor (e.g. nn.ReLU)
+
+        Returns:
+            torch.Tensor:
+                Output tensor of the inception block
+
+        Examples:
+            >>> from spotPython.light.cnn.inceptionblock import InceptionBlock
+                import torch
+                import torch.nn as nn
+                block = InceptionBlock(3,
+                            {"3x3": 32, "5x5": 16},
+                            {"1x1": 16, "3x3": 32, "5x5": 8, "max": 8},
+                            nn.ReLU)
+                x = torch.randn(1, 3, 32, 32)
+                y = block(x)
+                y.shape
+                torch.Size([1, 64, 32, 32])
+
         """
         super().__init__()
 
@@ -79,4 +87,4 @@ def forward(self, x):
         x_5x5 = self.conv_5x5(x)
         x_max = self.max_pool(x)
         x_out = torch.cat([x_1x1, x_3x3, x_5x5, x_max], dim=1)
-        return x_out
+        return x_out
diff --git a/src/spotPython/light/cnn/netcnnbase.py b/src/spotPython/light/cnn/netcnnbase.py
diff --git a/src/spotPython/light/trainmodel.py b/src/spotPython/light/trainmodel.py
diff --git a/src/spotPython/light/utils.py b/src/spotPython/light/utils.py

Original file line number	Diff line number	Diff line change
`@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"`
`7`	`7`
`8`	`8`	`[project]`
`9`	`9`	`name = "spotPython"`
`10`		`-version = "0.6.10"`
	`10`	`+version = "0.6.11"`
`11`	`11`	`authors = [`
`12`	`12`	`{ name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }`
`13`	`13`	`]`