Add files via upload

2025-07-04 05:00:04 +02:00 · 2023-02-04 14:24:47 +01:00 · 2023-02-04 14:24:47 +01:00 · d23e2edd8d
commit d23e2edd8d
parent 5ac2f1dc96
14 changed files with 1406 additions and 84 deletions
--- a/network/Dataset.py
+++ b/network/Dataset.py
@ -12,6 +12,8 @@ class DatasetMaster(torch.utils.data.Dataset, ABC):
    pattern_storage: np.ndarray
    number_of_pattern: int
    mean: list[float]
    initial_size: list[int]
    channel_size: int
    # Initialize
    def __init__(
@ -36,6 +38,9 @@ class DatasetMaster(torch.utils.data.Dataset, ABC):
        self.mean = []
        self.initial_size = [0, 0]
        self.channel_size = 0
    def __len__(self) -> int:
        return self.number_of_pattern
@ -74,6 +79,9 @@ class DatasetMNIST(DatasetMaster):
        mean = self.pattern_storage.mean(3).mean(2).mean(0)
        self.mean = [*mean]
        self.initial_size = [28, 28]
        self.channel_size = 1
    def __getitem__(self, index: int) -> tuple[torch.Tensor, int]:
        image = self.pattern_storage[index, 0:1, :, :]
@ -154,6 +162,9 @@ class DatasetFashionMNIST(DatasetMaster):
        mean = self.pattern_storage.mean(3).mean(2).mean(0)
        self.mean = [*mean]
        self.initial_size = [28, 28]
        self.channel_size = 1
    def __getitem__(self, index: int) -> tuple[torch.Tensor, int]:
        image = self.pattern_storage[index, 0:1, :, :]
@ -240,6 +251,9 @@ class DatasetCIFAR(DatasetMaster):
        mean = self.pattern_storage.mean(3).mean(2).mean(0)
        self.mean = [*mean]
        self.initial_size = [32, 32]
        self.channel_size = 3
    def __getitem__(self, index: int) -> tuple[torch.Tensor, int]:
        image = self.pattern_storage[index, :, :, :]
--- a/network/HDynamicLayer.py
+++ b/network/HDynamicLayer.py
@ -0,0 +1,451 @@
 import torch
 from network.PyHDynamicCNNCPU import HDynamicCNNCPU
 from network.PyHDynamicCNNGPU import HDynamicCNNGPU
 global_sbs_gpu_setting: list[torch.Tensor] = []
 global_sbs_size: list[torch.Tensor] = []
 global_sbs_hdynamic_cpp: list[HDynamicCNNCPU | HDynamicCNNGPU] = []
 class HDynamicLayer(torch.nn.Module):
    _sbs_gpu_setting_position: int
    _sbs_hdynamic_cpp_position: int
    _gpu_tuning_factor: int
    _number_of_cpu_processes: int
    _output_size: list[int]
    _w_trainable: bool
    _output_layer: bool
    _local_learning: bool
    device: torch.device
    default_dtype: torch.dtype
    def __init__(
        self,
        output_size: list[int],
        output_layer: bool = False,
        local_learning: bool = False,
        number_of_cpu_processes: int = 1,
        w_trainable: bool = False,
        skip_gradient_calculation: bool = False,
        device: torch.device | None = None,
        default_dtype: torch.dtype | None = None,
        gpu_tuning_factor: int = 5,
    ) -> None:
        super().__init__()
        assert device is not None
        self.device = device
        self.default_dtype = default_dtype
        self._gpu_tuning_factor = int(gpu_tuning_factor)
        self._number_of_cpu_processes = int(number_of_cpu_processes)
        self._w_trainable = bool(w_trainable)
        self._skip_gradient_calculation = bool(skip_gradient_calculation)
        self._output_size = output_size
        self._output_layer = bool(output_layer)
        self._local_learning = bool(local_learning)
        global_sbs_gpu_setting.append(torch.tensor([0]))
        global_sbs_size.append(torch.tensor([0, 0, 0, 0]))
        if device == torch.device("cpu"):
            global_sbs_hdynamic_cpp.append(HDynamicCNNCPU())
        else:
            global_sbs_hdynamic_cpp.append(HDynamicCNNGPU())
        self._sbs_gpu_setting_position = len(global_sbs_gpu_setting) - 1
        self._sbs_hdynamic_cpp_position = len(global_sbs_hdynamic_cpp) - 1
        self.functional_sbs = FunctionalSbS.apply
    ####################################################################
    # Forward                                                          #
    ####################################################################
    def forward(
        self,
        input: torch.Tensor,
        spike: torch.Tensor,
        epsilon_xy: torch.Tensor,
        epsilon_t_0: torch.Tensor,
        weights: torch.Tensor,
        h_initial: torch.Tensor,
        last_grad_scale: torch.Tensor,
        labels: torch.Tensor | None = None,
        keep_last_grad_scale: bool = False,
        disable_scale_grade: bool = True,
        forgetting_offset: float = -1.0,
    ) -> torch.Tensor:
        if labels is None:
            labels_copy: torch.Tensor = torch.tensor(
                [], dtype=torch.int64, device=self.device
            )
        else:
            labels_copy = (
                labels.detach().clone().type(dtype=torch.int64).to(device=self.device)
            )
        if (spike.shape[-2] * spike.shape[-1]) > self._gpu_tuning_factor:
            gpu_tuning_factor = self._gpu_tuning_factor
        else:
            gpu_tuning_factor = 0
        parameter_list = torch.tensor(
            [
                int(self._number_of_cpu_processes),  # 0
                int(self._output_size[0]),  # 1
                int(self._output_size[1]),  # 2
                int(gpu_tuning_factor),  # 3
                int(self._sbs_gpu_setting_position),  # 4
                int(self._sbs_hdynamic_cpp_position),  # 5
                int(self._w_trainable),  # 6
                int(disable_scale_grade),  # 7
                int(keep_last_grad_scale),  # 8
                int(self._skip_gradient_calculation),  # 9
                int(self._output_layer),  # 10
                int(self._local_learning),  # 11
            ],
            dtype=torch.int64,
        )
        # SbS forward functional
        return self.functional_sbs(
            input,
            spike,
            epsilon_xy,
            epsilon_t_0,
            weights,
            h_initial,
            parameter_list,
            last_grad_scale,
            torch.tensor(
                forgetting_offset, device=self.device, dtype=self.default_dtype
            ),
            labels_copy,
        )
 class FunctionalSbS(torch.autograd.Function):
    @staticmethod
    def forward(  # type: ignore
        ctx,
        input: torch.Tensor,
        spikes: torch.Tensor,
        epsilon_xy: torch.Tensor | None,
        epsilon_t_0: torch.Tensor,
        weights: torch.Tensor,
        h_initial: torch.Tensor,
        parameter_list: torch.Tensor,
        grad_output_scale: torch.Tensor,
        forgetting_offset: torch.Tensor,
        labels: torch.Tensor,
    ) -> torch.Tensor:
        number_of_spikes: int = int(spikes.shape[1])
        if input.device == torch.device("cpu"):
            hdyn_number_of_cpu_processes: int = int(parameter_list[0])
        else:
            hdyn_number_of_cpu_processes = -1
        output_size_0: int = int(parameter_list[1])
        output_size_1: int = int(parameter_list[2])
        gpu_tuning_factor: int = int(parameter_list[3])
        sbs_gpu_setting_position = int(parameter_list[4])
        sbs_hdynamic_cpp_position = int(parameter_list[5])
        # ###########################################################
        # H dynamic
        # ###########################################################
        assert epsilon_t_0.ndim == 1
        assert epsilon_t_0.shape[0] >= number_of_spikes
        # ############################################
        # Make space for the results
        # ############################################
        output = torch.empty(
            (
                int(input.shape[0]),
                int(weights.shape[1]),
                output_size_0,
                output_size_1,
            ),
            dtype=input.dtype,
            device=input.device,
        )
        assert output.is_contiguous() is True
        if epsilon_xy is not None:
            assert epsilon_xy.is_contiguous() is True
            assert epsilon_xy.ndim == 3
        assert epsilon_t_0.is_contiguous() is True
        assert weights.is_contiguous() is True
        assert spikes.is_contiguous() is True
        assert h_initial.is_contiguous() is True
        assert weights.ndim == 2
        assert h_initial.ndim == 1
        sbs_profile = global_sbs_gpu_setting[sbs_gpu_setting_position].clone()
        sbs_size = global_sbs_size[sbs_gpu_setting_position].clone()
        if input.device != torch.device("cpu"):
            if (
                (sbs_profile.numel() == 1)
                or (sbs_size[0] != int(output.shape[0]))
                or (sbs_size[1] != int(output.shape[1]))
                or (sbs_size[2] != int(output.shape[2]))
                or (sbs_size[3] != int(output.shape[3]))
            ):
                sbs_profile = torch.zeros(
                    (14, 7), dtype=torch.int64, device=torch.device("cpu")
                )
                global_sbs_hdynamic_cpp[sbs_hdynamic_cpp_position].gpu_occupancy_export(
                    int(output.shape[2]),
                    int(output.shape[3]),
                    int(output.shape[0]),
                    int(output.shape[1]),
                    sbs_profile.data_ptr(),
                    int(sbs_profile.shape[0]),
                    int(sbs_profile.shape[1]),
                )
                global_sbs_gpu_setting[sbs_gpu_setting_position] = sbs_profile.clone()
                sbs_size[0] = int(output.shape[0])
                sbs_size[1] = int(output.shape[1])
                sbs_size[2] = int(output.shape[2])
                sbs_size[3] = int(output.shape[3])
                global_sbs_size[sbs_gpu_setting_position] = sbs_size.clone()
            else:
                global_sbs_hdynamic_cpp[sbs_hdynamic_cpp_position].gpu_occupancy_import(
                    sbs_profile.data_ptr(),
                    int(sbs_profile.shape[0]),
                    int(sbs_profile.shape[1]),
                )
        global_sbs_hdynamic_cpp[sbs_hdynamic_cpp_position].update(
            output.data_ptr(),
            int(output.shape[0]),
            int(output.shape[1]),
            int(output.shape[2]),
            int(output.shape[3]),
            epsilon_xy.data_ptr() if epsilon_xy is not None else int(0),
            int(epsilon_xy.shape[0]) if epsilon_xy is not None else int(0),
            int(epsilon_xy.shape[1]) if epsilon_xy is not None else int(0),
            int(epsilon_xy.shape[2]) if epsilon_xy is not None else int(0),
            epsilon_t_0.data_ptr(),
            int(epsilon_t_0.shape[0]),
            weights.data_ptr(),
            int(weights.shape[0]),
            int(weights.shape[1]),
            spikes.data_ptr(),
            int(spikes.shape[0]),
            int(spikes.shape[1]),
            int(spikes.shape[2]),
            int(spikes.shape[3]),
            h_initial.data_ptr(),
            int(h_initial.shape[0]),
            hdyn_number_of_cpu_processes,
            float(forgetting_offset.cpu().item()),
            int(gpu_tuning_factor),
        )
        # ###########################################################
        # Save the necessary data for the backward pass
        # ###########################################################
        ctx.save_for_backward(
            input,
            weights,
            output,
            parameter_list,
            grad_output_scale,
            labels,
        )
        return output
    @staticmethod
    def backward(ctx, grad_output):
        # ##############################################
        # Get the variables back
        # ##############################################
        (
            input,
            weights,
            output,
            parameter_list,
            last_grad_scale,
            labels,
        ) = ctx.saved_tensors
        assert labels.numel() > 0
        # ##############################################
        # Default output
        # ##############################################
        grad_input = None
        grad_spikes = None
        grad_eps_xy = None
        grad_epsilon_t_0 = None
        grad_weights = None
        grad_h_initial = None
        grad_parameter_list = None
        grad_forgetting_offset = None
        grad_labels = None
        # ##############################################
        # Parameters
        # ##############################################
        parameter_w_trainable: bool = bool(parameter_list[6])
        parameter_disable_scale_grade: bool = bool(parameter_list[7])
        parameter_keep_last_grad_scale: bool = bool(parameter_list[8])
        parameter_skip_gradient_calculation: bool = bool(parameter_list[9])
        parameter_output_layer: bool = bool(parameter_list[10])
        parameter_local_learning: bool = bool(parameter_list[11])
        # ##############################################
        # Dealing with overall scale of the gradient
        # ##############################################
        if parameter_disable_scale_grade is False:
            if parameter_keep_last_grad_scale is True:
                last_grad_scale = torch.tensor(
                    [torch.abs(grad_output).max(), last_grad_scale]
                ).max()
            grad_output /= last_grad_scale
        grad_output_scale = last_grad_scale.clone()
        input /= input.sum(dim=1, keepdim=True, dtype=weights.dtype)
        # #################################################
        # User doesn't want us to calculate the gradients
        # #################################################
        if parameter_skip_gradient_calculation is True:
            return (
                grad_input,
                grad_spikes,
                grad_eps_xy,
                grad_epsilon_t_0,
                grad_weights,
                grad_h_initial,
                grad_parameter_list,
                grad_output_scale,
                grad_forgetting_offset,
                grad_labels,
            )
        # #################################################
        # Calculate backprop error (grad_input)
        # #################################################
        backprop_r: torch.Tensor = weights.unsqueeze(0).unsqueeze(-1).unsqueeze(
            -1
        ) * output.unsqueeze(1)
        backprop_bigr: torch.Tensor = backprop_r.sum(dim=2)
        backprop_z: torch.Tensor = backprop_r * (
            1.0 / (backprop_bigr + 1e-20)
        ).unsqueeze(2)
        grad_input: torch.Tensor = (backprop_z * grad_output.unsqueeze(1)).sum(2)
        del backprop_z
        # #################################################
        # Calculate weight gradient (grad_weights)
        # #################################################
        if parameter_w_trainable is False:
            # #################################################
            # We don't train this weight
            # #################################################
            grad_weights = None
        elif (parameter_output_layer is False) and (parameter_local_learning is True):
            # #################################################
            # Local learning
            # #################################################
            grad_weights = (
                (-2 * (input - backprop_bigr).unsqueeze(2) * output.unsqueeze(1))
                .sum(0)
                .sum(-1)
                .sum(-1)
            )
        elif (parameter_output_layer is True) and (parameter_local_learning is True):
            target_one_hot: torch.Tensor = torch.zeros(
                (
                    labels.shape[0],
                    output.shape[1],
                ),
                device=input.device,
                dtype=input.dtype,
            )
            target_one_hot.scatter_(
                1,
                labels.to(input.device).unsqueeze(1),
                torch.ones(
                    (labels.shape[0], 1),
                    device=input.device,
                    dtype=input.dtype,
                ),
            )
            target_one_hot = target_one_hot.unsqueeze(-1).unsqueeze(-1)
            # (-2 * (input - backprop_bigr).unsqueeze(2) * (target_one_hot-output).unsqueeze(1))
            # (-2 * input.unsqueeze(2) * (target_one_hot-output).unsqueeze(1))
            grad_weights = (
                (
                    -2
                    * (input - backprop_bigr).unsqueeze(2)
                    * target_one_hot.unsqueeze(1)
                )
                .sum(0)
                .sum(-1)
                .sum(-1)
            )
        else:
            # #################################################
            # Backprop
            # #################################################
            backprop_f: torch.Tensor = output.unsqueeze(1) * (
                input / (backprop_bigr**2 + 1e-20)
            ).unsqueeze(2)
            result_omega: torch.Tensor = backprop_bigr.unsqueeze(
                2
            ) * grad_output.unsqueeze(1)
            result_omega -= (backprop_r * grad_output.unsqueeze(1)).sum(2).unsqueeze(2)
            result_omega *= backprop_f
            del backprop_f
            grad_weights = result_omega.sum(0).sum(-1).sum(-1)
            del result_omega
        del backprop_bigr
        del backprop_r
        return (
            grad_input,
            grad_spikes,
            grad_eps_xy,
            grad_epsilon_t_0,
            grad_weights,
            grad_h_initial,
            grad_parameter_list,
            grad_output_scale,
            grad_forgetting_offset,
            grad_labels,
        )
--- a/network/InputSpikeImage.py
+++ b/network/InputSpikeImage.py
@ -0,0 +1,104 @@
 import torch
 from network.SpikeLayer import SpikeLayer
 from network.SpikeCountLayer import SpikeCountLayer
 class InputSpikeImage(torch.nn.Module):
    _reshape: bool
    _normalize: bool
    _device: torch.device
    number_of_spikes: int
    def __init__(
        self,
        number_of_spikes: int = -1,
        number_of_cpu_processes: int = 1,
        reshape: bool = False,
        normalize: bool = True,
        device: torch.device | None = None,
    ) -> None:
        super().__init__()
        assert device is not None
        self._device = device
        self._reshape = bool(reshape)
        self._normalize = bool(normalize)
        self.number_of_spikes = int(number_of_spikes)
        if device != torch.device("cpu"):
            number_of_cpu_processes_spike_generator = 0
        else:
            number_of_cpu_processes_spike_generator = number_of_cpu_processes
        self.spike_generator = SpikeLayer(
            number_of_cpu_processes=number_of_cpu_processes_spike_generator,
            device=device,
        )
        self.spike_count = SpikeCountLayer(
            number_of_cpu_processes=number_of_cpu_processes
        )
    ####################################################################
    # Forward                                                          #
    ####################################################################
    def forward(self, input: torch.Tensor) -> torch.Tensor:
        if self.number_of_spikes < 1:
            return input
        input_shape: list[int] = [
            int(input.shape[0]),
            int(input.shape[1]),
            int(input.shape[2]),
            int(input.shape[3]),
        ]
        if self._reshape is True:
            input_work = (
                input.detach()
                .clone()
                .to(self._device)
                .reshape(
                    (input_shape[0], input_shape[1] * input_shape[2] * input_shape[3])
                )
                .unsqueeze(-1)
                .unsqueeze(-1)
            )
        else:
            input_work = input.detach().clone().to(self._device)
        spikes = self.spike_generator(
            input=input_work, number_of_spikes=self.number_of_spikes
        )
        if self._reshape is True:
            dim_s: int = input_shape[1] * input_shape[2] * input_shape[3]
        else:
            dim_s = input_shape[1]
        output: torch.Tensor = self.spike_count(spikes, dim_s)
        if self._reshape is True:
            output = (
                output.squeeze(-1)
                .squeeze(-1)
                .reshape(
                    (input_shape[0], input_shape[1], input_shape[2], input_shape[3])
                )
            )
        if self._normalize is True:
            output = output.type(dtype=input_work.dtype)
            output = output / output.sum(dim=-1, keepdim=True).sum(
                dim=-2, keepdim=True
            ).sum(dim=-3, keepdim=True)
        return output
--- a/network/Makefile
+++ b/network/Makefile
@ -3,20 +3,22 @@ export
 all:
 	cd h_dynamic_cnn_cpu_cpp && $(MAKE) all
-	cd h_dynamic_cnn_gpu_cpp && $(MAKE) all
+	cd h_dynamic_cnn_gpu_cpp_v1 && $(MAKE) all
 	cd spike_generation_cpu_cpp && $(MAKE) all
 	cd spike_generation_gpu_cpp_v2 && $(MAKE) all 
 	cd multiplication_approximation_cpu_cpp && $(MAKE) all
 	cd multiplication_approximation_gpu_cpp && $(MAKE) all
 	cd count_spikes_cpu_cpp && $(MAKE) all
 	cd sort_spikes_cpu_cpp && $(MAKE) all
 	$(PYBIN)python3 pybind11_auto_pyi.py
 clean:
 	cd h_dynamic_cnn_cpu_cpp && $(MAKE) clean
-	cd h_dynamic_cnn_gpu_cpp && $(MAKE) clean
+	cd h_dynamic_cnn_gpu_cpp_v1 && $(MAKE) clean
 	cd spike_generation_cpu_cpp && $(MAKE) clean
 	cd spike_generation_gpu_cpp_v2 && $(MAKE) clean 
 	cd multiplication_approximation_cpu_cpp && $(MAKE) clean
 	cd multiplication_approximation_gpu_cpp && $(MAKE) clean
 	cd count_spikes_cpu_cpp && $(MAKE) clean
 	cd sort_spikes_cpu_cpp && $(MAKE) clean
--- a/network/SbSLayer.py
+++ b/network/SbSLayer.py
@ -0,0 +1,480 @@
 import torch
 from network.SpikeLayer import SpikeLayer
 from network.HDynamicLayer import HDynamicLayer
 from network.calculate_output_size import calculate_output_size
 from network.SortSpikesLayer import SortSpikesLayer
 class SbSLayer(torch.nn.Module):
    _epsilon_xy: torch.Tensor | None = None
    _epsilon_xy_use: bool
    _epsilon_0: float
    _weights: torch.nn.parameter.Parameter
    _weights_exists: bool = False
    _kernel_size: list[int]
    _stride: list[int]
    _dilation: list[int]
    _padding: list[int]
    _output_size: torch.Tensor
    _number_of_spikes: int
    _number_of_cpu_processes: int
    _number_of_neurons: int
    _number_of_input_neurons: int
    _epsilon_xy_intitial: float
    _h_initial: torch.Tensor | None = None
    _w_trainable: bool
    _last_grad_scale: torch.nn.parameter.Parameter
    _keep_last_grad_scale: bool
    _disable_scale_grade: bool
    _forgetting_offset: float
    _weight_noise_range: list[float]
    _skip_gradient_calculation: bool
    _is_pooling_layer: bool
    _input_size: list[int]
    _output_layer: bool = False
    _local_learning: bool = False
    device: torch.device
    default_dtype: torch.dtype
    _gpu_tuning_factor: int
    _max_grad_weights: torch.Tensor | None = None
    _number_of_grad_weight_contributions: float = 0.0
    last_input_store: bool = False
    last_input_data: torch.Tensor | None = None
    _cooldown_after_number_of_spikes: int = -1
    _reduction_cooldown: float = 1.0
    _layer_id: int = -1
    spike_full_layer_input_distribution: bool = False
    def __init__(
        self,
        number_of_input_neurons: int,
        number_of_neurons: int,
        input_size: list[int],
        forward_kernel_size: list[int],
        number_of_spikes: int,
        epsilon_xy_intitial: float = 0.1,
        epsilon_xy_use: bool = False,
        epsilon_0: float = 1.0,
        weight_noise_range: list[float] = [0.0, 1.0],
        is_pooling_layer: bool = False,
        strides: list[int] = [1, 1],
        dilation: list[int] = [0, 0],
        padding: list[int] = [0, 0],
        number_of_cpu_processes: int = 1,
        w_trainable: bool = False,
        keep_last_grad_scale: bool = False,
        disable_scale_grade: bool = True,
        forgetting_offset: float = -1.0,
        skip_gradient_calculation: bool = False,
        device: torch.device | None = None,
        default_dtype: torch.dtype | None = None,
        gpu_tuning_factor: int = 10,
        layer_id: int = -1,
        cooldown_after_number_of_spikes: int = -1,
        reduction_cooldown: float = 1.0,
    ) -> None:
        super().__init__()
        assert device is not None
        assert default_dtype is not None
        self.device = device
        self.default_dtype = default_dtype
        self._w_trainable = bool(w_trainable)
        self._keep_last_grad_scale = bool(keep_last_grad_scale)
        self._skip_gradient_calculation = bool(skip_gradient_calculation)
        self._disable_scale_grade = bool(disable_scale_grade)
        self._epsilon_xy_intitial = float(epsilon_xy_intitial)
        self._stride = strides
        self._dilation = dilation
        self._padding = padding
        self._kernel_size = forward_kernel_size
        self._number_of_input_neurons = int(number_of_input_neurons)
        self._number_of_neurons = int(number_of_neurons)
        self._epsilon_0 = float(epsilon_0)
        self._number_of_cpu_processes = int(number_of_cpu_processes)
        self._number_of_spikes = int(number_of_spikes)
        self._weight_noise_range = weight_noise_range
        self._is_pooling_layer = bool(is_pooling_layer)
        self._cooldown_after_number_of_spikes = int(cooldown_after_number_of_spikes)
        self.reduction_cooldown = float(reduction_cooldown)
        self._layer_id = layer_id
        self._epsilon_xy_use = epsilon_xy_use
        assert len(input_size) == 2
        self._input_size = input_size
        # The GPU hates me...
        # Too many SbS threads == bad
        # Thus I need to limit them...
        # (Reminder: We cannot access the mini-batch size here,
        # which is part of the GPU thread size calculation...)
        self._last_grad_scale = torch.nn.parameter.Parameter(
            torch.tensor(-1.0, dtype=self.default_dtype),
            requires_grad=True,
        )
        self._forgetting_offset = float(forgetting_offset)
        self._output_size = calculate_output_size(
            value=input_size,
            kernel_size=self._kernel_size,
            stride=self._stride,
            dilation=self._dilation,
            padding=self._padding,
        )
        self.set_h_init_to_uniform()
        self.spike_generator = SpikeLayer(
            number_of_spikes=self._number_of_spikes,
            number_of_cpu_processes=self._number_of_cpu_processes,
            device=self.device,
        )
        self.h_dynamic = HDynamicLayer(
            output_size=self._output_size.tolist(),
            output_layer=self._output_layer,
            local_learning=self._local_learning,
            number_of_cpu_processes=number_of_cpu_processes,
            w_trainable=w_trainable,
            skip_gradient_calculation=skip_gradient_calculation,
            device=device,
            default_dtype=self.default_dtype,
            gpu_tuning_factor=gpu_tuning_factor,
        )
        assert len(input_size) >= 2
        self.spikes_sorter = SortSpikesLayer(
            kernel_size=self._kernel_size,
            input_shape=[
                self._number_of_input_neurons,
                int(input_size[0]),
                int(input_size[1]),
            ],
            output_size=self._output_size.clone(),
            strides=self._stride,
            dilation=self._dilation,
            padding=self._padding,
            number_of_cpu_processes=number_of_cpu_processes,
        )
        # TODO: TEST
        if layer_id == 0:
            self.spike_full_layer_input_distribution = True
        # ###############################################################
        # Initialize the weights
        # ###############################################################
        if self._is_pooling_layer is True:
            self.weights = self._make_pooling_weights()
        else:
            assert len(self._weight_noise_range) == 2
            weights = torch.empty(
                (
                    int(self._kernel_size[0])
                    * int(self._kernel_size[1])
                    * int(self._number_of_input_neurons),
                    int(self._number_of_neurons),
                ),
                dtype=self.default_dtype,
                device=self.device,
            )
            torch.nn.init.uniform_(
                weights,
                a=float(self._weight_noise_range[0]),
                b=float(self._weight_noise_range[1]),
            )
            self.weights = weights
    ####################################################################
    # Variables in and out                                             #
    ####################################################################
    def get_epsilon_t(self, number_of_spikes: int):
        """Generates the time series of the basic epsilon."""
        t = (
            torch.arange(
                0, number_of_spikes, dtype=self.default_dtype, device=self.device
            )
            + 1
        )
        # torch.ones((number_of_spikes), dtype=self.default_dtype, device=self.device
        epsilon_t: torch.Tensor = t ** (-1.0 / 2.0)
        if (self._cooldown_after_number_of_spikes < number_of_spikes) and (
            self._cooldown_after_number_of_spikes >= 0
        ):
            epsilon_t[
                self._cooldown_after_number_of_spikes : number_of_spikes
            ] /= self._reduction_cooldown
        return epsilon_t
    @property
    def weights(self) -> torch.Tensor | None:
        if self._weights_exists is False:
            return None
        else:
            return self._weights
    @weights.setter
    def weights(self, value: torch.Tensor):
        assert value is not None
        assert torch.is_tensor(value) is True
        assert value.dim() == 2
        temp: torch.Tensor = (
            value.detach()
            .clone(memory_format=torch.contiguous_format)
            .type(dtype=self.default_dtype)
            .to(device=self.device)
        )
        temp /= temp.sum(dim=0, keepdim=True, dtype=self.default_dtype)
        if self._weights_exists is False:
            self._weights = torch.nn.parameter.Parameter(temp, requires_grad=True)
            self._weights_exists = True
        else:
            self._weights.data = temp
    @property
    def h_initial(self) -> torch.Tensor | None:
        return self._h_initial
    @h_initial.setter
    def h_initial(self, value: torch.Tensor):
        assert value is not None
        assert torch.is_tensor(value) is True
        assert value.dim() == 1
        assert value.dtype == self.default_dtype
        self._h_initial = (
            value.detach()
            .clone(memory_format=torch.contiguous_format)
            .type(dtype=self.default_dtype)
            .to(device=self.device)
            .requires_grad_(False)
        )
    def update_pre_care(self):
        if self._weights.grad is not None:
            assert self._number_of_grad_weight_contributions > 0
            self._weights.grad /= self._number_of_grad_weight_contributions
            self._number_of_grad_weight_contributions = 0.0
    def update_after_care(self, threshold_weight: float):
        if self._w_trainable is True:
            self.norm_weights()
            self.threshold_weights(threshold_weight)
            self.norm_weights()
    def after_batch(self, new_state: bool = False):
        if self._keep_last_grad_scale is True:
            self._last_grad_scale.data = self._last_grad_scale.grad
            self._keep_last_grad_scale = new_state
        self._last_grad_scale.grad = torch.zeros_like(self._last_grad_scale.grad)
    ####################################################################
    # Helper functions                                                 #
    ####################################################################
    def _make_pooling_weights(self) -> torch.Tensor:
        """For generating the pooling weights."""
        assert self._number_of_neurons is not None
        assert self._kernel_size is not None
        weights: torch.Tensor = torch.zeros(
            (
                int(self._kernel_size[0]),
                int(self._kernel_size[1]),
                int(self._number_of_neurons),
                int(self._number_of_neurons),
            ),
            dtype=self.default_dtype,
            device=self.device,
        )
        for i in range(0, int(self._number_of_neurons)):
            weights[:, :, i, i] = 1.0
        weights = weights.moveaxis(-1, 0).moveaxis(-1, 1)
        weights = torch.nn.functional.unfold(
            input=weights,
            kernel_size=(int(self._kernel_size[0]), int(self._kernel_size[1])),
            dilation=(1, 1),
            padding=(0, 0),
            stride=(1, 1),
        ).squeeze()
        weights = torch.moveaxis(weights, 0, 1)
        return weights
    def set_h_init_to_uniform(self) -> None:
        assert self._number_of_neurons > 2
        self.h_initial: torch.Tensor = torch.full(
            (self._number_of_neurons,),
            (1.0 / float(self._number_of_neurons)),
            dtype=self.default_dtype,
            device=self.device,
        )
    def norm_weights(self) -> None:
        assert self._weights_exists is True
        temp: torch.Tensor = (
            self._weights.data.detach()
            .clone(memory_format=torch.contiguous_format)
            .type(dtype=self.default_dtype)
            .to(device=self.device)
        )
        temp /= temp.sum(dim=0, keepdim=True, dtype=self.default_dtype)
        self._weights.data = temp
    def threshold_weights(self, threshold: float) -> None:
        assert self._weights_exists is True
        assert threshold >= 0
        torch.clamp(
            self._weights.data,
            min=float(threshold),
            max=None,
            out=self._weights.data,
        )
    ####################################################################
    # Forward                                                          #
    ####################################################################
    def forward(
        self,
        input: torch.Tensor,
        labels: torch.Tensor | None = None,
    ) -> torch.Tensor:
        # Are we happy with the input?
        assert input is not None
        assert torch.is_tensor(input) is True
        assert input.dim() == 4
        assert input.dtype == self.default_dtype
        assert input.shape[1] == self._number_of_input_neurons
        assert input.shape[2] == self._input_size[0]
        assert input.shape[3] == self._input_size[1]
        # Are we happy with the rest of the network?
        assert self._epsilon_0 is not None
        assert self._h_initial is not None
        assert self._forgetting_offset is not None
        assert self._weights_exists is True
        assert self._weights is not None
        # Convolution of the input...
        # Well, this is a convoltion layer
        # there needs to be convolution somewhere
        input_convolved = torch.nn.functional.fold(
            torch.nn.functional.unfold(
                input.requires_grad_(True),
                kernel_size=(int(self._kernel_size[0]), int(self._kernel_size[1])),
                dilation=(int(self._dilation[0]), int(self._dilation[1])),
                padding=(int(self._padding[0]), int(self._padding[1])),
                stride=(int(self._stride[0]), int(self._stride[1])),
            ),
            output_size=tuple(self._output_size.tolist()),
            kernel_size=(1, 1),
            dilation=(1, 1),
            padding=(0, 0),
            stride=(1, 1),
        )
        # We might need the convolved input for other layers
        # let us keep it for the future
        if self.last_input_store is True:
            self.last_input_data = input_convolved.detach().clone()
            self.last_input_data /= self.last_input_data.sum(dim=1, keepdim=True)
        else:
            self.last_input_data = None
        epsilon_t_0: torch.Tensor = (
            (self.get_epsilon_t(self._number_of_spikes) * self._epsilon_0)
            .type(input.dtype)
            .to(input.device)
        )
        if (self._epsilon_xy is None) and (self._epsilon_xy_use is True):
            self._epsilon_xy = torch.full(
                (
                    input_convolved.shape[1],
                    input_convolved.shape[2],
                    input_convolved.shape[3],
                ),
                float(self._epsilon_xy_intitial),
                dtype=self.default_dtype,
                device=self.device,
            )
        if self._epsilon_xy_use is True:
            assert self._epsilon_xy is not None
            # In the case somebody tried to replace the matrix with wrong dimensions
            assert self._epsilon_xy.shape[0] == input_convolved.shape[1]
            assert self._epsilon_xy.shape[1] == input_convolved.shape[2]
            assert self._epsilon_xy.shape[2] == input_convolved.shape[3]
        else:
            assert self._epsilon_xy is None
        if self.spike_full_layer_input_distribution is False:
            spike = self.spike_generator(input_convolved, int(self._number_of_spikes))
        else:
            input_shape = input.shape
            input = (
                input.reshape(
                    (input_shape[0], input_shape[1] * input_shape[2] * input_shape[3])
                )
                .unsqueeze(-1)
                .unsqueeze(-1)
            )
            spike_unsorted = self.spike_generator(input, int(self._number_of_spikes))
            input = (
                input.squeeze(-1)
                .squeeze(-1)
                .reshape(
                    (input_shape[0], input_shape[1], input_shape[2], input_shape[3])
                )
            )
            spike = self.spikes_sorter(spike_unsorted).to(device=input_convolved.device)
        output = self.h_dynamic(
            input=input_convolved,
            spike=spike,
            epsilon_xy=self._epsilon_xy,
            epsilon_t_0=epsilon_t_0,
            weights=self._weights,
            h_initial=self._h_initial,
            last_grad_scale=self._last_grad_scale,
            labels=labels,
            keep_last_grad_scale=self._keep_last_grad_scale,
            disable_scale_grade=self._disable_scale_grade,
            forgetting_offset=self._forgetting_offset,
        )
        self._number_of_grad_weight_contributions += (
            output.shape[0] * output.shape[-2] * output.shape[-1]
        )
        return output
--- a/network/SbSReconstruction.py
+++ b/network/SbSReconstruction.py
@ -1,15 +1,15 @@
 import torch
-from network.SbS import SbS
+from network.SbSLayer import SbSLayer
 class SbSReconstruction(torch.nn.Module):
-    _the_sbs_layer: SbS
+    _the_sbs_layer: SbSLayer
    def __init__(
        self,
-        the_sbs_layer: SbS,
+        the_sbs_layer: SbSLayer,
    ) -> None:
        super().__init__()
--- a/network/SortSpikesLayer.py
+++ b/network/SortSpikesLayer.py
@ -0,0 +1,173 @@
 import torch
 from network.PySortSpikesCPU import SortSpikesCPU
 class SortSpikesLayer(torch.nn.Module):
    _kernel_size: list[int]
    _stride: list[int]
    _dilation: list[int]
    _padding: list[int]
    _output_size: torch.Tensor
    _number_of_cpu_processes: int
    _input_shape: list[int]
    order: torch.Tensor | None = None
    order_convoled: torch.Tensor | None = None
    indices: torch.Tensor | None = None
    def __init__(
        self,
        kernel_size: list[int],
        input_shape: list[int],
        output_size: torch.Tensor,
        strides: list[int] = [1, 1],
        dilation: list[int] = [0, 0],
        padding: list[int] = [0, 0],
        number_of_cpu_processes: int = 1,
    ) -> None:
        super().__init__()
        self._stride = strides
        self._dilation = dilation
        self._padding = padding
        self._kernel_size = kernel_size
        self._output_size = output_size
        self._number_of_cpu_processes = number_of_cpu_processes
        self._input_shape = input_shape
        self.sort_spikes = SortSpikesCPU()
        self.order = (
            torch.arange(
                0,
                self._input_shape[0] * self._input_shape[1] * self._input_shape[2],
                device=torch.device("cpu"),
            )
            .reshape(
                (
                    1,
                    self._input_shape[0],
                    self._input_shape[1],
                    self._input_shape[2],
                )
            )
            .type(dtype=torch.float32)
        )
        self.order_convoled = torch.nn.functional.fold(
            torch.nn.functional.unfold(
                self.order,
                kernel_size=(
                    int(self._kernel_size[0]),
                    int(self._kernel_size[1]),
                ),
                dilation=(int(self._dilation[0]), int(self._dilation[1])),
                padding=(int(self._padding[0]), int(self._padding[1])),
                stride=(int(self._stride[0]), int(self._stride[1])),
            ),
            output_size=tuple(self._output_size.tolist()),
            kernel_size=(1, 1),
            dilation=(1, 1),
            padding=(0, 0),
            stride=(1, 1),
        ).type(dtype=torch.int64)
        assert self.order_convoled is not None
        self.order_convoled = self.order_convoled.reshape(
            (
                self.order_convoled.shape[1]
                * self.order_convoled.shape[2]
                * self.order_convoled.shape[3]
            )
        )
        max_length: int = 0
        max_range: int = (
            self._input_shape[0] * self._input_shape[1] * self._input_shape[2]
        )
        for id in range(0, max_range):
            idx = torch.where(self.order_convoled == id)[0]
            max_length = max(max_length, int(idx.shape[0]))
        self.indices = torch.full(
            (max_range, max_length),
            -1,
            dtype=torch.int64,
            device=torch.device("cpu"),
        )
        for id in range(0, max_range):
            idx = torch.where(self.order_convoled == id)[0]
            self.indices[id, 0 : int(idx.shape[0])] = idx
    ####################################################################
    # Forward                                                          #
    ####################################################################
    def forward(
        self,
        input: torch.Tensor,
    ) -> torch.Tensor:
        assert len(self._input_shape) == 3
        assert input.shape[-2] == 1
        assert input.shape[-1] == 1
        assert self.indices is not None
        spikes_count = torch.zeros(
            (input.shape[0], int(self._output_size[0]), int(self._output_size[1])),
            device=torch.device("cpu"),
            dtype=torch.int64,
        )
        input_cpu = input.clone().cpu()
        self.sort_spikes.count(
            input_cpu.data_ptr(),  # Input
            int(input_cpu.shape[0]),
            int(input_cpu.shape[1]),
            int(input_cpu.shape[2]),
            int(input_cpu.shape[3]),
            spikes_count.data_ptr(),  # Output
            int(spikes_count.shape[0]),
            int(spikes_count.shape[1]),
            int(spikes_count.shape[2]),
            self.indices.data_ptr(),  # Positions
            int(self.indices.shape[0]),
            int(self.indices.shape[1]),
            int(self._number_of_cpu_processes),
        )
        spikes_output = torch.full(
            (
                input.shape[0],
                int(spikes_count.max()),
                int(self._output_size[0]),
                int(self._output_size[1]),
            ),
            -1,
            dtype=torch.int64,
            device=torch.device("cpu"),
        )
        self.sort_spikes.process(
            input_cpu.data_ptr(),  # Input
            int(input_cpu.shape[0]),
            int(input_cpu.shape[1]),
            int(input_cpu.shape[2]),
            int(input_cpu.shape[3]),
            spikes_output.data_ptr(),  # Output
            int(spikes_output.shape[0]),
            int(spikes_output.shape[1]),
            int(spikes_output.shape[2]),
            int(spikes_output.shape[3]),
            self.indices.data_ptr(),  # Positions
            int(self.indices.shape[0]),
            int(self.indices.shape[1]),
            int(self._number_of_cpu_processes),
        )
        return spikes_output
--- a/network/SpikeCountLayer.py
+++ b/network/SpikeCountLayer.py
@ -0,0 +1,52 @@
 import torch
 from network.PyCountSpikesCPU import CountSpikesCPU
 class SpikeCountLayer(torch.nn.Module):
    _number_of_cpu_processes: int
    def __init__(
        self,
        number_of_cpu_processes: int = 1,
    ) -> None:
        super().__init__()
        self._number_of_cpu_processes = number_of_cpu_processes
    ####################################################################
    # Forward                                                          #
    ####################################################################
    def forward(self, input: torch.Tensor, dim_s: int) -> torch.Tensor:
        assert input.ndim == 4
        assert dim_s > 0
        input_cpu = input.cpu()
        histogram = torch.zeros(
            (
                int(input.shape[0]),
                int(dim_s),
                int(input.shape[-2]),
                int(input.shape[-1]),
            ),
            dtype=torch.int64,
            device=input_cpu.device,
        )
        count_spikes = CountSpikesCPU()
        count_spikes.process(
            input_cpu.data_ptr(),
            int(input_cpu.shape[0]),
            int(input_cpu.shape[1]),
            int(input_cpu.shape[2]),
            int(input_cpu.shape[3]),
            histogram.data_ptr(),
            int(histogram.shape[1]),
            int(self._number_of_cpu_processes),
        )
        return histogram.to(device=input.device)
--- a/network/SpikeLayer.py
+++ b/network/SpikeLayer.py
@ -3,8 +3,6 @@ import torch
 from network.PySpikeGenerationCPU import SpikeGenerationCPU
 from network.PySpikeGenerationGPU import SpikeGenerationGPU
 # from PyCountSpikesCPU import CountSpikesCPU
 global_spike_generation_gpu_setting: list[torch.Tensor] = []
 global_spike_size: list[torch.Tensor] = []
 global_spike_generation_cpp: list[SpikeGenerationCPU | SpikeGenerationGPU] = []
@ -16,28 +14,21 @@ class SpikeLayer(torch.nn.Module):
    _spike_generation_gpu_setting_position: int
    _number_of_cpu_processes: int
    _number_of_spikes: int
-
+    device: torch.device
    _spikes: torch.Tensor | None = None
    _store_spikes: bool
    def __init__(
        self,
-        number_of_spikes: int = 1,
+        number_of_spikes: int = -1,
        number_of_cpu_processes: int = 1,
        device: torch.device | None = None,
        default_dtype: torch.dtype | None = None,
        store_spikes: bool = False,
    ) -> None:
        super().__init__()
        assert device is not None
        assert default_dtype is not None
        self.device = device
        self.default_dtype = default_dtype
        self._number_of_cpu_processes = number_of_cpu_processes
        self._number_of_spikes = number_of_spikes
        self._store_spikes = store_spikes
        global_spike_generation_gpu_setting.append(torch.tensor([0]))
        global_spike_size.append(torch.tensor([0, 0, 0, 0]))
@ -62,7 +53,6 @@ class SpikeLayer(torch.nn.Module):
        self,
        input: torch.Tensor,
        number_of_spikes: int | None = None,
        store_spikes: bool | None = None,
    ) -> torch.Tensor:
        if number_of_spikes is None:
@ -80,18 +70,7 @@ class SpikeLayer(torch.nn.Module):
            dtype=torch.int64,
        )
-        spikes = self.functional_spike_generation(input, parameter_list)
+        return self.functional_spike_generation(input, parameter_list)
        if (store_spikes is not None) and (store_spikes is True):
            self._spikes = spikes.detach().clone()
        elif (store_spikes is not None) and (store_spikes is False):
            self._spikes = None
        elif self._store_spikes is True:
            self._spikes = spikes.detach().clone()
        else:
            self._spikes = None
        return spikes
 class FunctionalSpikeGeneration(torch.autograd.Function):
--- a/network/build_network.py
+++ b/network/build_network.py
@ -3,10 +3,11 @@ import torch
 from network.calculate_output_size import calculate_output_size
 from network.Parameter import Config
-from network.SbS import SbS
+from network.SbSLayer import SbSLayer
 from network.SplitOnOffLayer import SplitOnOffLayer
 from network.Conv2dApproximation import Conv2dApproximation
 from network.SbSReconstruction import SbSReconstruction
 from network.InputSpikeImage import InputSpikeImage
 def build_network(
@ -144,7 +145,7 @@ def build_network(
                is_pooling_layer = True
            network.append(
-                SbS(
+                SbSLayer(
                    number_of_input_neurons=in_channels,
                    number_of_neurons=out_channels,
                    input_size=input_size[-1],
@ -190,7 +191,7 @@ def build_network(
            logging.info(f"Layer: {layer_id} -> SbS Reconstruction Layer")
            assert layer_id > 0
-            assert isinstance(network[-1], SbS) is True
+            assert isinstance(network[-1], SbSLayer) is True
            network.append(SbSReconstruction(network[-1]))
            network[-1]._w_trainable = False
@ -365,6 +366,36 @@ def build_network(
            ).tolist()
            input_size.append(input_size_temp)
        # #############################################################
        # Approx CONV2D layer:
        # #############################################################
        elif (
            cfg.network_structure.layer_type[layer_id]
            .upper()
            .startswith("INPUT SPIKE IMAGE")
            is True
        ):
            logging.info(f"Layer: {layer_id} -> Input Spike Image Layer")
            number_of_spikes: int = -1
            if len(cfg.number_of_spikes) > layer_id:
                number_of_spikes = cfg.number_of_spikes[layer_id]
            elif len(cfg.number_of_spikes) == 1:
                number_of_spikes = cfg.number_of_spikes[0]
            network.append(
                InputSpikeImage(
                    number_of_spikes=number_of_spikes,
                    number_of_cpu_processes=cfg.number_of_cpu_processes,
                    reshape=True,
                    normalize=True,
                    device=device,
                )
            )
            input_size.append(input_size[-1])
        # #############################################################
        # Failure becaue we didn't found the selection of layer
        # #############################################################
--- a/network/build_optimizer.py
+++ b/network/build_optimizer.py
@ -1,7 +1,7 @@
 # %%
 import torch
 from network.Parameter import Config
-from network.SbS import SbS
+from network.SbSLayer import SbSLayer
 from network.Conv2dApproximation import Conv2dApproximation
 from network.Adam import Adam
@ -20,7 +20,7 @@ def build_optimizer(
    for id in range(0, len(network)):
-        if (isinstance(network[id], SbS) is True) and (
+        if (isinstance(network[id], SbSLayer) is True) and (
            network[id]._w_trainable is True
        ):
            parameter_list_weights.append(network[id]._weights)
--- a/network/load_previous_weights.py
+++ b/network/load_previous_weights.py
@ -3,9 +3,10 @@ import torch
 import glob
 import numpy as np
-from network.SbS import SbS
+from network.SbSLayer import SbSLayer
 from network.SplitOnOffLayer import SplitOnOffLayer
 from network.Conv2dApproximation import Conv2dApproximation
 import os
 def load_previous_weights(
@ -14,22 +15,28 @@ def load_previous_weights(
    logging,
    device: torch.device,
    default_dtype: torch.dtype,
    order_id: float | int | None = None,
 ) -> None:
    if order_id is None:
        post_fix: str = ""
    else:
        post_fix = f"_{order_id}"
    for id in range(0, len(network)):
        # #################################################
        # SbS
        # #################################################
-        if isinstance(network[id], SbS) is True:
+        if isinstance(network[id], SbSLayer) is True:
-            # Are there weights that overwrite the initial weights?
+            filename_wilcard = os.path.join(
-            file_to_load = glob.glob(overload_path + "/Weight_L" + str(id) + "_*.npy")
+                overload_path, f"Weight_L{id}_*{post_fix}.npy"
            )
            file_to_load = glob.glob(filename_wilcard)
            if len(file_to_load) > 1:
-                raise Exception(
+                raise Exception(f"Too many previous weights files {filename_wilcard}")
                    f"Too many previous weights files {overload_path}/Weight_L{id}*.npy"
                )
            if len(file_to_load) == 1:
                network[id].weights = torch.tensor(
@ -45,13 +52,13 @@ def load_previous_weights(
            # Conv2d weights
            # #################################################
-            # Are there weights that overwrite the initial weights?
+            filename_wilcard = os.path.join(
-            file_to_load = glob.glob(overload_path + "/Weight_L" + str(id) + "_*.npy")
+                overload_path, f"Weight_L{id}_*{post_fix}.npy"
            )
            file_to_load = glob.glob(filename_wilcard)
            if len(file_to_load) > 1:
-                raise Exception(
+                raise Exception(f"Too many previous weights files {filename_wilcard}")
                    f"Too many previous weights files {overload_path}/Weight_L{id}*.npy"
                )
            if len(file_to_load) == 1:
                network[id]._parameters["weight"].data = torch.tensor(
@ -65,13 +72,13 @@ def load_previous_weights(
            # Conv2d bias
            # #################################################
-            # Are there biases that overwrite the initial weights?
+            filename_wilcard = os.path.join(
-            file_to_load = glob.glob(overload_path + "/Bias_L" + str(id) + "_*.npy")
+                overload_path, f"Bias_L{id}_*{post_fix}.npy"
            )
            file_to_load = glob.glob(filename_wilcard)
            if len(file_to_load) > 1:
-                raise Exception(
+                raise Exception(f"Too many previous weights files {filename_wilcard}")
                    f"Too many previous weights files {overload_path}/Weight_L{id}*.npy"
                )
            if len(file_to_load) == 1:
                network[id]._parameters["bias"].data = torch.tensor(
@ -87,13 +94,13 @@ def load_previous_weights(
            # Approximate Conv2d weights
            # #################################################
-            # Are there weights that overwrite the initial weights?
+            filename_wilcard = os.path.join(
-            file_to_load = glob.glob(overload_path + "/Weight_L" + str(id) + "_*.npy")
+                overload_path, f"Weight_L{id}_*{post_fix}.npy"
            )
            file_to_load = glob.glob(filename_wilcard)
            if len(file_to_load) > 1:
-                raise Exception(
+                raise Exception(f"Too many previous weights files {filename_wilcard}")
                    f"Too many previous weights files {overload_path}/Weight_L{id}*.npy"
                )
            if len(file_to_load) == 1:
                network[id].weights.data = torch.tensor(
@ -107,13 +114,13 @@ def load_previous_weights(
            # Approximate Conv2d bias
            # #################################################
-            # Are there biases that overwrite the initial weights?
+            filename_wilcard = os.path.join(
-            file_to_load = glob.glob(overload_path + "/Bias_L" + str(id) + "_*.npy")
+                overload_path, f"Bias_L{id}_*{post_fix}.npy"
            )
            file_to_load = glob.glob(filename_wilcard)
            if len(file_to_load) > 1:
-                raise Exception(
+                raise Exception(f"Too many previous weights files {filename_wilcard}")
                    f"Too many previous weights files {overload_path}/Weight_L{id}*.npy"
                )
            if len(file_to_load) == 1:
                network[id].bias.data = torch.tensor(
@ -127,13 +134,13 @@ def load_previous_weights(
        # SplitOnOffLayer
        # #################################################
        if isinstance(network[id], SplitOnOffLayer) is True:
-            # Are there weights that overwrite the initial weights?
+            filename_wilcard = os.path.join(
-            file_to_load = glob.glob(overload_path + "/Mean_L" + str(id) + "_*.npy")
+                overload_path, f"Mean_L{id}_*{post_fix}.npy"
            )
            file_to_load = glob.glob(filename_wilcard)
            if len(file_to_load) > 1:
-                raise Exception(
+                raise Exception(f"Too many previous mean files {filename_wilcard}")
                    f"Too many previous mean files {overload_path}/Mean_L{id}*.npy"
                )
            if len(file_to_load) == 1:
                network[id].mean = torch.tensor(
--- a/network/loop_train_test.py
+++ b/network/loop_train_test.py
@ -3,7 +3,7 @@ import time
 from network.Parameter import Config
 from torch.utils.tensorboard import SummaryWriter
-from network.SbS import SbS
+from network.SbSLayer import SbSLayer
 from network.save_weight_and_bias import save_weight_and_bias
 from network.SbSReconstruction import SbSReconstruction
@ -19,7 +19,7 @@ def add_weight_and_bias_to_histogram(
        # ################################################
        # Log the SbS Weights
        # ################################################
-        if isinstance(network[id], SbS) is True:
+        if isinstance(network[id], SbSLayer) is True:
            if network[id]._w_trainable is True:
                try:
@ -175,7 +175,7 @@ def forward_pass_train(
        .to(device=device)
    )
    for id in range(0, len(network)):
-        if isinstance(network[id], SbS) is True:
+        if isinstance(network[id], SbSLayer) is True:
            h_collection.append(network[id](h_collection[-1], labels))
        else:
            h_collection.append(network[id](h_collection[-1]))
@ -203,7 +203,7 @@ def forward_pass_test(
    )
    for id in range(0, len(network)):
        if (cfg.extract_noisy_pictures is True) or (overwrite_number_of_spikes != -1):
-            if isinstance(network[id], SbS) is True:
+            if isinstance(network[id], SbSLayer) is True:
                h_collection.append(
                    network[id](
                        h_collection[-1],
@ -228,7 +228,7 @@ def run_optimizer(
    cfg: Config,
 ) -> None:
    for id in range(0, len(network)):
-        if isinstance(network[id], SbS) is True:
+        if isinstance(network[id], SbSLayer) is True:
            network[id].update_pre_care()
    for optimizer_item in optimizer:
@ -236,7 +236,7 @@ def run_optimizer(
            optimizer_item.step()
    for id in range(0, len(network)):
-        if isinstance(network[id], SbS) is True:
+        if isinstance(network[id], SbSLayer) is True:
            network[id].update_after_care(
                cfg.learning_parameters.learning_rate_threshold_w
                / float(
@ -288,11 +288,11 @@ def run_lr_scheduler(
 def deal_with_gradient_scale(epoch_id: int, mini_batch_number: int, network):
    if (epoch_id == 0) and (mini_batch_number == 0):
        for id in range(0, len(network)):
-            if isinstance(network[id], SbS) is True:
+            if isinstance(network[id], SbSLayer) is True:
                network[id].after_batch(True)
    else:
        for id in range(0, len(network)):
-            if isinstance(network[id], SbS) is True:
+            if isinstance(network[id], SbSLayer) is True:
                network[id].after_batch()
@ -309,6 +309,7 @@ def loop_train(
    tb: SummaryWriter,
    lr_scheduler,
    last_test_performance: float,
    order_id: float | int | None = None,
 ) -> tuple[float, float, float, float]:
    correct_in_minibatch: int = 0
@ -529,7 +530,10 @@ def loop_train(
                # Save the Weights and Biases
                # ################################################
                save_weight_and_bias(
-                    cfg=cfg, network=network, iteration_number=epoch_id
+                    cfg=cfg,
                    network=network,
                    iteration_number=epoch_id,
                    order_id=order_id,
                )
                # ################################################
--- a/network/save_weight_and_bias.py
+++ b/network/save_weight_and_bias.py
@ -3,14 +3,23 @@ import torch
 from network.Parameter import Config
 import numpy as np
-from network.SbS import SbS
+from network.SbSLayer import SbSLayer
 from network.SplitOnOffLayer import SplitOnOffLayer
 from network.Conv2dApproximation import Conv2dApproximation
 import os
 def save_weight_and_bias(
-    cfg: Config, network: torch.nn.modules.container.Sequential, iteration_number: int
+    cfg: Config,
    network: torch.nn.modules.container.Sequential,
    iteration_number: int,
    order_id: float | int | None = None,
 ) -> None:
    if order_id is None:
        post_fix: str = ""
    else:
        post_fix = f"_{order_id}"
    for id in range(0, len(network)):
@ -18,11 +27,14 @@ def save_weight_and_bias(
        # Save the SbS Weights
        # ################################################
-        if isinstance(network[id], SbS) is True:
+        if isinstance(network[id], SbSLayer) is True:
            if network[id]._w_trainable is True:
                np.save(
-                    f"{cfg.weight_path}/Weight_L{id}_S{iteration_number}.npy",
+                    os.path.join(
                        cfg.weight_path,
                        f"Weight_L{id}_S{iteration_number}{post_fix}.npy",
                    ),
                    network[id].weights.detach().cpu().numpy(),
                )
@ -34,13 +46,18 @@ def save_weight_and_bias(
            if network[id]._w_trainable is True:
                # Save the new values
                np.save(
-                    f"{cfg.weight_path}/Weight_L{id}_S{iteration_number}.npy",
+                    os.path.join(
                        cfg.weight_path,
                        f"Weight_L{id}_S{iteration_number}{post_fix}.npy",
                    ),
                    network[id]._parameters["weight"].data.detach().cpu().numpy(),
                )
                # Save the new values
                np.save(
-                    f"{cfg.weight_path}/Bias_L{id}_S{iteration_number}.npy",
+                    os.path.join(
                        cfg.weight_path, f"Bias_L{id}_S{iteration_number}{post_fix}.npy"
                    ),
                    network[id]._parameters["bias"].data.detach().cpu().numpy(),
                )
@ -52,20 +69,28 @@ def save_weight_and_bias(
            if network[id]._w_trainable is True:
                # Save the new values
                np.save(
-                    f"{cfg.weight_path}/Weight_L{id}_S{iteration_number}.npy",
+                    os.path.join(
                        cfg.weight_path,
                        f"Weight_L{id}_S{iteration_number}{post_fix}.npy",
                    ),
                    network[id].weights.data.detach().cpu().numpy(),
                )
                # Save the new values
                if network[id].bias is not None:
                    np.save(
-                        f"{cfg.weight_path}/Bias_L{id}_S{iteration_number}.npy",
+                        os.path.join(
                            cfg.weight_path,
                            f"Bias_L{id}_S{iteration_number}{post_fix}.npy",
                        ),
                        network[id].bias.data.detach().cpu().numpy(),
                    )
        if isinstance(network[id], SplitOnOffLayer) is True:
            np.save(
-                f"{cfg.weight_path}/Mean_L{id}_S{iteration_number}.npy",
+                os.path.join(
                    cfg.weight_path, f"Mean_L{id}_S{iteration_number}{post_fix}.npy"
                ),
                network[id].mean.detach().cpu().numpy(),
            )