2022-04-30 02:07:09 +02:00
|
|
|
# MIT License
|
|
|
|
# Copyright 2022 University of Bremen
|
|
|
|
#
|
|
|
|
# Permission is hereby granted, free of charge, to any person obtaining
|
|
|
|
# a copy of this software and associated documentation files (the "Software"),
|
|
|
|
# to deal in the Software without restriction, including without limitation
|
|
|
|
# the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
|
|
# and/or sell copies of the Software, and to permit persons to whom the
|
|
|
|
# Software is furnished to do so, subject to the following conditions:
|
|
|
|
#
|
|
|
|
# The above copyright notice and this permission notice shall be included
|
|
|
|
# in all copies or substantial portions of the Software.
|
|
|
|
#
|
|
|
|
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
|
|
|
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
|
|
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
|
|
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
|
|
|
|
# DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
|
|
|
|
# OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR
|
|
|
|
# THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
|
|
#
|
|
|
|
#
|
|
|
|
# David Rotermund ( davrot@uni-bremen.de )
|
|
|
|
#
|
|
|
|
#
|
|
|
|
# Release history:
|
|
|
|
# ================
|
|
|
|
# 1.0.0 -- 01.05.2022: first release
|
|
|
|
#
|
|
|
|
#
|
|
|
|
|
|
|
|
# %%
|
|
|
|
from dataclasses import dataclass, field
|
|
|
|
import numpy as np
|
|
|
|
import torch
|
|
|
|
import os
|
|
|
|
|
|
|
|
|
|
|
|
@dataclass
class Network:
    """Structural parameters of the network.

    Stores the number of output neurons plus a set of list-valued layer
    settings. Every list field defaults to a fresh, empty list per instance.
    """

    number_of_output_neurons: int = 0

    # Neuron numbers and pooling flags.
    # NOTE(review): presumably one entry per layer -- confirm against the
    # code that builds the network from this config.
    forward_neuron_numbers: list[list[int]] = field(default_factory=list)
    is_pooling_layer: list[bool] = field(default_factory=list)

    # Kernel geometry settings (kernel size, strides, dilation, padding).
    forward_kernel_size: list[list[int]] = field(default_factory=list)
    strides: list[list[int]] = field(default_factory=list)
    dilation: list[list[int]] = field(default_factory=list)
    padding: list[list[int]] = field(default_factory=list)

    # Boolean switches concerning the weights (w) and eps_xy.
    w_trainable: list[bool] = field(default_factory=list)
    eps_xy_trainable: list[bool] = field(default_factory=list)
    eps_xy_mean: list[bool] = field(default_factory=list)
|
|
|
|
|
|
|
|
|
|
|
|
@dataclass
class LearningParameters:
    """Parameters required for training."""

    learning_active: bool = True

    # Coefficients of the MSE and KL-divergence loss terms.
    loss_coeffs_mse: float = 0.5
    loss_coeffs_kldiv: float = 1.0

    # Optimizer selection and learning rates for the weights (w) and eps_xy.
    # NOTE(review): the -1.0 defaults presumably mean "not set" -- confirm
    # against the code that consumes these values.
    optimizer_name: str = "Adam"
    learning_rate_gamma_w: float = -1.0
    learning_rate_gamma_eps_xy: float = -1.0
    learning_rate_threshold_w: float = 1e-05
    learning_rate_threshold_eps_xy: float = 1e-05

    # Learning-rate scheduler selection and its settings for the weights.
    lr_schedule_name: str = "ReduceLROnPlateau"
    lr_scheduler_use_performance: bool = True
    lr_scheduler_factor_w: float = 0.75
    lr_scheduler_patience_w: int = -1
    lr_scheduler_tau_w: int = 10

    # The same scheduler settings for eps_xy.
    lr_scheduler_factor_eps_xy: float = 0.75
    lr_scheduler_patience_eps_xy: int = -1
    lr_scheduler_tau_eps_xy: int = 10

    number_of_batches_for_one_update: int = 1
    overload_path: str = "./Previous"

    # Initialisation-related values. The field name "eps_xy_intitial" is
    # misspelled but is kept as-is because it is part of the public interface.
    weight_noise_amplitude: float = 0.01
    eps_xy_intitial: float = 0.1

    # Testing while learning.
    test_every_x_learning_steps: int = 50
    test_during_learning: bool = True

    alpha_number_of_iterations: int = 0
|
|
|
|
|
|
|
|
|
|
|
|
@dataclass
class Augmentation:
    """Parameters used for data augmentation."""

    # Crop width, given in pixels.
    crop_width_in_pixel: int = 2

    # NOTE(review): presumably the probability of flipping an image --
    # confirm against the augmentation code.
    flip_p: float = 0.5

    # Jitter settings for brightness, contrast, saturation and hue.
    jitter_brightness: float = 0.5
    jitter_contrast: float = 0.1
    jitter_saturation: float = 0.1
    jitter_hue: float = 0.15

    # Switch for the on/off filter.
    use_on_off_filter: bool = True
|
|
|
|
|
2022-04-30 02:07:09 +02:00
|
|
|
|
|
|
|
@dataclass
class ImageStatistics:
    """(Statistical) information about the input.

    Carries the mean values and the x and y size of the input. Both fields
    default to a fresh, empty list per instance.
    """

    # Mean values of the input.
    mean: list[float] = field(default_factory=list)

    # x and y size of the input.
    the_size: list[int] = field(default_factory=list)
|
|
|
|
|
|
|
|
|
|
|
|
@dataclass
class Config:
    """Master config class.

    Bundles the four sub-configurations (network structure, learning
    parameters, augmentation, image statistics) with the run-level settings
    defined below.

    Creating an instance has side effects, see ``__post_init__``: the
    configured directories are created on disk and ``batch_size`` is
    adjusted to a multiple of ``number_of_cpu_processes``.
    """

    # Sub classes
    network_structure: Network = field(default_factory=Network)
    learning_parameters: LearningParameters = field(default_factory=LearningParameters)
    augmentation: Augmentation = field(default_factory=Augmentation)
    image_statistics: ImageStatistics = field(default_factory=ImageStatistics)

    batch_size: int = field(default=500)
    data_mode: str = field(default="")

    learning_step: int = field(default=0)
    learning_step_max: int = field(default=10000)

    # Values < 1 are replaced by the detected CPU count in __post_init__.
    number_of_cpu_processes: int = field(default=-1)

    number_of_spikes: int = field(default=0)
    # A negative value disables the cooldown in get_epsilon_t().
    cooldown_after_number_of_spikes: int = field(default=-1)

    # Directories; all four are created in __post_init__ if missing.
    weight_path: str = field(default="./Weights/")
    eps_xy_path: str = field(default="./EpsXY/")
    data_path: str = field(default="./")
    results_path: str = field(default="./Results")

    # Divisor applied to the epsilon time series from the cooldown index on.
    reduction_cooldown: float = field(default=25.0)
    epsilon_0: float = field(default=1.0)

    def __post_init__(self) -> None:
        """Finalize the configuration after the dataclass init.

        * Determines the number of CPU processes: a value < 1 is replaced by
          ``os.cpu_count()``, or by 1 if the count cannot be determined.
        * Creates the weight, eps_xy, data and results directories.
        * Rounds ``batch_size`` down to a multiple of
          ``number_of_cpu_processes``, but never below one pattern per
          process.
        """
        if self.number_of_cpu_processes < 1:
            # os.cpu_count() returns None when the count is undeterminable.
            self.number_of_cpu_processes = os.cpu_count() or 1

        for directory in (
            self.weight_path,
            self.eps_xy_path,
            self.data_path,
            self.results_path,
        ):
            os.makedirs(directory, exist_ok=True)

        processes = self.number_of_cpu_processes
        rounded_down = (self.batch_size // processes) * processes
        # The builtin max is sufficient for two scalars; int() keeps the
        # result a plain Python int as before.
        self.batch_size = int(max(rounded_down, processes))

    def get_epsilon_t(self) -> torch.Tensor:
        """Generates the time series of the basic epsilon.

        The series has ``number_of_spikes`` entries, all 1.0. If
        ``0 <= cooldown_after_number_of_spikes < number_of_spikes``, every
        entry from index ``cooldown_after_number_of_spikes`` onwards is
        divided by ``reduction_cooldown``.

        Returns:
            A 1-D float32 tensor of length ``number_of_spikes``.
        """
        np_epsilon_t: np.ndarray = np.ones((self.number_of_spikes), dtype=np.float32)

        cooldown_start = self.cooldown_after_number_of_spikes
        if 0 <= cooldown_start < self.number_of_spikes:
            # The array has exactly number_of_spikes entries, so the slice
            # up to number_of_spikes covers the whole tail.
            np_epsilon_t[cooldown_start : self.number_of_spikes] /= self.reduction_cooldown

        return torch.tensor(np_epsilon_t)

    def get_update_after_x_pattern(self) -> int:
        """Tells us after how many pattern we need to update the weights.

        Returns:
            ``batch_size`` multiplied by
            ``learning_parameters.number_of_batches_for_one_update``.
        """
        return (
            self.batch_size * self.learning_parameters.number_of_batches_for_one_update
        )
|