robintux/utils.py

## utils.py
import numpy as np
import copy
import time
import signal

import matplotlib.pyplot as plt
from graphviz import Digraph

from pandas import DataFrame
from sklearn.metrics import r2_score, mean_absolute_error, mean_squared_error, log_loss

import torch
from torch.autograd import Variable
import torch.nn.init as init
import torch.utils.data

from pycuda import autoinit, driver


#######################################################################################################################

def gpu_stat():
    """Print name, memory size, CUDA version and free-memory share of the GPU.

    Returns ``None`` without printing anything when
    ``torch.cuda.is_available()`` is false.  Device details are read through
    the module-level PyCUDA ``autoinit`` / ``driver`` imports.
    """
    if not torch.cuda.is_available():
        return

    def pretty_bytes(num_bytes, precision=1):
        """Format a byte count using the largest binary unit that fits."""
        if num_bytes == 1:
            return '1 byte'
        units = ((1<<50, 'PB'), (1<<40, 'TB'), (1<<30, 'GB'),
                 (1<<20, 'MB'), (1<<10, 'kB'), (1, 'bytes'))
        for factor, suffix in units:
            if num_bytes >= factor:
                break
        # Values below 1 fall through with the last entry (factor 1, 'bytes').
        return '%.*f%s' % (precision, num_bytes / factor, suffix)

    device = autoinit.device
    # Query once so that free and total belong to the same snapshot.
    free_mem, total_mem = driver.mem_get_info()

    print()
    print( 'GPU Name: %s' % device.name())
    print( 'GPU Memory: %s' % pretty_bytes(device.total_memory()))
    print( 'CUDA Version: %s' % str(driver.get_version()))
    print( 'GPU Free/Total Memory: %d%%' % ((free_mem / total_mem) * 100))

#####################################################################################################################

class HYPERPARAMETERS(dict):
    """
    Dictionary of hyperparameters whose entries are also accessible as
    attributes.

    Example:
        H = HYPERPARAMETERS({ 'parameter_name' : parameter_value, ... })
        access using H.parameter_name or by H['parameter_name']

    Attribute assignment (``H.name = value``) stores the value as a dictionary
    item; nothing is ever written to the instance ``__dict__``.
    """
    def __init__(self, dictionary):
        super(HYPERPARAMETERS, self).__init__(dictionary)

    def __getattr__(self, name):
        # Only reached when regular attribute lookup fails.  A missing key has
        # to surface as AttributeError (not KeyError) so that hasattr(),
        # getattr(obj, name, default) and copy.deepcopy(), which probe for
        # optional attributes, keep working.
        try:
            return self[name]
        except KeyError:
            raise AttributeError(name)

    def __setattr__(self, name, value):
        self[name] = value

    def __getstate__(self):
        # Plain-dict snapshot of the items; this is the pickled state.
        return dict(self)

    def __setstate__(self, d):
        # Restore the items in place (rebinding ``self`` would be a no-op).
        self.update(d)

#####################################################################################################################

def to_np(x):
    """Return the data of tensor/Variable ``x`` as a NumPy array, via a CPU copy."""
    host_tensor = x.data.cpu()
    return host_tensor.numpy()

def to_var(x):
    """Wrap ``x`` in a ``Variable``, moving it to the GPU first when CUDA is available."""
    tensor = x.cuda() if torch.cuda.is_available() else x
    return Variable(tensor)

#####################################################################################################################

def save_checkpoint(state, filename='./chkp/checkpoint.tar'):
    """Serialize a training checkpoint with ``torch.save`` and log it.

    Example:
        save_checkpoint({
            'model': type(model).__name__,
            'epoch': epoch + 1,
            'state_dict': model.state_dict(),
            'optimizer': optimizer.state_dict(),
        })

    Args:
        state: object to store; it is indexed with ``'epoch'`` for the log
            line, so a mapping without that key raises ``KeyError`` after
            the file has been written.
        filename: destination path.  Missing parent directories are created
            so the default ``./chkp/`` location works on a fresh checkout.
    """
    import os  # local import: this module does not import os at file level

    if isinstance(filename, (str, os.PathLike)):
        parent = os.path.dirname(filename)
        if parent:
            os.makedirs(parent, exist_ok=True)

    torch.save(state, filename)
    print("=> saved checkpoint '{}' (epoch {})".format(filename, state['epoch']))


def load_checkpoint(model, optimizer=None, filename='./chkp/checkpoint.tar', map_location=None):
    """Restore model (and optionally optimizer) state from a checkpoint file.

    Args:
        model: module whose ``load_state_dict`` receives ``checkpoint['state_dict']``.
        optimizer: when given, its ``load_state_dict`` receives
            ``checkpoint['optimizer']``.
        filename: path of the file written by ``torch.save``.
        map_location: forwarded to ``torch.load``.  When left as ``None`` and
            CUDA is unavailable, tensors are mapped to the CPU so that a
            checkpoint saved on a GPU machine can still be loaded.

    Returns:
        The loaded checkpoint object.

    NOTE: ``torch.load`` unpickles the file; only load checkpoints from
    trusted sources.
    """
    if map_location is None and not torch.cuda.is_available():
        map_location = 'cpu'

    checkpoint = torch.load(filename, map_location=map_location)
    model.load_state_dict(checkpoint['state_dict'])
    if optimizer is not None:
        optimizer.load_state_dict(checkpoint['optimizer'])
    print("=> loaded checkpoint '{}' (epoch {})".format(filename, checkpoint['epoch']))
    return checkpoint

#####################################################################################################################

# https://github.com/robintibor/braindecode/blob/master/braindecode/torch_ext/init.py

def glorot_weight_zero_bias(model):
    """
    Initialize parameters of all modules
    by initializing weights with glorot uniform/xavier initialization,
    and setting biases to zero.
    Weights from batch norm layers are set to 1.

    Weights with fewer than two dimensions that do not belong to a batch norm
    layer are left untouched: ``xavier_uniform_`` cannot compute fan-in/fan-out
    for them and would raise.

    Parameters
    ----------
    model: Module
    """
    for module in model.modules():
        weight = getattr(module, 'weight', None)
        if weight is not None:
            if 'BatchNorm' in module.__class__.__name__:
                init.constant_(weight, 1)
            elif weight.dim() >= 2:
                init.xavier_uniform_(weight, gain=1)
        bias = getattr(module, 'bias', None)
        if bias is not None:
            init.constant_(bias, 0)

#####################################################################################################################

# https://discuss.pytorch.org/t/solved-learning-rate-decay/6825/4

def adjust_learning_rate(optimizer, epoch, init_lr=0.001, lr_decay_epoch=30):
    """Sets the learning rate to the initial LR decayed by 10 every lr_decay_epoch epochs.

    Args:
        optimizer: optimizer whose parameter groups receive the new rate.
        epoch: current epoch index; ``epoch // lr_decay_epoch`` is the number
            of decay steps applied.
        init_lr: learning rate before any decay.
        lr_decay_epoch: number of epochs between two decay steps.

    Returns:
        The learning rate that was written to every parameter group.
    """
    lr = init_lr * (0.1**(epoch // lr_decay_epoch))

    # Write to the live param_groups: optimizer.state_dict() hands back
    # copies of the groups, so changing those never reaches the optimizer.
    for param_group in optimizer.param_groups:
        param_group['lr'] = lr

    return lr

#####################################################################################################################

class PlotLosses(object):
    """
    Plots the train loss and a prediction scatter in a two-panel matplotlib
    figure during training, whenever plot_loss and plot_prediction are called
    inside the epoch loop.

    ``ax[0]`` holds the loss curve, ``ax[1]`` the prediction scatter.
    """
    def __init__(self, figsize=(12,6)):
        plt.ion()

        self.fig, self.ax = plt.subplots(1,2,figsize=figsize)
        # Handle of the loss curve; created on the first plot_loss call and
        # updated in place afterwards.
        self._loss_line = None

        self.ax[0].set_xlabel("Epoch")
        self.ax[0].set_ylabel("Loss")
        self.ax[0].grid(True)

        self._decorate_prediction_axes()
        self.ax[1].set_ylim([-1,1])

        self.fig.canvas.draw()
        plt.show(block=False)

    def _decorate_prediction_axes(self):
        """Apply the axis labels and grid of the prediction panel."""
        self.ax[1].set_xlabel("X")
        self.ax[1].set_ylabel("Y")
        self.ax[1].grid(True)

    def plot_loss(self, loss, epoch, epochs, lr):
        """Redraw the loss curve.

        Args:
            loss: sequence of loss values so far; the last one is shown in
                the title.
            epoch: current epoch number (title only).
            epochs: total number of epochs (title only).
            lr: current learning rate (title only).
        """
        self.ax[0].set_title("Epoch # " + str(epoch) + "/" + str(epochs)
                             + " Loss # %.4f" % loss[-1] + " LR # %.2e" % lr)

        # Derive x from the data so x and y always have the same length.
        xs = np.arange(len(loss))
        if self._loss_line is None:
            self._loss_line, = self.ax[0].plot(xs, loss)
        else:
            # Update the existing line instead of stacking a new one per call.
            self._loss_line.set_data(xs, loss)
            self.ax[0].relim()
            self.ax[0].autoscale_view()

        self.fig.canvas.draw()
        plt.show(block=False)

    def plot_prediction(self, x, y, x_h, y_h, label1="train", label2="predict"):
        """Replace the prediction panel with scatters of (x, y) and (x_h, y_h)."""
        # Clear this figure's own panel rather than whatever axes is globally
        # current, then restore the labels and grid that cla() resets.
        self.ax[1].cla()
        self._decorate_prediction_axes()
        self.ax[1].set_title("Prediction")
        self.ax[1].scatter (x, y, c='red', label=str(label1), s=1.0, alpha=0.3)
        self.ax[1].scatter (x_h, y_h, c='green', label=str(label2), s=10.0, alpha=0.3)
        self.ax[1].legend()

        self.fig.canvas.draw()
        plt.show(block=False)

    def close(self):
        """Leave interactive mode and close the figure."""
        plt.ioff ()
        plt.close(self.fig)

#####################################################################################################################

# https://github.com/szagoruyko/pytorchviz/blob/master/torchviz/dot.py

def make_dot(var, params=None):
    """ Produces Graphviz representation of PyTorch autograd graph

    Blue nodes are the Variables that require grad, orange are Tensors
    saved for backward in torch.autograd.Function

    Args:
        var: output Variable; the graph is walked starting at ``var.grad_fn``
        params: optional dict of (name, Variable) used to label the nodes
            that require grad.  When omitted, those nodes carry only their
            size.

    Returns:
        The populated ``graphviz.Digraph``.
    """
    # Map tensor identity -> user supplied name.
    param_map = {} if params is None else {id(v): k for k, v in params.items()}

    node_attr = dict(style='filled',
                     shape='box',
                     align='left',
                     fontsize='12',
                     ranksep='0.1',
                     height='0.2')
    dot = Digraph(node_attr=node_attr, graph_attr=dict(size="8,8"))
    seen = set()

    def size_to_str(size):
        return '('+(', ').join(['%d'% v for v in size])+')'

    def add_nodes(var):
        if var not in seen:
            if torch.is_tensor(var):
                dot.node(str(id(var)), size_to_str(var.size()), fillcolor='orange')
            elif hasattr(var, 'variable'):
                u = var.variable
                # Without a params mapping there is no name to show.
                name = '' if params is None else param_map.get(id(u))
                node_name = '%s\n %s' % (name, size_to_str(u.size()))
                dot.node(str(id(var)), node_name, fillcolor='lightblue')
            else:
                dot.node(str(id(var)), str(type(var).__name__))
            seen.add(var)
            if hasattr(var, 'next_functions'):
                for u in var.next_functions:
                    if u[0] is not None:
                        dot.edge(str(id(u[0])), str(id(var)))
                        add_nodes(u[0])
            if hasattr(var, 'saved_tensors'):
                for t in var.saved_tensors:
                    dot.edge(str(id(t)), str(id(var)))
                    add_nodes(t)
    add_nodes(var.grad_fn)
    return dot

#####################################################################################################################

def layer_weight(data):
    """Summarise ``data``: mean, standard deviation and a 50-bin histogram.

    Returns a dict with keys 'mean', 'std', 'hist' (bin counts),
    'center' (bin midpoints) and 'width' (bin widths).
    """
    counts, edges = np.histogram(data, bins=50)
    lower, upper = edges[:-1], edges[1:]

    summary = dict(mean=np.mean(data), std=np.std(data))
    summary['hist'] = counts
    summary['center'] = (lower + upper) / 2
    summary['width'] = np.diff(edges)
    return summary

def layer_stats(model):
    """Show weight and bias histograms for every module that has both attributes.

    One two-panel figure is created per qualifying module: the left panel
    shows the weight histogram, the right panel the bias histogram.  A panel
    stays empty when the corresponding parameter is ``None``.
    """
    for module in model.modules():
        if not (hasattr(module, 'weight') and hasattr(module, 'bias')):
            continue

        fig, ax = plt.subplots(1,2,figsize=(8,3))

        if module.weight is not None:
            w = layer_weight(to_np(module.weight))
            ax[0].set_title("Weight - Mean # %.4f" % w['mean'] + " STD # %.2e" % w['std'])
            ax[0].bar(w['center'], w['hist'], align='center', width=w['width'])

        if module.bias is not None:
            b = layer_weight(to_np(module.bias))
            ax[1].set_title("Bias - Mean # %.4f" % b['mean'] + " STD # %.2e" % b['std'])
            ax[1].bar(b['center'], b['hist'], align='center', width=b['width'])

        # Show every figure, including those of modules built with bias=None.
        plt.show()

#####################################################################################################################

# https://stackoverflow.com/questions/42480111/model-summary-in-pytorch
# https://github.com/fchollet/keras/blob/master/keras/utils/layer_utils.py

def print_summary(model, line_length=None, positions=None, print_fn=print):
    """Prints a summary of a model.
    # Arguments
        model: model instance.
        line_length: Total length of printed lines
            (e.g. set this to adapt the display to different
            terminal window sizes). Defaults to 65.
        positions: Relative or absolute positions of log elements in each line.
            If not provided, defaults to `[.45, .85, 1.]`.
        print_fn: Print function to use.
            It will be called on each line of the summary.
            You can set it to a custom function
            in order to capture the string summary.

    Only modules whose class path contains 'torch' and not 'container' get a
    row.  Parameters are counted as trainable according to their
    ``requires_grad`` flag.
    """

    line_length = line_length or 65
    positions = positions or [.45, .85, 1.]
    if positions[-1] <= 1:
        # Relative positions: convert to absolute column indices.
        positions = [int(line_length * p) for p in positions]
    # header names for the different log elements
    to_display = ['Layer (type)', 'Shape', 'Param #']

    def print_row(fields, positions):
        """Lay the fields out in columns ending at the given positions."""
        line = ''
        for i, field in enumerate(fields):
            if i > 0:
                # Guarantee a blank between two adjacent columns.
                line = line[:-1] + ' '
            line += str(field)
            line = line[:positions[i]]
            line += ' ' * (positions[i] - len(line))
        print_fn(line)

    print_fn( "Summary for model: " + model.__class__.__name__)
    print_fn('_' * line_length)
    print_row(to_display, positions)
    print_fn('=' * line_length)

    def print_module_summary(name, module):
        """Print one row: module name/class, parameter shapes, parameter count."""
        module_params = list(module.parameters())
        count_params = sum(p.numel() for p in module_params)
        output_shape = tuple(tuple(p.size()) for p in module_params)
        cls_name = module.__class__.__name__
        fields = [name + ' (' + cls_name + ')', output_shape, count_params]
        print_row(fields, positions)

    def is_listed(module):
        cls_name = str(module.__class__)
        return 'torch' in cls_name and 'container' not in cls_name

    # Filter first so the closing '=' rule follows the last row actually
    # printed, even when the final registered module is filtered out.
    rows = [(name, module) for name, module in model.named_modules()
            if is_listed(module)]
    for idx, (name, module) in enumerate(rows):
        print_module_summary(name, module)
        if idx == len(rows) - 1:
            print_fn('=' * line_length)
        else:
            print_fn('_' * line_length)

    trainable_count = 0
    non_trainable_count = 0
    for param in model.parameters():
        # Frozen parameters are the ones with requires_grad switched off,
        # whatever they are called.
        if param.requires_grad:
            trainable_count += param.numel()
        else:
            non_trainable_count += param.numel()

    print_fn('Total params:         {:,}'.format(trainable_count + non_trainable_count))
    print_fn('Trainable params:     {:,}'.format(trainable_count))
    print_fn('Non-trainable params: {:,}'.format(non_trainable_count))
    print_fn('_' * line_length)

#####################################################################################################################

def stat_summary(y, y_hat, n, p):
    """Print a dated report of regression metrics for predictions ``y_hat``.

    Args:
        y: reference values.
        y_hat: predicted values.
        n: number of cases (printed only).
        p: number of parameters (printed only).

    The report contains MSE, MAE, RMSE and R-squared, computed with the
    scikit-learn metric functions imported by this module.
    """
    # local time & date
    t = time.localtime()

    mse = mean_squared_error(y, y_hat)
    mae = mean_absolute_error(y, y_hat)

    # printing output to screen
    print( '\n==============================================================================' )
    print(  "Date: ", time.strftime("%a, %d %b %Y",t) )
    print(  "Time: ", time.strftime("%H:%M:%S",t) )
    print( '==============================================================================')
    print( 'Parameters:               % 5.0f' % p + '           Cases: %5.0f' % n )
    print( '==============================================================================' )
    print( 'Models stats' )
    print( '==============================================================================' )
    print( 'Mean Squared Error        % -5.6f         ' % mse )
    # This row has to report the MAE, not a second copy of the MSE.
    print( 'Mean Absolute Error       % -5.6f         ' % mae )
    print( 'Root Mean Squared Error   % -5.6f         ' % np.sqrt(mse) )
    print( 'R-squared                 % -5.6f         ' % r2_score(y, y_hat) )
    print( '==============================================================================')

#####################################################################################################################

# https://stackoverflow.com/questions/842557/how-to-prevent-a-block-of-code-from-being-interrupted-by-keyboardinterrupt-in-py

class DelayedKeyboardInterrupt(object):
    """Context manager that postpones SIGINT until the ``with`` block has ended.

    While the block runs, SIGINT is only recorded.  On exit the previous
    handler is restored and, if a signal arrived in the meantime, it is
    handed to that handler.
    """
    def __init__(self):
        self.signal_received = None
        self.old_handler = None

    def __enter__(self):
        self.signal_received = None
        self.old_handler = signal.signal(signal.SIGINT, self.handler)
        return self

    def handler(self, sig, frame):
        """Record the signal instead of acting on it."""
        self.signal_received = (sig, frame)
        print('SIGINT received. Delaying KeyboardInterrupt.')

    def __exit__(self, type, value, traceback):
        previous = self.old_handler
        # signal.signal() reports None for a handler that was not installed
        # from Python; None cannot be passed back, so fall back to SIG_DFL.
        signal.signal(signal.SIGINT,
                      signal.SIG_DFL if previous is None else previous)
        if self.signal_received:
            sig, frame = self.signal_received
            if callable(previous):
                previous(sig, frame)
            elif previous == signal.SIG_DFL:
                # No Python callable to invoke: re-deliver the signal so the
                # restored default disposition handles it.
                import os
                os.kill(os.getpid(), sig)
            # Otherwise (SIG_IGN or unknown) there is nothing to call.

#####################################################################################################################

def residual_plots(y, y_hat, figsize=(16,4)):
    """Draw three residual diagnostics side by side.

    The residuals ``y - y_hat`` are shown as a scatter against the
    predictions, as a histogram and as a kernel density estimate.
    """
    resid_frame = DataFrame(y - y_hat)

    _, panels = plt.subplots(1, 3, figsize=figsize)
    scatter_ax, hist_ax, density_ax = panels[0], panels[1], panels[2]

    # residuals against predictions
    scatter_ax.scatter(y_hat, resid_frame, s=1.0, alpha=0.3)
    scatter_ax.set_xlabel("Predicted Y")
    scatter_ax.set_ylabel("Residual")
    scatter_ax.set_title("Scatter Plot")

    # distribution of the residuals as counts
    resid_frame.plot(kind='hist', ax=hist_ax)
    hist_ax.set_title('Histogram Plot')
    hist_ax.set_ylabel('Count')
    hist_ax.set_xlabel('Residuals')

    # smoothed distribution of the residuals
    resid_frame.plot(kind='kde', ax=density_ax)
    density_ax.set_title('Density Plot')

#####################################################################################################################

def plot_prediction(x, y, x_h, y_h, title="", label1="train", label2="validate"):
    """Plot two curves on the current axes, each sorted by its x values.

    (x, y) is drawn in red with ``label1``, (x_h, y_h) in green with
    ``label2``.  The current axes are cleared first.
    """
    plt.cla()
    plt.title(title)

    first_pairs = sorted(zip(x, y))
    second_pairs = sorted(zip(x_h, y_h))
    xs_1, ys_1 = zip(*first_pairs)
    xs_2, ys_2 = zip(*second_pairs)

    plt.plot (xs_1, ys_1, c='red', label=str(label1))
    plt.plot (xs_2, ys_2, c='green', label=str(label2))
    plt.legend()


#######################################################################################################################

class Stopping(object):
    """
    Class implement some of regularization techniques to avoid over-training as described in
    http://page.mi.fu-berlin.de/prechelt/Biblio/stop_tricks1997.pdf

    Tracks the best validation score seen so far, keeps a snapshot of the
    model state at that point and signals a stop once ``patience`` epochs
    have passed without improvement.

    NOTE: the best score starts at -1, so validation scores are assumed to be
    "higher is better" and above -1; lower scores are never recorded.
    """
    def __init__(self, model, patience=50):
        self.model = model
        self.patience = patience

        self.best_score = -1
        self.best_score_epoch = 0
        self.best_score_model = None
        self.best_score_state = None

    def step(self, epoch, train_score, valid_score):
        """Record the epoch result and tell whether training should stop.

        Returns ``False`` when ``valid_score`` is a new best, otherwise
        ``True`` exactly when more than ``patience`` epochs have passed since
        the best epoch.  ``train_score`` is accepted but not used.
        """
        if valid_score > self.best_score:
            self.best_score = valid_score
            self.best_score_epoch = epoch
            # Deep copy: state_dict() refers to the live parameter tensors,
            # which keep changing as training continues.
            self.best_score_state = copy.deepcopy(self.model.state_dict())
            return False
        return self.best_score_epoch + self.patience < epoch

    def state_dict(self):
        """Return the tracker's bookkeeping, including the best model snapshot."""
        return {
            'patience' : self.patience,
            'best_score' : self.best_score,
            'best_score_epoch' : self.best_score_epoch,
            'best_score_model' : self.best_score_model,
            'best_score_state' : self.best_score_state,
        }

    def load_state_dict(self, state_dict):
        """Restore bookkeeping produced by ``state_dict``.

        'best_score_state' is optional so that dictionaries saved without it
        can still be loaded.
        """
        self.patience = state_dict['patience']
        self.best_score  = state_dict['best_score']
        self.best_score_epoch = state_dict['best_score_epoch']
        self.best_score_model = state_dict['best_score_model']
        self.best_score_state = state_dict.get('best_score_state')

    def __repr__(self):
        fmt_str = self.__class__.__name__ + '\n'
        fmt_str += '    Patience: {}\n'.format(self.patience)
        fmt_str += '    Best Score: {:.4f}\n'.format(self.best_score)
        fmt_str += '    Epoch of Best Score: {}\n'.format(self.best_score_epoch)
        return fmt_str

#######################################################################################################################
	import numpy as np
	import copy
	import time
	import signal

	import matplotlib.pyplot as plt
	from graphviz import Digraph

	from pandas import DataFrame
	from sklearn.metrics import r2_score, mean_absolute_error, mean_squared_error, log_loss

	import torch
	from torch.autograd import Variable
	import torch.nn.init as init
	import torch.utils.data

	from pycuda import autoinit, driver


	#######################################################################################################################

	def gpu_stat():
	if torch.cuda.is_available():

	def pretty_bytes(bytes, precision=1):
	abbrevs = ((1<<50, 'PB'),(1<<40, 'TB'),(1<<30, 'GB'),(1<<20, 'MB'),(1<<10, 'kB'),(1, 'bytes'))
	if bytes == 1:
	return '1 byte'
	for factor, suffix in abbrevs:
	if bytes >= factor:
	break
	return '%.*f%s' % (precision, bytes / factor, suffix)

	device = autoinit.device
	print()
	print( 'GPU Name: %s' % device.name())
	print( 'GPU Memory: %s' % pretty_bytes(device.total_memory()))
	print( 'CUDA Version: %s' % str(driver.get_version()))
	print( 'GPU Free/Total Memory: %d%%' % ((driver.mem_get_info()[0] /driver.mem_get_info()[1]) * 100))

	#####################################################################################################################

	class HYPERPARAMETERS(dict):
	"""
	Class that holds a set of hyperparameters as name-value pairs and for convenience makes them accesssable
	as attributes.
	Example:
	H = HYPERPARAMETERS({ 'parameter_name' : parameter_value, ... })
	access using H.parameter_name or by H['parameter_name']
	"""
	def __init__(self, dictionary):
	super(HYPERPARAMETERS, self).__init__(dictionary)
	def __getattr__(self, name):
	return self[name]
	def __setattr__(self, name, value):
	self[name] = value
	def __getstate__(self):
	return self
	def __setstate__(self, d):
	self = d

	#####################################################################################################################

	def to_np(x):
	return x.data.cpu().numpy()

	def to_var(x):
	if torch.cuda.is_available():
	x = x.cuda()
	return Variable(x)

	#####################################################################################################################

	#save_checkpoint({
	# 'model' : type(model).__name__
	# 'epoch': epoch + 1,
	# 'state_dict': model.state_dict(),
	# 'optimizer' : optimizer.state_dict(),
	# })
	def save_checkpoint(state, filename='./chkp/checkpoint.tar'):
	torch.save(state, filename)
	print("=> saved checkpoint '{}' (epoch {})".format(filename, state['epoch']))


	def load_checkpoint(model, optimizer=None, filename='./chkp/checkpoint.tar'):
	checkpoint = torch.load(filename)
	model.load_state_dict(checkpoint['state_dict'])
	if not optimizer is None:
	optimizer.load_state_dict(checkpoint['optimizer'])
	print("=> loaded checkpoint '{}' (epoch {})".format(filename, checkpoint['epoch']))
	return checkpoint

	#####################################################################################################################

	# https://github.com/robintibor/braindecode/blob/master/braindecode/torch_ext/init.py

	def glorot_weight_zero_bias(model):
	"""
	Initalize parameters of all modules
	by initializing weights with glorot uniform/xavier initialization,
	and setting biases to zero.
	Weights from batch norm layers are set to 1.

	Parameters
	----------
	model: Module
	"""
	for module in model.modules():
	if hasattr(module, 'weight') and not module.weight is None:
	if not ('BatchNorm' in module.__class__.__name__):
	init.xavier_uniform_(module.weight, gain=1)
	else:
	init.constant_(module.weight, 1)
	if hasattr(module, 'bias'):
	if module.bias is not None:
	init.constant_(module.bias, 0)

	#####################################################################################################################

	# https://discuss.pytorch.org/t/solved-learning-rate-decay/6825/4

	def adjust_learning_rate(optimizer, epoch, init_lr=0.001, lr_decay_epoch=30):
	"""Sets the learning rate to the initial LR decayed by 10 every lr_decay_epoch epochs"""
	lr = init_lr * (0.1**(epoch // lr_decay_epoch))

	for param_group in optimizer.state_dict()['param_groups']:
	param_group['lr'] = lr

	return lr

	#####################################################################################################################

	class PlotLosses(object):
	"""
	Plots the train loss and validation score in a matlibplot plot during training whenever
	plot_loss and plot_prediction are called inside the epoch loop.
	"""
	def __init__(self, figsize=(12,6)):
	plt.ion()

	self.fig, self.ax = plt.subplots(1,2,figsize=figsize)

	self.ax[0].set_xlabel("Epoch");
	self.ax[0].set_ylabel("Loss");
	self.ax[0].grid(True)

	self.ax[1].set_xlabel("X");
	self.ax[1].set_ylabel("Y");
	self.ax[1].set_ylim([-1,1])
	self.ax[1].grid(True)

	self.fig.canvas.draw()
	plt.show(block=False)

	def plot_loss(self, loss, epoch, epochs, lr):
	iter_array = np.arange(1, epochs, 1)

	self.ax[0].set_title("Epoch # " + str(epoch) + "/" + str(epochs)
	+ " Loss # %.4f" % loss[-1] + " LR # %.2e" % lr)
	self.ax[0].plot(np.arange(0, epoch, 1), loss)

	self.fig.canvas.draw()
	plt.show(block=False)

	def plot_prediction(self, x, y, x_h, y_h, label1="train", label2="predict"):
	plt.cla()
	self.ax[1].set_title("Prediction")
	self.ax[1].scatter (x, y, c='red', label=str(label1), s=1.0, alpha=0.3)
	self.ax[1].scatter (x_h, y_h, c='green', label=str(label2), s=10.0, alpha=0.3)
	self.ax[1].legend()

	self.fig.canvas.draw()
	plt.show(block=False)

	def close(self):
	plt.ioff ()
	plt.close(self.fig)

	#####################################################################################################################

	# https://github.com/szagoruyko/pytorchviz/blob/master/torchviz/dot.py

	def make_dot(var, params):
	""" Produces Graphviz representation of PyTorch autograd graph

	Blue nodes are the Variables that require grad, orange are Tensors
	saved for backward in torch.autograd.Function

	Args:
	var: output Variable
	params: dict of (name, Variable) to add names to node that
	require grad (TODO: make optional)
	"""
	param_map = {id(v): k for k, v in params.items()}

	node_attr = dict(style='filled',
	shape='box',
	align='left',
	fontsize='12',
	ranksep='0.1',
	height='0.2')
	dot = Digraph(node_attr=node_attr, graph_attr=dict(size="8,8"))
	seen = set()

	def size_to_str(size):
	return '('+(', ').join(['%d'% v for v in size])+')'

	def add_nodes(var):
	if var not in seen:
	if torch.is_tensor(var):
	dot.node(str(id(var)), size_to_str(var.size()), fillcolor='orange')
	elif hasattr(var, 'variable'):
	u = var.variable
	node_name = '%s\n %s' % (param_map.get(id(u)), size_to_str(u.size()))
	dot.node(str(id(var)), node_name, fillcolor='lightblue')
	else:
	dot.node(str(id(var)), str(type(var).__name__))
	seen.add(var)
	if hasattr(var, 'next_functions'):
	for u in var.next_functions:
	if u[0] is not None:
	dot.edge(str(id(u[0])), str(id(var)))
	add_nodes(u[0])
	if hasattr(var, 'saved_tensors'):
	for t in var.saved_tensors:
	dot.edge(str(id(t)), str(id(var)))
	add_nodes(t)
	add_nodes(var.grad_fn)
	return dot

	#####################################################################################################################

	def layer_weight(data):
	mean = np.mean(data)
	std = np.std(data)

	hist, bins = np.histogram(data, bins=50)
	width = np.diff(bins)
	center = (bins[:-1] + bins[1:]) / 2

	return { 'mean':mean,
	'std':std,
	'hist':hist,
	'center':center,
	'width':width
	}

	def layer_stats(model):
	for module in model.modules():
	if hasattr(module, 'weight') and hasattr(module, 'bias'):
	fig, ax = plt.subplots(1,2,figsize=(8,3))

	if not module.weight is None:
	w = layer_weight(to_np(module.weight))
	ax[0].set_title("Weight - Mean # %.4f" % w['mean'] + " STD # %.2e" % w['std'])
	ax[0].bar(w['center'], w['hist'], align='center', width=w['width'])

	if not module.bias is None:
	b = layer_weight(to_np(module.bias))
	ax[1].set_title("Bias - Mean # %.4f" % b['mean'] + " STD # %.2e" % b['std'])
	ax[1].bar(b['center'], b['hist'], align='center', width=b['width'])
	plt.show()

	#####################################################################################################################

	# https://stackoverflow.com/questions/42480111/model-summary-in-pytorch
	# https://github.com/fchollet/keras/blob/master/keras/utils/layer_utils.py

	def print_summary(model, line_length=None, positions=None, print_fn=print):
	"""Prints a summary of a model.
	# Arguments
	model: model instance.
	line_length: Total length of printed lines
	(e.g. set this to adapt the display to different
	terminal window sizes).
	positions: Relative or absolute positions of log elements in each line.
	If not provided, defaults to `[.33, .55, .67, 1.]`.
	print_fn: Print function to use.
	It will be called on each line of the summary.
	You can set it to a custom function
	in order to capture the string summary.
	"""

	line_length = line_length or 65
	positions = positions or [.45, .85, 1.]
	if positions[-1] <= 1:
	positions = [int(line_length * p) for p in positions]
	# header names for the different log elements
	to_display = ['Layer (type)', 'Shape', 'Param #']

	def print_row(fields, positions):
	line = ''
	for i in range(len(fields)):
	if i > 0:
	line = line[:-1] + ' '
	line += str(fields[i])
	line = line[:positions[i]]
	line += ' ' * (positions[i] - len(line))
	print_fn(line)

	print_fn( "Summary for model: " + model.__class__.__name__)
	print_fn('_' * line_length)
	print_row(to_display, positions)
	print_fn('=' * line_length)

	def print_module_summary(name, module):
	count_params = sum([np.prod(p.size()) for p in module.parameters()])
	output_shape = tuple([tuple(p.size()) for p in module.parameters()])
	cls_name = module.__class__.__name__
	fields = [name + ' (' + cls_name + ')', output_shape, count_params]
	print_row(fields, positions)

	module_count = len(set(model.modules()))
	for i, item in enumerate(model.named_modules()):
	name, module = item
	cls_name = str(module.__class__)
	if not 'torch' in cls_name or 'container' in cls_name:
	continue

	print_module_summary(name, module)
	if i == module_count - 1:
	print_fn('=' * line_length)
	else:
	print_fn('_' * line_length)

	trainable_count = 0
	non_trainable_count = 0
	for name, param in model.named_parameters():
	if 'bias' in name or 'weight' in name :
	trainable_count += np.prod(param.size())
	else:
	non_trainable_count += np.prod(param.size())

	print_fn('Total params: {:,}'.format(trainable_count + non_trainable_count))
	print_fn('Trainable params: {:,}'.format(trainable_count))
	print_fn('Non-trainable params: {:,}'.format(non_trainable_count))
	print_fn('_' * line_length)

	#####################################################################################################################

	def stat_summary(y, y_hat, n, p):
	# local time & date
	t = time.localtime()

	# printing output to screen
	print( '\n==============================================================================' )
	print( "Date: ", time.strftime("%a, %d %b %Y",t) )
	print( "Time: ", time.strftime("%H:%M:%S",t) )
	print( '==============================================================================')
	print( 'Parameters: % 5.0f' % p + ' Cases: %5.0f' % n )
	print( '==============================================================================' )
	print( 'Models stats' )
	print( '==============================================================================' )
	print( 'Mean Squared Error % -5.6f ' % mean_squared_error(y, y_hat) )
	print( 'Mean Absolute Error % -5.6f ' % mean_squared_error(y, y_hat) )
	print( 'Root Mean Squared Error % -5.6f ' % np.sqrt(mean_squared_error(y, y_hat)) )
	print( 'R-squared % -5.6f ' % r2_score(y, y_hat) )
	print( '==============================================================================')

	#####################################################################################################################

	# https://stackoverflow.com/questions/842557/how-to-prevent-a-block-of-code-from-being-interrupted-by-keyboardinterrupt-in-py

	class DelayedKeyboardInterrupt(object):
	def __init__(self):
	self.signal_received = None

	def __enter__(self):
	self.signal_received = None
	self.old_handler = signal.signal(signal.SIGINT, self.handler)

	def handler(self, sig, frame):
	self.signal_received = (sig, frame)
	print('SIGINT received. Delaying KeyboardInterrupt.')

	def __exit__(self, type, value, traceback):
	signal.signal(signal.SIGINT, self.old_handler)
	if self.signal_received:
	self.old_handler(*self.signal_received)

	#####################################################################################################################

	def residual_plots(y, y_hat, figsize=(16,4)):
	residuals = DataFrame(y - y_hat)

	fig, ax = plt.subplots(1,3,figsize=figsize)

	# scatter plot
	ax[0].scatter(y_hat, residuals,s=1.0, alpha=0.3)
	ax[0].set_xlabel("Predicted Y")
	ax[0].set_ylabel("Residual")
	ax[0].set_title("Scatter Plot")

	# histogram plot
	residuals.plot(kind='hist', ax=ax[1])
	ax[1].set_title('Histogram Plot')
	ax[1].set_ylabel('Count')
	ax[1].set_xlabel('Residuals')

	# density plot
	residuals.plot(kind='kde', ax=ax[2])
	ax[2].set_title('Density Plot')

	#####################################################################################################################

	def plot_prediction(x, y, x_h, y_h, title="", label1="train", label2="validate"):
	plt.cla()
	plt.title(title)
	a, b = zip(*sorted(zip(x,y)))
	c, d = zip(*sorted(zip(x_h,y_h)))

	plt.plot (a, b, c='red', label=str(label1))
	plt.plot (c, d, c='green', label=str(label2))
	plt.legend()



	#######################################################################################################################

	class Stopping(object):
	"""
	Class implement some of regularization techniques to avoid over-training as described in
	http://page.mi.fu-berlin.de/prechelt/Biblio/stop_tricks1997.pdf
	"""
	def __init__(self, model, patience=50):
	self.model = model
	self.patience = patience

	self.best_score = -1
	self.best_score_epoch = 0
	self.best_score_model = None
	self.best_score_state = None

	def step(self, epoch, train_score, valid_score):
	if valid_score > self.best_score:
	self.best_score = valid_score
	self.best_score_epoch = epoch
	self.best_score_state = self.model.state_dict()
	return False
	elif self.best_score_epoch + self.patience < epoch:
	return True

	def state_dict(self):
	return {
	'patience' : self.patience,
	'best_score' : self.best_score,
	'best_score_epoch' : self.best_score_epoch,
	'best_score_model' : self.best_score_model,
	}

	def load_state_dict(self, state_dict):
	self.patience = state_dict['patience']
	self.best_score = state_dict['best_score']
	self.best_score_epoch = state_dict['best_score_epoch']
	self.best_score_model = state_dict['best_score_model']

	def __repr__(self):
	fmt_str = self.__class__.__name__ + '\n'
	fmt_str += ' Patience: {}\n'.format(self.patience)
	fmt_str += ' Best Score: {:.4f}\n'.format(self.best_score)
	fmt_str += ' Epoch of Best Score: {}\n'.format(self.best_score_epoch)
	return fmt_str

	#######################################################################################################################
No results found