# Source code for sssm.sssm_core.model

import time
from hashlib import md5
import torch
import os
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import pandas as pd
import einops
from torch import nn
from . import saved_models

from sklearn.base import BaseEstimator, ClassifierMixin



class Model(ClassifierMixin, BaseEstimator):
    """
    Sliding-window sleep-event classifier built on a pretrained ``base_Model``.

    Each input row is cut into overlapping windows of ``N_TIME`` samples, every
    window is classified into one of the classes listed in ``LABEL_SHORT`` /
    ``LABEL_LONG`` (class index ``i`` corresponds to ``LABEL_SHORT[i]``), and the
    per-window results are cached on the instance (``proba``, ``pred``,
    ``feature``) for plotting and export.
    """

    def __init__(self, device='cuda', model_name='model.pt', model_path=None):
        """
        Load the pretrained network and initialise the result caches.

        If ``model_path`` is None, the checkpoint named ``model_name`` is loaded
        from the bundled ``saved_models`` package. If ``model_path`` is given it
        must be the full path of a checkpoint file, not a directory.

        :param device: anything accepted by ``torch.device`` (e.g. 'cuda', 'cpu')
        :param model_name: file name of the bundled checkpoint to use
        :param model_path: optional full path to a checkpoint file
        """
        # BaseEstimator.get_params() (and therefore repr()) looks up one
        # attribute per constructor argument, so keep them under their own names.
        self.model_name = model_name
        self.model_path = model_path

        # Window length, in samples, fed to the network.
        self.N_TIME = 300
        # Class names, indexed by the network's output class index.
        self.LABEL_SHORT = ['SS', 'KC', 'SW', 'SAW', 'VSW', 'BG', 'AR']
        self.LABEL_LONG = ['Spindle', 'K-complex', 'Slow wave', 'Sawtooth', 'Vertex Sharp', 'Background', 'Arousal']

        # Set by the most recent predict() call.
        self.input_data_length = None
        self.step = None
        self.proba = None
        self.pred = None
        self.feature = None

        self.device = torch.device(device)
        self.model = self.__load_model(model_path=model_path, model_name=model_name)

    def predict(self, X=None, step=50):
        """
        Classify every sliding window of every row of ``X``.

        Besides returning the labels, this refreshes ``self.proba``,
        ``self.pred``, ``self.feature``, ``self.step`` and
        ``self.input_data_length``.

        :param X: array of shape (n_epoch, n_time) with n_time >= N_TIME
        :param step: hop between consecutive windows, 300 >= step >= 1
        :return: 1-D array of predicted class indices, one per window,
                 flattened from (n_epoch, n_window)
        """
        n_epoch = X.shape[0]
        sample = self.__sliding_window_sample(X, step)
        proba, fea = self.__predict(sample)
        self.__rearrange_output(proba, fea, n_epoch)
        return self.pred.flatten()

    def predict_proba(self, X=None, step=50):
        """
        Run :meth:`predict` and return the class probabilities.

        :param X: array of shape (n_epoch, n_time) with n_time >= N_TIME
        :param step: hop between consecutive windows, 300 >= step >= 1
        :return: 1-D array obtained by flattening the
                 (n_epoch, n_window, n_class) probability array; the
                 unflattened array stays available as ``self.proba``
        """
        self.predict(X, step)
        return self.proba.flatten()

    def __sliding_window_sample(self, X=None, step=50):
        """
        Cut ``X`` into windows of ``N_TIME`` samples taken every ``step`` samples.

        Records ``step`` and the input length on the instance for later use by
        :meth:`to_pandas` and :meth:`plot_predictions`.

        :param X: array of shape (n_epoch, n_time)
        :param step: hop between consecutive windows
        :return: float tensor of shape (n_epoch * n_window, 1, N_TIME) on
                 ``self.device``
        """
        # Insert a singleton channel axis: (n_epoch, 1, n_time).
        data = X[:, None, :]
        # Kept as assertions so callers still see AssertionError on bad input.
        assert data.shape[2] >= self.N_TIME, f'n_time should be >= {self.N_TIME}'
        assert 300 >= step >= 1
        self.step = step
        self.input_data_length = data.shape[2]

        # All stride-1 windows first, then keep every `step`-th one.
        windows = np.lib.stride_tricks.sliding_window_view(data, self.N_TIME, axis=2)[:, :, ::step]
        windows = einops.rearrange(windows,
                                   'n_epoch n_ch n_window n_time -> (n_epoch n_window) n_ch n_time')
        return torch.from_numpy(windows).float().to(self.device)

    def __rearrange_output(self, proba, fea, n_epoch):
        """
        Un-flatten the network outputs back to per-epoch layout and cache them.

        :param proba: (n_epoch * n_window, n_class) probabilities
        :param fea: (n_epoch * n_window, n_hd, n_step) feature maps
        :param n_epoch: number of rows of the original input
        :return: tuple (feature, proba, pred) as stored on the instance
        """
        self.feature = einops.rearrange(fea, '(n_epoch n_window) n_hd n_step -> n_epoch n_window n_hd n_step',
                                        n_epoch=n_epoch)
        pred = np.argmax(proba, axis=1)
        self.proba = einops.rearrange(proba, '(n_epoch n_window) n_class -> n_epoch n_window n_class',
                                      n_epoch=n_epoch)
        self.pred = einops.rearrange(pred, '(n_epoch n_window) -> n_epoch n_window', n_epoch=n_epoch)
        return self.feature, self.proba, self.pred

    def plot_predictions(self, epoch_ind=0):
        """
        Draw a stacked-area plot of the class probabilities of one input row.

        Requires a prior :meth:`predict` call (reads ``self.proba`` and
        ``self.step``).

        :param epoch_ind: index of the input row to plot
        """
        proba = pd.DataFrame(self.proba[epoch_ind] * 100, columns=self.LABEL_SHORT)
        sns.set_theme('notebook', style='ticks', palette='bright')
        ax = proba.plot(kind='area', figsize=(50, 4), alpha=0.9, stacked=True, lw=0)
        ax.set_xlim(0, proba.shape[0])
        ax.set_ylim(0, 100)
        ax.set_ylabel("Probability")
        ax.set_xlabel("Epoch Index / 30s")
        # NOTE(review): the tick arithmetic hard-codes 3000 samples per 30 s
        # epoch (presumably 100 Hz data) - confirm against the callers.
        N_WIN_PER_EPOCH = int((3000 - self.N_TIME) / self.step + 1)
        N_EPOCH_STEP = 50
        ori_ticks = np.arange(0, len(proba), N_EPOCH_STEP * N_WIN_PER_EPOCH, dtype=int)
        ax.set_xticks(ori_ticks, (ori_ticks / N_WIN_PER_EPOCH).astype(int))
        plt.legend(bbox_to_anchor=(0.04, 0.5))

    def to_json(self):
        """Placeholder: not implemented, currently returns None."""
        pass

    def to_pandas(self, overall_threshold=0.5, describe=False, event_threshold=None):
        """
        Convert the cached window probabilities into a table of events.

        Consecutive windows of the same input row whose probability for the same
        class exceeds ``overall_threshold`` are merged into one event. Each
        window is attributed to the ``step`` samples around its centre, so
        ``Start``/``End`` are sample positions along the n_time axis; events
        touching the first/last window are extended to 0 / the input length.
        Events whose mean probability is below the per-label value in
        ``event_threshold`` are dropped.

        Requires a prior :meth:`predict` call.

        :param overall_threshold: per-window probability a class must exceed
        :param describe: if True, additionally return a per-label summary
        :param event_threshold: dict label -> minimum mean probability; labels
                                missing from the dict are never dropped
        :return: DataFrame with columns Start, End, Duration, label,
                 predict_proba, epoch_id; or (DataFrame, summary) when
                 ``describe`` is True. Both are empty when no window exceeds
                 ``overall_threshold``.
        """
        # Rows of (epoch, window, class), in row-major order.
        label_ind = np.argwhere(self.proba > overall_threshold)
        if len(label_ind) == 0:
            # Nothing detected: return empty tables instead of failing on
            # label_ind[0].
            df = pd.DataFrame(columns=['Start', 'End', 'Duration', 'label', 'predict_proba', 'epoch_id'])
            if describe is True:
                return df, pd.DataFrame(columns=['count', 'predict_proba_mean', 'percentage'])
            return df

        last_ind = label_ind[0]
        starts = [last_ind]
        ends = []
        for this_ind in label_ind[1:]:
            # A run continues only within the same epoch and class; without the
            # epoch check, window k of one epoch and window k+1 of the next
            # would be fused into a single event.
            same_run = (this_ind[0] == last_ind[0]
                        and this_ind[2] == last_ind[2]
                        and this_ind[1] - last_ind[1] == 1)
            if not same_run:
                ends.append(last_ind)
                starts.append(this_ind)
            last_ind = this_ind
        ends.append(label_ind[-1])

        step = self.step
        starts_ = np.array(starts)
        ends_ = np.array(ends)
        # Mean probability of the event's class over the windows it spans.
        proba_ = [self.proba[s_[0], s_[1]:e_[1] + 1, s_[2]].mean()
                  for s_, e_ in zip(starts_, ends_)]

        # Offsets from a window's first sample to the edges of the `step`
        # samples centred in the window.
        half_window = self.N_TIME // 2
        lead = int(half_window - step / 2)
        lag = int(half_window + step / 2)
        starts = starts_[:, 1] * step + lead
        ends = ends_[:, 1] * step + lag
        # Events reaching the first/last window are stretched to the edges.
        starts = np.where(starts <= lead, 0, starts)
        ends = np.where(ends >= self.input_data_length - lag, self.input_data_length, ends)

        df = pd.DataFrame({
            'Start': starts,
            'End': ends,
            'Duration': ends - starts,
            'label': [self.LABEL_LONG[class_ind] for class_ind in ends_[:, 2]],
            'predict_proba': proba_,
            'epoch_id': ends_[:, 0],
        })

        if event_threshold is None:
            event_threshold = {
                'Spindle': 0.95,
                'Background': 0.9,
                'Arousal': 0.9,
                'K-complex': 0.6,
                'Slow wave': 0.6,
                'Vertex Sharp': 0.6,
                'Sawtooth': 0.6}
        too_weak = pd.Series(False, index=df.index)
        for label, limit in event_threshold.items():
            too_weak |= (df['label'] == label) & (df['predict_proba'] < limit)
        df = df[~too_weak]

        if describe is True:
            summary = df.groupby('label')['predict_proba'].describe()[['count', 'mean']]
            summary = summary.rename(columns={'mean': 'predict_proba_mean'})
            summary['percentage'] = 100 * summary['count'] / summary['count'].sum()
            summary['predict_proba_mean'] *= 100
            return df, summary
        return df

    def __predict(self, data):
        """
        Run the network on a batch of windows without tracking gradients.

        :param data: tensor of shape (n_window_total, 1, N_TIME) on ``self.device``
        :return: (proba, fea) - ``proba`` is a numpy array of softmax
                 probabilities; ``fea`` is the feature tensor exactly as
                 returned by the network (not moved to the CPU)
        """
        torch.cuda.empty_cache()
        softmax = torch.nn.Softmax(dim=1)
        with torch.no_grad():
            pre, fea = self.model(data)
            proba = softmax(pre).cpu().numpy()
        torch.cuda.empty_cache()
        return proba, fea

    def __load_model(self, model_path=None, model_name='model.pt'):
        """
        Build the network and load its pretrained weights.

        :param model_path: full path to a checkpoint file, or None to use the
                           checkpoint ``model_name`` bundled in ``saved_models``
        :param model_name: file name of the bundled checkpoint
        :return: the network in eval mode on ``self.device``
        """
        model = base_Model(Config()).to(self.device)
        # NOTE: torch.load unpickles the file; only load checkpoints from a
        # trusted source.
        if model_path is None:
            from importlib import resources
            bundled = resources.files(saved_models).joinpath(model_name)
            # as_file() yields a real filesystem path even when the package is
            # not installed as plain files (e.g. imported from a zip).
            with resources.as_file(bundled) as bundled_path:
                chkpoint = torch.load(bundled_path, map_location=self.device)
        else:
            chkpoint = torch.load(model_path, map_location=self.device)
        model.load_state_dict(chkpoint["model_state_dict"])
        model.eval()
        return model





class base_Model(nn.Module):
    """
    Three-stage 1-D convolutional encoder followed by a linear classifier.

    Layer order and attribute names are part of the checkpoint format
    (``state_dict`` keys), so they must not be changed.
    """

    def __init__(self, configs):
        """
        :param configs: object providing ``input_channels``, ``kernel_size``,
                        ``stride``, ``dropout``, ``final_out_channels``,
                        ``features_len`` and ``num_classes``
        """
        super().__init__()

        self.conv_block1 = nn.Sequential(
            nn.Conv1d(configs.input_channels, 32, kernel_size=configs.kernel_size,
                      stride=configs.stride, bias=False, padding=(configs.kernel_size // 2)),
            nn.BatchNorm1d(32),
            nn.ReLU(),
            nn.MaxPool1d(kernel_size=2, stride=2, padding=1),
            nn.Dropout(configs.dropout)
        )

        self.conv_block2 = nn.Sequential(
            nn.Conv1d(32, 64, kernel_size=8, stride=1, bias=False, padding=4),
            nn.BatchNorm1d(64),
            nn.ReLU(),
            nn.MaxPool1d(kernel_size=2, stride=2, padding=1)
        )

        self.conv_block3 = nn.Sequential(
            nn.Conv1d(64, configs.final_out_channels, kernel_size=8, stride=1, bias=False, padding=4),
            nn.BatchNorm1d(configs.final_out_channels),
            nn.ReLU(),
            nn.MaxPool1d(kernel_size=2, stride=2, padding=1),
        )

        # features_len must equal the time length left after the three blocks
        # for the input length in use; otherwise the linear layer's input size
        # will not match the flattened features.
        model_output_dim = configs.features_len
        self.logits = nn.Linear(model_output_dim * configs.final_out_channels, configs.num_classes)

    def forward(self, x_in):
        """
        :param x_in: tensor of shape (batch, input_channels, n_time)
        :return: (logits, features) - logits of shape (batch, num_classes) and
                 the conv_block3 output of shape
                 (batch, final_out_channels, features_len)
        """
        x = self.conv_block1(x_in)
        x = self.conv_block2(x)
        x = self.conv_block3(x)

        x_flat = x.reshape(x.shape[0], -1)
        logits = self.logits(x_flat)
        return logits, x





class Config(object):
    """Hyper-parameters for ``base_Model`` plus training and data settings."""

    def __init__(self):
        # model configs
        self.input_channels = 1
        self.final_out_channels = 128
        self.num_classes = 7
        self.dropout = 0.35

        self.kernel_size = 25
        self.stride = 3
        # Time length of the conv_block3 output that base_Model flattens into
        # its linear layer.
        # NOTE(review): the original comment also listed 127 and 44 -
        # presumably values for other input lengths; confirm before changing.
        self.features_len = 15

        # training configs
        self.num_epoch = 50

        # optimizer parameters
        self.optimizer = 'adam'
        self.beta1 = 0.9
        self.beta2 = 0.99
        self.lr = 3e-4

        # data parameters
        self.drop_last = True
        self.batch_size = 3500

        # nested setting groups
        self.Context_Cont = Context_Cont_configs()
        self.TC = TC()
        self.augmentation = augmentations()





class augmentations(object):
    """Settings for data augmentation (stored on ``Config.augmentation``)."""

    def __init__(self):
        self.jitter_scale_ratio = 1.5
        self.jitter_ratio = 2
        self.max_seg = 12





class Context_Cont_configs(object):
    """Settings group stored on ``Config.Context_Cont``."""

    def __init__(self):
        self.temperature = 0.2
        self.use_cosine_similarity = True





class TC(object):
    """Settings group stored on ``Config.TC``."""

    def __init__(self):
        self.hidden_dim = 128
        self.timesteps = 5