m7_lstm_att.py
import torch
from models.lightning_common import CommonModel, common_test, common_train


class LSTMModel(CommonModel):
    """LSTM encoder followed by multi-head self-attention over the output
    sequence, using the last time step as the attention query."""

    def __init__(self, hparams, xst, yst, xsv, ysv):
        super().__init__(hparams, xst, yst, xsv, ysv)
        self.n_layers = hparams['layer_count']
        self.n_hidden = hparams['hidden_size']
        self.drop_prob = hparams['drop_prob']
        self.n_classes = hparams['class_count']
        self.n_channels = hparams['channels']
        self.lstm = torch.nn.LSTM(self.n_channels, self.n_hidden, self.n_layers,
                                  dropout=self.drop_prob, batch_first=True)
        self.dropout = torch.nn.Dropout(self.drop_prob)
        # MultiheadAttention requires the embedding dimension to be divisible
        # by the number of heads (8 here).
        assert self.n_hidden % 8 == 0
        self.self_att = torch.nn.MultiheadAttention(self.n_hidden, 8)
        self.fc = torch.nn.Linear(self.n_hidden, self.n_classes)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        x, _ = self.lstm(x)                    # (batch, time, hidden)
        x = self.dropout(x)
        # MultiheadAttention defaults to (seq, batch, embed) ordering.
        kv = x.permute(1, 0, 2)                # (time, batch, hidden)
        query = x[:, -1:].permute(1, 0, 2)     # last time step: (1, batch, hidden)
        x = self.self_att(query, kv, kv)[0]    # (1, batch, hidden)
        x = x.squeeze(0)                       # (batch, hidden)
        x = self.fc(x)                         # (batch, classes)
        return x


def feature_extraction(xs):
    # Raw windows are fed to the network directly; no hand-crafted features.
    return xs


def train(x_train, y_train, class_count, *args, **kwargs):
    return common_train(x_train, y_train, LSTMModel,
                        {
                            'layer_count': kwargs['layer_count'],
                            'hidden_size': kwargs['hidden_size'],
                            'drop_prob': kwargs['drop_prob'],
                            'temporal_length': x_train.shape[1],
                            'lr': kwargs['lr'],
                            'class_count': class_count,
                            'channels': x_train.shape[2],
                        },
                        kwargs['folds'])


def test(model, x_test):
    return common_test(model, x_test)
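

# A minimal, self-contained sketch of the tensor flow in LSTMModel.forward,
# runnable with torch alone (it does not touch the project's CommonModel
# training loop). The concrete sizes (batch=4, time=100, channels=6,
# hidden=64, classes=5) are illustrative assumptions, not project values.
if __name__ == "__main__":
    lstm = torch.nn.LSTM(6, 64, 2, dropout=0.2, batch_first=True)
    att = torch.nn.MultiheadAttention(64, 8)   # expects (seq, batch, embed)
    fc = torch.nn.Linear(64, 5)

    x = torch.randn(4, 100, 6)                 # (batch, time, channels)
    h, _ = lstm(x)                             # (batch, time, hidden)
    kv = h.permute(1, 0, 2)                    # (time, batch, hidden)
    query = h[:, -1:].permute(1, 0, 2)         # last step as query: (1, batch, hidden)
    out, _ = att(query, kv, kv)                # (1, batch, hidden)
    logits = fc(out.squeeze(0))                # (batch, classes)
    print(logits.shape)                        # torch.Size([4, 5])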