-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathmodels.py
More file actions
122 lines (96 loc) · 4.38 KB
/
models.py
File metadata and controls
122 lines (96 loc) · 4.38 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
import torch
import torch.nn as nn
import preprocessing
import os
import numpy as np
class ModelUtils:
    '''
    A utility class to save and load model weights.

    Both helpers are static: they operate only on their arguments and are
    intended to be called as ``ModelUtils.save_model(...)``.
    '''

    @staticmethod
    def save_model(save_path, model):
        '''
        Saves a model's weights (state_dict) to disk.

        Input: save_path - destination path; the '.pth' extension is appended
                           when no extension is given (type: string)
               model - the model whose weights are saved (type: nn.Module)
        '''
        root, ext = os.path.splitext(save_path)
        if not ext:
            # default to the conventional PyTorch weight-file extension
            save_path = root + '.pth'
        try:
            torch.save(model.state_dict(), save_path)
            print(f'Successfully saved the model to "{save_path}"!')
        except Exception as e:
            # best-effort: report the problem instead of crashing the caller
            print('Unable to save model, check save path!')
            print(f'Exception:\n{e}')
        return None

    @staticmethod
    def load_model(load_path, model):
        '''
        Loads weights from disk into an existing model, in place.

        Input: load_path - path of a previously saved state_dict (type: string)
               model - a model with the same architecture as the saved one
                       (type: nn.Module)
        '''
        try:
            model.load_state_dict(torch.load(load_path))
            print(f'Successfully loaded the model from path "{load_path}"')
        except Exception as e:
            # best-effort: report the problem instead of crashing the caller
            print('Unable to load the weights, check if different model or incorrect path!')
            print(f'Exception:\n{e}')
        return None
class RNNModel(nn.Module):
    '''
    RNN classifier with different available RNN types (basic RNN, LSTM, GRU).
    '''

    # dispatch table: maps the rnn_type string to the torch module class
    _RNN_CLASSES = {'rnn': nn.RNN, 'lstm': nn.LSTM, 'gru': nn.GRU}

    def __init__(self, rnn_type, nr_layers, voc_size, emb_dim, rnn_size, dropout, n_classes):
        '''
        Initiates the RNN model
        Input: rnn_type - specifies the rnn model type between "rnn", "lstm" or "gru" (type: string)
               nr_layers - number of rnn layers (type: int)
               voc_size - size of vocabulary of the encoded input data (type: int)
               emb_dim - size of embedding layer (type: int)
               rnn_size - number of hidden layers in RNN model (type: int)
               dropout - probability of dropout layers (type: float in between [0, 1])
               n_classes - number of different classes/labels (type: int)
        Raises: ValueError - if rnn_type is not one of "rnn", "lstm" or "gru"
                (fail fast here; the original print-and-continue left
                self.rnn undefined and crashed later in forward)
        '''
        super().__init__()
        if rnn_type not in self._RNN_CLASSES:
            raise ValueError('Invalid or no choice for RNN type, please choose one of "rnn", "lstm" or "gru"')
        self.rnn_size = rnn_size
        self.rnn_type = rnn_type
        self.nr_layers = nr_layers
        self.embedding = nn.Embedding(voc_size, emb_dim)
        # inter-layer dropout only makes sense (and avoids a torch warning)
        # when the RNN is stacked
        self.rnn = self._RNN_CLASSES[rnn_type](
            input_size=emb_dim, hidden_size=rnn_size,
            dropout=dropout if nr_layers > 1 else 0,
            bidirectional=False, num_layers=nr_layers, batch_first=True)
        self.dropout = nn.Dropout(dropout)
        self.linear = nn.Linear(in_features=rnn_size, out_features=n_classes)
        self.sigmoid = nn.Sigmoid()

    def forward(self, X, hidden):
        '''
        Forward propagation of the RNN model
        Input: X - batch of encoded token ids, shape (batch, seq_len) (type: torch tensor)
               hidden - initial hidden state as produced by init_hidden
                        (tensor for "rnn"/"gru", (h, c) tuple for "lstm")
        Output: out - model prediction for the last timestep per sample (type: torch tensor)
                hidden - output of the hidden cells (torch.tensor or tuple for lstm)
        '''
        self.batch_size = X.size(0)
        embedded = self.embedding(X)
        # nn.RNN / nn.GRU / nn.LSTM share the same call signature, only the
        # hidden-state container differs, so a single call covers all types
        rnn_out, hidden = self.rnn(embedded, hidden)
        # flatten all timesteps so the classifier head is applied per step
        rnn_out = rnn_out.contiguous().view(-1, self.rnn_size)
        out = self.sigmoid(self.linear(self.dropout(rnn_out)))
        # reshape such that batch size is first and keep only the prediction
        # of the last timestep of each sequence
        out = out.view(self.batch_size, -1)
        out = out[:, -1]
        return out, hidden

    def init_hidden(self, batch_size, device):
        '''
        Initializes the hidden state to zeros.
        Returns an (h0, c0) tuple for "lstm" (which needs both a hidden and a
        cell state) and a single tensor for "rnn"/"gru" — matching exactly
        what the underlying torch module expects as its hidden input.
        '''
        h0 = torch.zeros((self.nr_layers, batch_size, self.rnn_size)).to(device)
        if self.rnn_type == 'lstm':
            c0 = torch.zeros((self.nr_layers, batch_size, self.rnn_size)).to(device)
            return (h0, c0)
        return h0