I am trying to run a sequence of bigrams through an LSTM. This involves:
1. Padding the sequences with pad_sequence
2. Feeding the padded sequences into the embedding layer
3. Packing the output of the embedding layer
4. Feeding the packed batch into the LSTM.
A minimal sketch of this pipeline is shown below; my actual model follows after it.
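Here is a minimal sketch of that pipeline on toy data (the vocabulary size, dimensions, and tensors below are made up for illustration and are not the ones my model uses):

import torch
import torch.nn as nn
import torch.nn.utils.rnn as rnn_utils

# Toy sizes, for illustration only
vocab_size, embedding_dim, hidden_dim = 10, 4, 6
embedding = nn.Embedding(vocab_size, embedding_dim)
lstm = nn.LSTM(embedding_dim, hidden_dim, batch_first=True)

# Two variable-length sequences of bigram indices, longest first
seqs = [torch.tensor([1, 2, 3]), torch.tensor([4, 5])]
lengths = torch.tensor([len(s) for s in seqs])

padded = rnn_utils.pad_sequence(seqs, batch_first=True)      # (batch, max_len)
embedded = embedding(padded)                                  # (batch, max_len, embedding_dim)
packed = rnn_utils.pack_padded_sequence(embedded, lengths, batch_first=True)
lstm_out, (h, c) = lstm(packed)
unpacked, out_lengths = rnn_utils.pad_packed_sequence(lstm_out, batch_first=True)
print(unpacked.size())                                        # torch.Size([2, 3, 6])

My actual model is below: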
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.autograd as autograd
import torch.nn.utils.rnn as rnn_utils

class LSTMClassifier(nn.Module):
    # LSTM initialization
    def __init__(self, embedding_dim=32, hidden_dim=50, vocab_size=7138, label_size=2, static_size=3, batch_size=32):
        super(LSTMClassifier, self).__init__()
        # Initializing batch size
        self.batch_size = batch_size
        # Setting the hidden layer dimension of the LSTM
        self.hidden_dim = hidden_dim
        # Initializing the embedding layer
        self.embeddings = nn.Embedding(vocab_size, embedding_dim - 2)
        # Initializing the LSTM layer with one hidden layer
        self.lstm = nn.LSTM(((embedding_dim * vocab_size) + static_size), hidden_dim, num_layers=1, batch_first=True)
        # Initializing the linear layer that takes the hidden layer output
        self.hidden2label = nn.Linear(hidden_dim, label_size)
        # Initializing the hidden layer
        self.hidden = self.init_hidden()

    # Defining the hidden state of the LSTM
    def init_hidden(self):
        # the first is the hidden state h
        # the second is the cell state c
        return (autograd.Variable(torch.zeros(1, self.batch_size, self.hidden_dim).cuda()),
                autograd.Variable(torch.zeros(1, self.batch_size, self.hidden_dim).cuda()))
    # Defining the feed-forward logic of the LSTM. It contains:
    # 1. The embedding layer
    # 2. The LSTM layer with one hidden layer
    # 3. The softmax layer
    def forward(self, seq, freq, time, static):
        # Reset the LSTM hidden state. Must be done before you run a new batch.
        # Otherwise the LSTM will treat a new batch as a continuation of a sequence.
        self.hidden = self.init_hidden()
        # Get sequence lengths
        seq_lengths = torch.LongTensor(list(map(len, seq)))  # length of 59
        # Pad the sequences
        seq = rnn_utils.pad_sequence(seq, batch_first=True)
        freq = rnn_utils.pad_sequence(freq, batch_first=True)
        time = rnn_utils.pad_sequence(time, batch_first=True)
        static = rnn_utils.pad_sequence(static, batch_first=True)
        seq = autograd.Variable(seq)
        freq = autograd.Variable(freq)
        time = autograd.Variable(time)
        static = autograd.Variable(static)
        # This is the pass to the embedding layer.
        # The sequence is of dimension N and the output is N x Demb
        embeds = self.embeddings(seq)
        embeds = torch.cat((embeds, freq), dim=3)
        embeds = torch.cat((embeds, time), dim=3)
        print(embeds.size())  # torch.Size([32, 59, 7138, 32])
        x = embeds.view(self.batch_size, seq.size()[1], 1, -1)
        print(x.size())  # torch.Size([32, 59, 1, 228416])
        static = static.view(self.batch_size, -1, 1, 3)
        x = torch.cat([x, static], dim=3)
        print(x.size())  # torch.Size([32, 59, 1, 228419])
        # Pack the padded sequence so that paddings are ignored
        x = torch.nn.utils.rnn.pack_padded_sequence(x, seq_lengths, batch_first=True)
        lstm_out, self.hidden = self.lstm(x, self.hidden)
        # Unpack the packed padded sequence so that it is ready for prediction
        lstm_out = torch.nn.utils.rnn.pad_packed_sequence(lstm_out, batch_first=True)
        y = self.hidden2label(lstm_out[-1])
        log_probs = F.log_softmax(y)
        return log_probs
However, I get the following error:
---> 66 lstm_out, self.hidden = self.lstm(x, self.hidden)
67
68 # unpack the packed padded sequence so that it is ready for prediction
~/anaconda3/envs/pytorch_p36/lib/python3.6/site-packages/torch/nn/modules/module.py in __call__(self, *input, **kwargs)
487 result = self._slow_forward(*input, **kwargs)
488 else:
--> 489 result = self.forward(*input, **kwargs)
490 for hook in self._forward_hooks.values():
491 hook_result = hook(self, input, result)
~/anaconda3/envs/pytorch_p36/lib/python3.6/site-packages/torch/nn/modules/rnn.py in forward(self, input, hx)
173 hx = (hx, hx)
174
--> 175 self.check_forward_args(input, hx, batch_sizes)
176 _impl = _rnn_impls[self.mode]
177 if batch_sizes is None:
~/anaconda3/envs/pytorch_p36/lib/python3.6/site-packages/torch/nn/modules/rnn.py in check_forward_args(self, input, hidden, batch_sizes)
129 raise RuntimeError(
130 'input must have {} dimensions, got {}'.format(
--> 131 expected_input_dim, input.dim()))
132 if self.input_size != input.size(-1):
133 raise RuntimeError(
RuntimeError: input must have 2 dimensions, got 3
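A quick check on a toy packed batch (illustrative shapes only, not my real tensors) suggests that the data inside a PackedSequence is 2-dimensional, which may be the input that check is looking at:

import torch
import torch.nn.utils.rnn as rnn_utils

# Two toy sequences with 5 features per step
seqs = [torch.randn(3, 5), torch.randn(2, 5)]
padded = rnn_utils.pad_sequence(seqs, batch_first=True)                  # 3-D padded batch
packed = rnn_utils.pack_padded_sequence(padded, torch.tensor([3, 2]), batch_first=True)
print(padded.size())       # torch.Size([2, 3, 5])
print(packed.data.size())  # torch.Size([5, 5]) -> the data the LSTM actually sees is 2-D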
I thought an LSTM requires a 3-dimensional input? I am very confused as to why it expects 2 dimensions here. How do I fix this?