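Fixed a bug in RawInputLSTM where the raw-input character window was appended only to the last context element instead of to every context element. Dropout is now applied after the ReLU activation in MLP (previously it was applied before it). Also removed the lstmDropout member from LSTMNetwork.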

2261c98b · Franck Dary · f6de0f30 · 2261c98b · 2261c98b · 2261c98b
Commit 2261c98b authored Apr 15, 2020 by Franck Dary
--- a/torch_modules/include/LSTMNetwork.hpp
+++ b/torch_modules/include/LSTMNetwork.hpp
@@ -15,7 +15,6 @@ class LSTMNetworkImpl : public NeuralNetworkImpl
  torch::nn::Embedding wordEmbeddings{nullptr};
  torch::nn::Dropout embeddingsDropout{nullptr};
-  torch::nn::Dropout lstmDropout{nullptr};
  MLP mlp{nullptr};
  ContextLSTM contextLSTM{nullptr};

--- a/torch_modules/src/MLP.cpp
+++ b/torch_modules/src/MLP.cpp
@@ -19,7 +19,7 @@ torch::Tensor MLPImpl::forward(torch::Tensor input)
 {
  torch::Tensor output = input;
  for (unsigned int i = 0; i < layers.size()-1; i++)
-    output = torch::relu(dropouts[i](layers[i](output)));
+    output = dropouts[i](torch::relu(layers[i](output)));
  return layers.back()(output);
 }

--- a/torch_modules/src/RawInputLSTM.cpp
+++ b/torch_modules/src/RawInputLSTM.cpp
@@ -25,16 +25,19 @@ void RawInputLSTMImpl::addToContext(std::vector<std::vector<long>> & context, Di
  if (leftWindow < 0 or rightWindow < 0)
    return;
+  for (auto & contextElement : context)
+  {
    for (int i = 0; i < leftWindow; i++)
      if (config.hasCharacter(config.getCharacterIndex()-leftWindow+i))
-      context.back().push_back(dict.getIndexOrInsert(fmt::format("{}", config.getLetter(config.getCharacterIndex()-leftWindow+i))));
+        contextElement.push_back(dict.getIndexOrInsert(fmt::format("{}", config.getLetter(config.getCharacterIndex()-leftWindow+i))));
      else
-      context.back().push_back(dict.getIndexOrInsert(Dict::nullValueStr));
+        contextElement.push_back(dict.getIndexOrInsert(Dict::nullValueStr));
    for (int i = 0; i <= rightWindow; i++)
      if (config.hasCharacter(config.getCharacterIndex()+i))
-      context.back().push_back(dict.getIndexOrInsert(fmt::format("{}", config.getLetter(config.getCharacterIndex()+i))));
+        contextElement.push_back(dict.getIndexOrInsert(fmt::format("{}", config.getLetter(config.getCharacterIndex()+i))));
      else
-      context.back().push_back(dict.getIndexOrInsert(Dict::nullValueStr));
+        contextElement.push_back(dict.getIndexOrInsert(Dict::nullValueStr));
+  }
 }