thomwolf HF staff committed on
Commit
1927812
1 Parent(s): 7c19104

Fix Python 3 download script and left-over CUDA in attention layer

Browse files
scripts/download_weights.py CHANGED
@@ -1,6 +1,7 @@
1
  from __future__ import print_function
2
  import os
3
  from subprocess import call
 
4
 
5
  curr_folder = os.path.basename(os.path.normpath(os.getcwd()))
6
 
@@ -23,7 +24,7 @@ def prompt():
23
  'n': False,
24
  'no': False,
25
  }
26
- choice = raw_input().lower()
27
  if choice in valid:
28
  return valid[choice]
29
  else:
 
1
  from __future__ import print_function
2
  import os
3
  from subprocess import call
4
+ from builtins import input
5
 
6
  curr_folder = os.path.basename(os.path.normpath(os.getcwd()))
7
 
 
24
  'n': False,
25
  'no': False,
26
  }
27
+ choice = input().lower()
28
  if choice in valid:
29
  return valid[choice]
30
  else:
torchmoji/attlayer.py CHANGED
@@ -51,8 +51,6 @@ class Attention(Module):
51
  # See e.g. https://discuss.pytorch.org/t/self-attention-on-words-and-masking/5671/5
52
  max_len = unnorm_ai.size(1)
53
  idxes = torch.arange(0, max_len, out=torch.LongTensor(max_len)).unsqueeze(0)
54
- if torch.cuda.is_available():
55
- idxes = idxes.cuda()
56
  mask = Variable((idxes < input_lengths.unsqueeze(1)).float())
57
 
58
  # apply mask and renormalize attention scores (weights)
 
51
  # See e.g. https://discuss.pytorch.org/t/self-attention-on-words-and-masking/5671/5
52
  max_len = unnorm_ai.size(1)
53
  idxes = torch.arange(0, max_len, out=torch.LongTensor(max_len)).unsqueeze(0)
 
 
54
  mask = Variable((idxes < input_lengths.unsqueeze(1)).float())
55
 
56
  # apply mask and renormalize attention scores (weights)
torchmoji/finetuning.py CHANGED
@@ -514,9 +514,6 @@ def fit_model(model, loss_op, optim_op, train_gen, val_gen, epochs,
514
  X_train, y_train = data
515
  X_train = Variable(X_train, requires_grad=False)
516
  y_train = Variable(y_train, requires_grad=False)
517
- if torch.cuda.is_available():
518
- X_train = X_train.cuda()
519
- y_train = y_train.cuda()
520
  model.train()
521
  optim_op.zero_grad()
522
  output = model(X_train)
 
514
  X_train, y_train = data
515
  X_train = Variable(X_train, requires_grad=False)
516
  y_train = Variable(y_train, requires_grad=False)
 
 
 
517
  model.train()
518
  optim_op.zero_grad()
519
  output = model(X_train)