Update PyTorch DeepSpeech

Beat Buesser · Beat Buesser · commit fd03959a2b0d · 2020-09-18T21:14:26.000+01:00
Signed-off-by: Beat Buesser <beat.buesser@ie.ibm.com>
diff --git a/art/estimators/speech_recognition/pytorch_deep_speech.py b/art/estimators/speech_recognition/pytorch_deep_speech.py
@@ -583,17 +583,19 @@ def transform_model_input(
             # Push the sequence to device
             if not tensor_input:
                 x[i] = x[i].astype(ART_NUMPY_DTYPE)
-                x[i] = torch.tensor(x[i]).to(self._device)
+                x_i_tensor = torch.tensor(x[i]).to(self._device)
+            else:
+                x_i_tensor = x[i]
 
             # Set gradient computation permission
             if compute_gradient:
-                x[i].requires_grad = True
+                x_i_tensor.requires_grad = True
 
             # Transform the sequence into the frequency space
             if tensor_input and real_lengths is not None:
-                transformed_input = transformer(x[i][: real_lengths[i]])
+                transformed_input = transformer(x_i_tensor[: real_lengths[i]])
             else:
-                transformed_input = transformer(x[i])
+                transformed_input = transformer(x_i_tensor)
 
             spectrogram, _ = torchaudio.functional.magphase(transformed_input)
             spectrogram = torch.log1p(spectrogram)