Skip to content

Commit ab85e6c

Browse files
committed
Updating Tacotron2_pyt (BatchNorm init fix), Resnet_tf (cosine LR),
Transformer_pyt (bugfix)
1 parent 55a03b8 commit ab85e6c

33 files changed

Lines changed: 274 additions & 91 deletions

PyTorch/SpeechSynthesis/Tacotron2/Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
FROM nvcr.io/nvidia/pytorch:19.06-py3
1+
FROM nvcr.io/nvidia/pytorch:19.07-py3
22

33
ADD . /workspace/tacotron2
44
WORKDIR /workspace/tacotron2

PyTorch/SpeechSynthesis/Tacotron2/README.md

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -417,7 +417,7 @@ Batch: 8/260 epoch 0
417417

418418
### Getting the data
419419

420-
The Tacotron 2 and WaveGlow models were trained on the LJSpeech-1.1 dataset.
420+
The Tacotron 2 and WaveGlow models were trained on the LJSpeech-1.1 dataset.
421421
This repository contains the `./scripts/prepare_dataset.sh` script which will automatically download and extract the whole dataset. By default, data will be extracted to the `./LJSpeech-1.1` directory. The dataset directory contains a `README` file, a `wavs` directory with all audio samples, and a file `metadata.csv` that contains audio file names and the corresponding transcripts.
422422

423423
#### Dataset guidelines
@@ -428,7 +428,7 @@ The LJSpeech dataset has 13,100 clips that amount to about 24 hours of speech. S
428428

429429
To use datasets different than the default LJSpeech dataset:
430430

431-
1. Prepare a directory with all audio files and pass it to the `--dataset-path` command-line option.
431+
1. Prepare a directory with all audio files and pass it to the `--dataset-path` command-line option.
432432

433433
2. Add two text files containing file lists: one for the training subset (`--training-files`) and one for the validation subset (`--validation-files`).
434434
The structure of the filelists should be as follows:
@@ -679,6 +679,10 @@ benchmarks from input tokens per second to output mel-spectrograms per second
679679
* Introduced batched inference
680680
* Included warmup in the inference script
681681

682+
August 2019
683+
* Fixed inference results
684+
* Fixed initialization of Batch Normalization
685+
682686
### Known issues
683687

684688
There are no known issues in this release.

PyTorch/SpeechSynthesis/Tacotron2/inference.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -46,8 +46,7 @@ def parse_args(parser):
4646
Parse commandline arguments.
4747
"""
4848
parser.add_argument('-i', '--input', type=str, required=True,
49-
help='full path to the input text (phareses separated by new line); \
50-
if not provided then use default text')
49+
help='full path to the input text (phareses separated by new line)')
5150
parser.add_argument('-o', '--output', required=True,
5251
help='output folder to save audio (file per phrase)')
5352
parser.add_argument('--tacotron2', type=str,

PyTorch/SpeechSynthesis/Tacotron2/models.py

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -54,7 +54,16 @@ def batchnorm_to_float(module):
5454
return module
5555

5656

57-
def get_model(model_name, model_config, to_cuda):
57+
def init_bn(module):
58+
if isinstance(module, torch.nn.modules.batchnorm._BatchNorm):
59+
if module.affine:
60+
module.weight.data.uniform_()
61+
for child in module.children():
62+
init_bn(child)
63+
64+
65+
def get_model(model_name, model_config, to_cuda,
66+
uniform_initialize_bn_weight=False):
5867
""" Code chooses a model based on name"""
5968
model = None
6069
if model_name == 'Tacotron2':
@@ -63,6 +72,10 @@ def get_model(model_name, model_config, to_cuda):
6372
model = WaveGlow(**model_config)
6473
else:
6574
raise NotImplementedError(model_name)
75+
76+
if uniform_initialize_bn_weight:
77+
init_bn(model)
78+
6679
if to_cuda:
6780
model = model.cuda()
6881
return model

PyTorch/SpeechSynthesis/Tacotron2/tacotron2/model.py

Lines changed: 1 addition & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -206,7 +206,7 @@ def __init__(self, encoder_n_convolutions,
206206
dilation=1, w_init_gain='relu'),
207207
nn.BatchNorm1d(encoder_embedding_dim))
208208
convolutions.append(conv_layer)
209-
self.convolutions = nn.ModuleList(convolutions)
209+
self.convolutions = nn.ModuleList(convolutions)
210210

211211
self.lstm = nn.LSTM(encoder_embedding_dim,
212212
int(encoder_embedding_dim / 2), 1,
@@ -231,17 +231,6 @@ def forward(self, x, input_lengths):
231231

232232
return outputs
233233

234-
def infer(self, x):
235-
for conv in self.convolutions:
236-
x = F.dropout(F.relu(conv(x)), 0.5, self.training)
237-
238-
x = x.transpose(1, 2)
239-
240-
self.lstm.flatten_parameters()
241-
outputs, _ = self.lstm(x)
242-
243-
return outputs
244-
245234

246235
class Decoder(nn.Module):
247236
def __init__(self, n_mel_channels, n_frames_per_step,

PyTorch/SpeechSynthesis/Tacotron2/train.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,8 @@ def parse_args(parser):
9696
help='Enable cudnn')
9797
training.add_argument('--cudnn-benchmark', action='store_true',
9898
help='Run cudnn benchmark')
99+
training.add_argument('--disable-uniform-initialize-bn-weight', action='store_true',
100+
help='disable uniform initialization of batchnorm layer weight')
99101

100102
optimization = parser.add_argument_group('optimization setup')
101103
optimization.add_argument(
@@ -343,7 +345,8 @@ def main():
343345

344346
model_config = models.get_model_config(model_name, args)
345347
model = models.get_model(model_name, model_config,
346-
to_cuda=True)
348+
to_cuda=True,
349+
uniform_initialize_bn_weight=not args.disable_uniform_initialize_bn_weight)
347350

348351
if not args.amp_run and distributed_run:
349352
model = DDP(model)

PyTorch/Translation/Transformer/Dockerfile

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,10 @@
1515
ARG FROM_IMAGE_NAME=nvcr.io/nvidia/pytorch:19.06-py3
1616
FROM ${FROM_IMAGE_NAME}
1717

18+
WORKDIR /workspace
19+
RUN git clone https://github.com/NVIDIA/apex \
20+
&& cd apex \
21+
&& pip install -v --no-cache-dir --global-option="--cpp_ext" --global-option="--cuda_ext" ./
1822
# Install Python dependencies
1923
RUN pip install --upgrade --no-cache-dir pip \
2024
&& pip install --no-cache-dir \

PyTorch/Translation/Transformer/README.md

Lines changed: 9 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -345,7 +345,7 @@ The following sections provide details on how we achieved our performance and ac
345345
#### Training accuracy results
346346

347347
In order to test the accuracy of our implementation, we have run experiments with different seeds for 100 epochs with batch size 5120 per GPU and learning rate 6e-4 in the pytorch-18.12-py3 Docker container. The plot below shows the BLEU score changes.<br/>
348-
![Accuracy plot](/BLEU.png)
348+
![Accuracy plot](./BLEU.png)
349349

350350
Running this code with the provided hyperparameters will allow you to achieve the following results. Our setup is a DGX-1 with 8x Tesla V100 16GB. We've verified our results after training 32 epochs to obtain multi-GPU and mixed precision scaling results.
351351

@@ -424,12 +424,18 @@ January 2019
424424
- initial commit, forked from [fairseq](https://github.com/pytorch/fairseq/commit/ac5fddfc691267285a84c81d39475411da5ed1c6)
425425

426426
May 2019:
427-
- adding mid-training SacreBLEU evaluation. Better handling of OOMs.
427+
- add mid-training [SacreBLEU](https://pypi.org/project/sacrebleu/1.2.10/) evaluation. Better handling of OOMs.
428428

429429
June 2019
430430
- new README
431-
- jit support added
431+
432+
July 2019
433+
- replace custom fused operators with jit functions
434+
435+
August 2019
436+
- add basic AMP support
432437

433438
## Known issues
434439

435440
- The course of training depends heavily on the random seed. There is high variance in the time required to reach a certain BLEU score, and the highest BLEU score observed varies between runs with different seeds.
441+
- Translations produced by training script during online evaluation may differ from those produced by `generate.py` script. It is probably a format conversion issue.

PyTorch/Translation/Transformer/fairseq/optim/fairseq_optimizer.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,8 @@ def optimizer(self):
4040
"""Return a torch.optim.optimizer.Optimizer instance."""
4141
if not hasattr(self, '_optimizer'):
4242
raise NotImplementedError
43-
if not isinstance(self._optimizer, torch.optim.Optimizer):
43+
#TODO: this shouldn't be dependent of args.amp
44+
if not isinstance(self._optimizer, torch.optim.Optimizer) and not self.args.amp:
4445
raise ValueError('_optimizer must be an instance of torch.optim.Optimizer')
4546
return self._optimizer
4647

PyTorch/Translation/Transformer/fairseq/options.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -144,6 +144,9 @@ def get_parser(desc, default_task='translation'):
144144
parser.add_argument('--seed', default=1, type=int, metavar='N',
145145
help='pseudo random number generator seed')
146146
parser.add_argument('--fp16', action='store_true', help='use FP16')
147+
parser.add_argument('--amp', action='store_true', help='use Automatic Mixed Precision')
148+
parser.add_argument('--amp-level', type=str, default="O1", help='choose apm\'s optimization level')
149+
147150
parser.add_argument('--profile', type=int, default=None)
148151
# Task definitions can be found under fairseq/tasks/
149152
parser.add_argument(

0 commit comments

Comments
 (0)