# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
| 15 | +"""Distributed Train. |
| 16 | +""" |

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

from absl import app
from absl import flags
import tensorflow as tf  # TF2
from tensorflow_examples.models.nmt_with_attention import nmt
from tensorflow_examples.models.nmt_with_attention import utils
from tensorflow_examples.models.nmt_with_attention.train import Train
assert tf.__version__.startswith('2')

FLAGS = flags.FLAGS

# If additional flags are needed, define them here.
flags.DEFINE_integer('num_gpu', 1, 'Number of GPUs to use')
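# Example invocation (a sketch only: the exact flag names are assumed to be
# the ones registered by utils.nmt_flags(), mirroring the keyword arguments
# of main() below):
#   python distributed_train.py --epochs=10 --batch_size=64 \
#     --buffer_size=70000 --download_path=/tmp/nmt --num_gpu=2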


class DistributedTrain(Train):
  """Distributed Train class.

  Args:
    epochs: Number of epochs.
    enable_function: Decorate function with tf.function.
    encoder: Encoder.
    decoder: Decoder.
    inp_lang: Input language tokenizer.
    targ_lang: Target language tokenizer.
    batch_size: Batch size.
  """

  def __init__(self, epochs, enable_function, encoder, decoder, inp_lang,
               targ_lang, batch_size):
    Train.__init__(
        self, epochs, enable_function, encoder, decoder, inp_lang, targ_lang,
        batch_size)

  def training_loop(self, train_iterator, test_iterator,
                    num_train_steps_per_epoch, num_test_steps_per_epoch,
                    strategy):
    """Custom training and testing loop.

    Args:
      train_iterator: Training iterator created using the strategy.
      test_iterator: Testing iterator created using the strategy.
      num_train_steps_per_epoch: Number of training steps in an epoch.
      num_test_steps_per_epoch: Number of test steps in an epoch.
      strategy: Distribution strategy.

    Returns:
      train_loss, test_loss
    """

    # This code is expected to change.
    def distributed_train():
      return strategy.experimental_run(self.train_step, train_iterator)

    def distributed_test():
      return strategy.experimental_run(self.test_step, test_iterator)

    if self.enable_function:
      distributed_train = tf.function(distributed_train)
      distributed_test = tf.function(distributed_test)

    template = 'Epoch: {}, Train Loss: {}, Test Loss: {}'

    for epoch in range(self.epochs):
      # Reset the aggregated loss metrics at the start of every epoch.
      self.train_loss_metric.reset_states()
      self.test_loss_metric.reset_states()

      train_iterator.initialize()
      for _ in range(num_train_steps_per_epoch):
        distributed_train()

      test_iterator.initialize()
      for _ in range(num_test_steps_per_epoch):
        distributed_test()

      print(template.format(epoch,
                            self.train_loss_metric.result().numpy(),
                            self.test_loss_metric.result().numpy()))

    return (self.train_loss_metric.result().numpy(),
            self.test_loss_metric.result().numpy())


def run_main(argv):
  del argv
  # Combine the shared NMT flags with the distribution-specific num_gpu flag.
  kwargs = utils.flags_dict()
  kwargs.update({'num_gpu': FLAGS.num_gpu})
  main(**kwargs)


def main(epochs, enable_function, buffer_size, batch_size, download_path,
         num_examples=70000, embedding_dim=256, enc_units=1024, dec_units=1024,
         num_gpu=1):

  # Mirror the model across one device per requested GPU.
  devices = ['/device:GPU:{}'.format(i) for i in range(num_gpu)]
  strategy = tf.distribute.MirroredStrategy(devices)

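  # The dataset, encoder, decoder and Train object are all built inside
  # strategy.scope() so that their variables are created in a
  # distribution-aware way and mirrored across the GPUs.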
  with strategy.scope():
    file_path = utils.download(download_path)
    train_ds, test_ds, inp_lang, targ_lang = utils.create_dataset(
        file_path, num_examples, buffer_size, batch_size)
    # +1 leaves room for the padding index 0 used by the Keras tokenizer.
    vocab_inp_size = len(inp_lang.word_index) + 1
    vocab_tar_size = len(targ_lang.word_index) + 1

    num_train_steps_per_epoch = tf.data.experimental.cardinality(train_ds)
    num_test_steps_per_epoch = tf.data.experimental.cardinality(test_ds)

    train_iterator = strategy.make_dataset_iterator(train_ds)
    test_iterator = strategy.make_dataset_iterator(test_ds)

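    # make_dataset_iterator returns distribution-aware iterators; they are
    # re-initialized at the start of each epoch inside training_loop above.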
    encoder = nmt.Encoder(vocab_inp_size, embedding_dim, enc_units, batch_size)
    decoder = nmt.Decoder(vocab_tar_size, embedding_dim, dec_units, batch_size)

    train_obj = DistributedTrain(epochs, enable_function, encoder, decoder,
                                 inp_lang, targ_lang, batch_size)
    print('Training ...')
    return train_obj.training_loop(train_iterator,
                                   test_iterator,
                                   num_train_steps_per_epoch,
                                   num_test_steps_per_epoch,
                                   strategy)

if __name__ == '__main__':
  utils.nmt_flags()
  app.run(run_main)