From b93c788748cf0965ff90ee2659c3dbd53f8dcd78 Mon Sep 17 00:00:00 2001
From: Leslie-Fang
Date: Thu, 14 Nov 2019 01:23:49 +0800
Subject: [PATCH 1/5] add checkpoint model save after training

---
 .../models/nmt_with_attention/train.py        | 11 ++++++++++-
 .../models/nmt_with_attention/utils.py        |  6 +++++-
 2 files changed, 15 insertions(+), 2 deletions(-)

diff --git a/tensorflow_examples/models/nmt_with_attention/train.py b/tensorflow_examples/models/nmt_with_attention/train.py
index 018155d4fd4..6eef4e7106a 100644
--- a/tensorflow_examples/models/nmt_with_attention/train.py
+++ b/tensorflow_examples/models/nmt_with_attention/train.py
@@ -160,6 +160,15 @@ def training_loop(self, train_ds, test_ds):
       for inp, targ in train_ds:
         self.train_step((inp, targ))
 
+      if epoch == self.epochs - 1:
+        import os, sys
+        checkpoint_dir = os.path.join(sys.path[0]+'/training_checkpoints')
+        checkpoint_prefix = os.path.join(checkpoint_dir, "ckpt")
+        checkpoint = tf.train.Checkpoint(optimizer=self.optimizer,
+                                         encoder=self.encoder,
+                                         decoder=self.decoder)
+        # save the model after the final training epoch
+        checkpoint.save(file_prefix=checkpoint_prefix)
       for inp_test, targ_test in test_ds:
         self.test_step((inp_test, targ_test))
 
@@ -180,7 +189,7 @@ def run_main(argv):
 def main(epochs, enable_function, buffer_size, batch_size, download_path,
          num_examples=70000, embedding_dim=256, enc_units=1024, dec_units=1024):
   file_path = utils.download(download_path)
-  train_ds, test_ds, inp_lang, targ_lang = utils.create_dataset(
+  train_ds, test_ds, inp_lang, targ_lang, _, _ = utils.create_dataset(
       file_path, num_examples, buffer_size, batch_size)
   vocab_inp_size = len(inp_lang.word_index) + 1
   vocab_tar_size = len(targ_lang.word_index) + 1
diff --git a/tensorflow_examples/models/nmt_with_attention/utils.py b/tensorflow_examples/models/nmt_with_attention/utils.py
index e9bf6e5d598..f4b76375a19 100644
--- a/tensorflow_examples/models/nmt_with_attention/utils.py
+++ b/tensorflow_examples/models/nmt_with_attention/utils.py
@@ -153,6 +153,9 @@ def create_dataset(path_to_file, num_examples, buffer_size, batch_size):
   input_tensor, target_tensor, inp_lang, targ_lang = load_dataset(
       path_to_file, num_examples)
 
+  max_length_targ, max_length_inp = \
+    max_length(target_tensor), max_length(input_tensor)
+
   # Creating training and validation sets using an 80-20 split
   inp_train, inp_val, target_train, target_val = train_test_split(
       input_tensor, target_tensor, test_size=0.2)
@@ -165,7 +168,8 @@ def create_dataset(path_to_file, num_examples, buffer_size, batch_size):
   test_dataset = tf.data.Dataset.from_tensor_slices((inp_val, target_val))
   test_dataset = test_dataset.batch(batch_size, drop_remainder=True)
 
-  return train_dataset, test_dataset, inp_lang, targ_lang
+  return train_dataset, test_dataset, inp_lang, targ_lang, \
+    max_length_targ, max_length_inp
 
 
 def get_common_kwargs():

From 79e5e6ec866ad37df8b05074aef505ac86c1fe56 Mon Sep 17 00:00:00 2001
From: Leslie-Fang
Date: Thu, 14 Nov 2019 22:19:20 +0800
Subject: [PATCH 2/5] enable nmt single sentence evaluation

---
 .../models/nmt_with_attention/evaluate.py     | 141 ++++++++++++++++++
 .../models/nmt_with_attention/nmt.py          |   2 +-
 2 files changed, 142 insertions(+), 1 deletion(-)
 create mode 100644 tensorflow_examples/models/nmt_with_attention/evaluate.py

diff --git a/tensorflow_examples/models/nmt_with_attention/evaluate.py b/tensorflow_examples/models/nmt_with_attention/evaluate.py
new file mode 100644
index 00000000000..cba2657aa9d
--- /dev/null
+++ b/tensorflow_examples/models/nmt_with_attention/evaluate.py
@@ -0,0 +1,141 @@
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+from absl import app, flags
+import tensorflow as tf # TF2
+from tensorflow_examples.models.nmt_with_attention import nmt
+from tensorflow_examples.models.nmt_with_attention import utils
+assert tf.__version__.startswith('2')
+
+FLAGS = flags.FLAGS
+
+class Evaluate(object):
+  """Evaluate class.
+
+  Attributes:
+    epochs: Number of epochs.
+    enable_function: Decorate function with tf.function.
+    encoder: Encoder.
+    decoder: Decoder.
+    inp_lang: Input language tokenizer.
+    targ_lang: Target language tokenizer.
+    batch_size: Batch size.
+    per_replica_batch_size: Batch size per replica for sync replicas. Same as
+        batch_size for non distributed training.
+    optimizer: Optimizer.
+    loss_object: Object of the loss class.
+    train_loss_metric: Mean metric to keep track of the train loss value.
+    test_loss_metric: Mean metric to keep track of the test loss value.
+  """
+
+  def __init__(self, encoder, decoder, inp_lang,
+               targ_lang, max_length_targ, max_length_inp):
+    self.encoder = encoder
+    self.decoder = decoder
+    self.inp_lang = inp_lang
+    self.targ_lang = targ_lang
+    self.optimizer = tf.keras.optimizers.Adam()
+    self.loss_object = tf.keras.losses.SparseCategoricalCrossentropy(
+        from_logits=True, reduction=tf.keras.losses.Reduction.NONE)
+    self.max_length_targ = max_length_targ
+    self.max_length_inp = max_length_inp
+
+  def evaluate(self, sentence):
+
+    sentence = utils.preprocess_sentence(sentence)
+
+    inputs = [self.inp_lang.word_index[i] for i in sentence.split(' ')]
+    inputs = tf.keras.preprocessing.sequence.pad_sequences([inputs],
+                                                           maxlen=self.max_length_inp,
+                                                           padding='post')
+    inputs = tf.convert_to_tensor(inputs)
+
+    result = ''
+
+    hidden = [tf.zeros((1, self.encoder.enc_units))]
+    enc_out, enc_hidden = self.encoder(inputs, hidden)
+
+    dec_hidden = enc_hidden
+    dec_input = tf.expand_dims([self.targ_lang.word_index['<start>']], 0)
+
+    for t in range(self.max_length_targ):
+      predictions, dec_hidden, attention_weights = self.decoder(dec_input,
+                                                                dec_hidden,
+                                                                enc_out)
+      predicted_id = tf.argmax(predictions[0]).numpy()
+
+      result += self.targ_lang.index_word[predicted_id] + ' '
+
+      if self.targ_lang.index_word[predicted_id] == '<end>':
+        # return result, sentence, attention_plot
+        return result, sentence
+
+      # the predicted ID is fed back into the model
+      dec_input = tf.expand_dims([predicted_id], 0)
+    return result, sentence
+
+def evaluate_flags():
+  flags.DEFINE_string('file_path', '/root/.keras/datasets/spa-eng/spa.txt', 'Download training dataset file')
+  flags.DEFINE_integer('embedding_dim', 256, 'Embedding dimension')
+  flags.DEFINE_integer('enc_units', 1024, 'Encoder GRU units')
+  flags.DEFINE_integer('dec_units', 1024, 'Decoder GRU units')
+  flags.DEFINE_integer('num_examples', 70000, 'Number of examples from dataset')
+
+def flags_dict():
+  """Define the flags.
+
+  Returns:
+    Command line arguments as Flags.
+ """ + + kwargs = { + 'file_path': FLAGS.file_path, + 'num_examples': FLAGS.num_examples, + 'embedding_dim': FLAGS.embedding_dim, + 'enc_units': FLAGS.enc_units, + 'dec_units': FLAGS.dec_units + } + return kwargs + + +def run_main(argv): + del argv + kwargs = flags_dict() + main(**kwargs) + + +def main(file_path, + num_examples=70000, embedding_dim=256, enc_units=1024, dec_units=1024): + + input_tensor, target_tensor, inp_lang, targ_lang = utils.load_dataset( + file_path, num_examples) + + max_length_targ, max_length_inp = \ + utils.max_length(target_tensor), utils.max_length(input_tensor) + + vocab_inp_size = len(inp_lang.word_index) + 1 + vocab_tar_size = len(targ_lang.word_index) + 1 + + encoder = nmt.Encoder(vocab_inp_size, embedding_dim, enc_units) + decoder = nmt.Decoder(vocab_tar_size, embedding_dim, dec_units) + + optimizer = tf.keras.optimizers.Adam() + + import os, sys + checkpoint_dir = os.path.join(sys.path[0] + '/training_checkpoints') + checkpoint = tf.train.Checkpoint(optimizer=optimizer, encoder=encoder, decoder=decoder) + status = checkpoint.restore(tf.train.latest_checkpoint(checkpoint_dir)) + print("status is {}".format(status)) + + eva_obj = Evaluate(encoder, decoder, + inp_lang, targ_lang, max_length_targ, max_length_inp) + print("*********start evaluate**********") + result, sentence = eva_obj.evaluate("Tom hizo todo lo que estuvo a su alcance para salvar a los niños atrapados en el edificio en llamas.") + print("{}:{}".format(sentence, result)) + +if __name__ == "__main__": + evaluate_flags() + app.run(run_main) + diff --git a/tensorflow_examples/models/nmt_with_attention/nmt.py b/tensorflow_examples/models/nmt_with_attention/nmt.py index 5105709756c..a71a3bdb540 100644 --- a/tensorflow_examples/models/nmt_with_attention/nmt.py +++ b/tensorflow_examples/models/nmt_with_attention/nmt.py @@ -32,7 +32,7 @@ class Encoder(tf.keras.Model): batch_sz: Batch size. """ - def __init__(self, vocab_size, embedding_dim, enc_units, batch_sz): + def __init__(self, vocab_size, embedding_dim, enc_units, batch_sz=64): super(Encoder, self).__init__() self.batch_sz = batch_sz self.enc_units = enc_units From 31fe6a1ae4716a27762115ee2c4577e3545f7d25 Mon Sep 17 00:00:00 2001 From: Leslie-Fang Date: Thu, 14 Nov 2019 22:42:05 +0800 Subject: [PATCH 3/5] fix pylint error --- .../models/nmt_with_attention/evaluate.py | 85 +++++++++++++------ .../models/nmt_with_attention/train.py | 3 +- 2 files changed, 58 insertions(+), 30 deletions(-) diff --git a/tensorflow_examples/models/nmt_with_attention/evaluate.py b/tensorflow_examples/models/nmt_with_attention/evaluate.py index cba2657aa9d..68ac0caaa0f 100644 --- a/tensorflow_examples/models/nmt_with_attention/evaluate.py +++ b/tensorflow_examples/models/nmt_with_attention/evaluate.py @@ -1,8 +1,25 @@ +# Copyright 2019 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""Evaluate. 
+"""
 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
 
+import os, sys
 from absl import app, flags
 import tensorflow as tf # TF2
 from tensorflow_examples.models.nmt_with_attention import nmt
 from tensorflow_examples.models.nmt_with_attention import utils
 assert tf.__version__.startswith('2')
@@ -43,13 +60,21 @@ def __init__(self, encoder, decoder, inp_lang,
     self.max_length_targ = max_length_targ
     self.max_length_inp = max_length_inp
 
   def evaluate(self, sentence):
 
+    """Custom evaluating step.
+
+    Args:
+      sentence: input sentence to evaluate
+
+    Returns:
+      result, sentence
+    """
     sentence = utils.preprocess_sentence(sentence)
 
     inputs = [self.inp_lang.word_index[i] for i in sentence.split(' ')]
-    inputs = tf.keras.preprocessing.sequence.pad_sequences([inputs],
-                                                           maxlen=self.max_length_inp,
-                                                           padding='post')
+    inputs = tf.keras.preprocessing.\
+        sequence.pad_sequences([inputs],
+                               maxlen=self.max_length_inp,
+                               padding='post')
     inputs = tf.convert_to_tensor(inputs)
 
     result = ''
@@ -60,28 +85,32 @@ def evaluate(self, sentence):
     hidden = [tf.zeros((1, self.encoder.enc_units))]
     enc_out, enc_hidden = self.encoder(inputs, hidden)
 
     dec_hidden = enc_hidden
     dec_input = tf.expand_dims([self.targ_lang.word_index['<start>']], 0)
 
-    for t in range(self.max_length_targ):
-      predictions, dec_hidden, attention_weights = self.decoder(dec_input,
-                                                                dec_hidden,
-                                                                enc_out)
-      predicted_id = tf.argmax(predictions[0]).numpy()
+    for _ in range(self.max_length_targ):
+      predictions, dec_hidden, _ = self.decoder(dec_input,
+                                                dec_hidden,
+                                                enc_out)
+      predicted_id = tf.argmax(predictions[0]).numpy()
 
-      result += self.targ_lang.index_word[predicted_id] + ' '
+      result += self.targ_lang.index_word[predicted_id] + ' '
 
-      if self.targ_lang.index_word[predicted_id] == '<end>':
-        # return result, sentence, attention_plot
-        return result, sentence
+      if self.targ_lang.index_word[predicted_id] == '<end>':
+        # return result, sentence, attention_plot
+        return result, sentence
 
-      # the predicted ID is fed back into the model
-      dec_input = tf.expand_dims([predicted_id], 0)
+      # the predicted ID is fed back into the model
+      dec_input = tf.expand_dims([predicted_id], 0)
     return result, sentence
 
 def evaluate_flags():
-  flags.DEFINE_string('file_path', '/root/.keras/datasets/spa-eng/spa.txt', 'Download training dataset file')
+  flags.DEFINE_string('file_path', '/root/.keras/datasets/spa-eng/spa.txt',
+                      'Download training dataset file')
   flags.DEFINE_integer('embedding_dim', 256, 'Embedding dimension')
   flags.DEFINE_integer('enc_units', 1024, 'Encoder GRU units')
   flags.DEFINE_integer('dec_units', 1024, 'Decoder GRU units')
-  flags.DEFINE_integer('num_examples', 70000, 'Number of examples from dataset')
+  flags.DEFINE_integer('num_examples', 70000,
+                       'Number of examples from dataset')
+  flags.DEFINE_integer('input_sentence', 'Halo.',
+                       'The input sentence to translate.')
 
 def flags_dict():
   """Define the flags.
@@ -95,7 +124,8 @@ def flags_dict():
     'num_examples': FLAGS.num_examples,
     'embedding_dim': FLAGS.embedding_dim,
     'enc_units': FLAGS.enc_units,
-    'dec_units': FLAGS.dec_units
+    'dec_units': FLAGS.dec_units,
+    'input_sentence': FLAGS.input_sentence
   }
   return kwargs
 
@@ -105,9 +135,8 @@ def run_main(argv):
   kwargs = flags_dict()
   main(**kwargs)
 
-
-def main(file_path,
-         num_examples=70000, embedding_dim=256, enc_units=1024, dec_units=1024):
+def main(file_path, num_examples=70000, embedding_dim=256,
+         enc_units=1024, dec_units=1024, input_sentence='Halo.'):
 
   input_tensor, target_tensor, inp_lang, targ_lang = utils.load_dataset(
       file_path, num_examples)
@@ -123,19 +152,19 @@ def main(file_path,
 
   optimizer = tf.keras.optimizers.Adam()
 
-  import os, sys
   checkpoint_dir = os.path.join(sys.path[0] + '/training_checkpoints')
-  checkpoint = tf.train.Checkpoint(optimizer=optimizer, encoder=encoder, decoder=decoder)
-  status = checkpoint.restore(tf.train.latest_checkpoint(checkpoint_dir))
-  print("status is {}".format(status))
+  checkpoint = tf.train.Checkpoint(optimizer=optimizer,
+                                   encoder=encoder,
+                                   decoder=decoder)
+  _ = checkpoint.restore(tf.train.latest_checkpoint(checkpoint_dir))
 
   eva_obj = Evaluate(encoder, decoder,
-          inp_lang, targ_lang, max_length_targ, max_length_inp)
+                     inp_lang, targ_lang, max_length_targ, max_length_inp)
   print("*********start evaluate**********")
-  result, sentence = eva_obj.evaluate("Tom hizo todo lo que estuvo a su alcance para salvar a los niños atrapados en el edificio en llamas.")
+  result, sentence = eva_obj.evaluate(input_sentence)
   print("{}:{}".format(sentence, result))
 
 if __name__ == "__main__":
-    evaluate_flags()
-    app.run(run_main)
+  evaluate_flags()
+  app.run(run_main)
diff --git a/tensorflow_examples/models/nmt_with_attention/train.py b/tensorflow_examples/models/nmt_with_attention/train.py
index 6eef4e7106a..a35d3af80bc 100644
--- a/tensorflow_examples/models/nmt_with_attention/train.py
+++ b/tensorflow_examples/models/nmt_with_attention/train.py
@@ -19,13 +19,13 @@
 from __future__ import division
 from __future__ import print_function
 
+import os, sys
 from absl import app
 import tensorflow as tf # TF2
 from tensorflow_examples.models.nmt_with_attention import nmt
 from tensorflow_examples.models.nmt_with_attention import utils
 assert tf.__version__.startswith('2')
 
-
 class Train(object):
   """Train class.
 
@@ -161,7 +161,6 @@ def training_loop(self, train_ds, test_ds):
         self.train_step((inp, targ))
 
       if epoch == self.epochs - 1:
-        import os, sys
         checkpoint_dir = os.path.join(sys.path[0]+'/training_checkpoints')
         checkpoint_prefix = os.path.join(checkpoint_dir, "ckpt")
         checkpoint = tf.train.Checkpoint(optimizer=self.optimizer,

From 9928de4723fe42f244e184fe14cfac6156e7397b Mon Sep 17 00:00:00 2001
From: Leslie-Fang
Date: Fri, 15 Nov 2019 04:29:23 +0800
Subject: [PATCH 4/5] change by pylint code style

---
 .../models/nmt_with_attention/evaluate.py     | 31 +++++----------------
 1 file changed, 5 insertions(+), 26 deletions(-)

diff --git a/tensorflow_examples/models/nmt_with_attention/evaluate.py b/tensorflow_examples/models/nmt_with_attention/evaluate.py
index 68ac0caaa0f..a63c83fa5d3 100644
--- a/tensorflow_examples/models/nmt_with_attention/evaluate.py
+++ b/tensorflow_examples/models/nmt_with_attention/evaluate.py
@@ -32,19 +32,14 @@ class Evaluate(object):
   """Evaluate class.
 
   Attributes:
-    epochs: Number of epochs.
-    enable_function: Decorate function with tf.function.
     encoder: Encoder.
     decoder: Decoder.
     inp_lang: Input language tokenizer.
     targ_lang: Target language tokenizer.
-    batch_size: Batch size.
-    per_replica_batch_size: Batch size per replica for sync replicas. Same as
-        batch_size for non distributed training.
+    max_length_targ: Maximum length of target sequences.
+    max_length_inp: Maximum length of input sequences.
     optimizer: Optimizer.
     loss_object: Object of the loss class.
-    train_loss_metric: Mean metric to keep track of the train loss value.
-    test_loss_metric: Mean metric to keep track of the test loss value.
   """
 
   def __init__(self, encoder, decoder, inp_lang,
@@ -69,34 +64,26 @@ def evaluate(self, sentence):
       result, sentence
     """
     sentence = utils.preprocess_sentence(sentence)
-
     inputs = [self.inp_lang.word_index[i] for i in sentence.split(' ')]
     inputs = tf.keras.preprocessing.\
         sequence.pad_sequences([inputs],
                                maxlen=self.max_length_inp,
                                padding='post')
     inputs = tf.convert_to_tensor(inputs)
-
     result = ''
-
     hidden = [tf.zeros((1, self.encoder.enc_units))]
     enc_out, enc_hidden = self.encoder(inputs, hidden)
-
     dec_hidden = enc_hidden
     dec_input = tf.expand_dims([self.targ_lang.word_index['<start>']], 0)
-
     for _ in range(self.max_length_targ):
       predictions, dec_hidden, _ = self.decoder(dec_input,
                                                 dec_hidden,
                                                 enc_out)
       predicted_id = tf.argmax(predictions[0]).numpy()
-
       result += self.targ_lang.index_word[predicted_id] + ' '
-
       if self.targ_lang.index_word[predicted_id] == '<end>':
         # return result, sentence, attention_plot
         return result, sentence
-
       # the predicted ID is fed back into the model
       dec_input = tf.expand_dims([predicted_id], 0)
     return result, sentence
@@ -108,9 +95,9 @@ def evaluate_flags():
   flags.DEFINE_integer('enc_units', 1024, 'Encoder GRU units')
   flags.DEFINE_integer('dec_units', 1024, 'Decoder GRU units')
   flags.DEFINE_integer('num_examples', 70000,
-                       'Number of examples from dataset')
-  flags.DEFINE_integer('input_sentence', 'Halo.',
-                       'The input sentence to translate.')
+      'Number of examples to extract from the dataset')
+  flags.DEFINE_string('input_sentence', 'Halo.',
+                      'The input sentence to translate.')
 
 def flags_dict():
   """Define the flags.
@@ -118,7 +105,6 @@ def flags_dict():
 
   Returns:
     Command line arguments as Flags.
""" - kwargs = { 'file_path': FLAGS.file_path, 'num_examples': FLAGS.num_examples, @@ -137,27 +123,20 @@ def run_main(argv): def main(file_path, num_examples=70000, embedding_dim=256, enc_units=1024, dec_units=1024, input_sentence='Halo.'): - input_tensor, target_tensor, inp_lang, targ_lang = utils.load_dataset( file_path, num_examples) - max_length_targ, max_length_inp = \ utils.max_length(target_tensor), utils.max_length(input_tensor) - vocab_inp_size = len(inp_lang.word_index) + 1 vocab_tar_size = len(targ_lang.word_index) + 1 - encoder = nmt.Encoder(vocab_inp_size, embedding_dim, enc_units) decoder = nmt.Decoder(vocab_tar_size, embedding_dim, dec_units) - optimizer = tf.keras.optimizers.Adam() - checkpoint_dir = os.path.join(sys.path[0] + '/training_checkpoints') checkpoint = tf.train.Checkpoint(optimizer=optimizer, encoder=encoder, decoder=decoder) _ = checkpoint.restore(tf.train.latest_checkpoint(checkpoint_dir)) - eva_obj = Evaluate(encoder, decoder, inp_lang, targ_lang, max_length_targ, max_length_inp) print("*********start evaluate**********") From abb1b5b4eb750a907535b7c1cdf1bb39bd869cda Mon Sep 17 00:00:00 2001 From: Leslie-Fang Date: Tue, 19 Nov 2019 00:00:23 +0800 Subject: [PATCH 5/5] add beam search --- .../models/nmt_with_attention/evaluate.py | 48 ++++-- .../evaluate_without_beam_search.py | 152 ++++++++++++++++++ 2 files changed, 191 insertions(+), 9 deletions(-) create mode 100644 tensorflow_examples/models/nmt_with_attention/evaluate_without_beam_search.py diff --git a/tensorflow_examples/models/nmt_with_attention/evaluate.py b/tensorflow_examples/models/nmt_with_attention/evaluate.py index a63c83fa5d3..4c2cd1f0609 100644 --- a/tensorflow_examples/models/nmt_with_attention/evaluate.py +++ b/tensorflow_examples/models/nmt_with_attention/evaluate.py @@ -54,11 +54,12 @@ def __init__(self, encoder, decoder, inp_lang, self.max_length_targ = max_length_targ self.max_length_inp = max_length_inp - def evaluate(self, sentence): + def evaluate(self, sentence, beam_width=1): """Custom evaluating step. Args: - sentence: input sentence to evaluate + sentence: input sentence to evaluate. + beam_width: beam search K. 
Returns: result, sentence @@ -74,18 +75,47 @@ def evaluate(self, sentence): hidden = [tf.zeros((1, self.encoder.enc_units))] enc_out, enc_hidden = self.encoder(inputs, hidden) dec_hidden = enc_hidden - dec_input = tf.expand_dims([self.targ_lang.word_index['']], 0) + dec_input_vector = tf.expand_dims([self.targ_lang.word_index['']], 0) + possbility_input = tf.expand_dims([1], 0) + first = True + for _ in range(self.max_length_targ): - predictions, dec_hidden, _ = self.decoder(dec_input, - dec_hidden, - enc_out) - predicted_id = tf.argmax(predictions[0]).numpy() + if first: + decode_input_numbers = 1 + first = False + else: + decode_input_numbers = beam_width + current_probability = [] + current_word = [] + for decode_input_number in range(0, decode_input_numbers): + # Go through each possible word in the beam search + dec_input = tf.slice(dec_input_vector, [0, decode_input_number], [1, 1]) + predictions, dec_hidden, _ = self.decoder(dec_input, + dec_hidden, + enc_out) + #Get the top beam_width most likely word + possible_word_list = tf.argsort(predictions[0], axis=-1, direction='DESCENDING', stable=False, name=None) + possible_word_list = tf.slice(possible_word_list, [0], [beam_width]) + for item in possible_word_list: + current_probability.append(predictions[0][item] * possbility_input[0][decode_input_number].numpy()) + current_word.append(item) + final_probability_index = tf.argsort(current_probability, axis=-1, direction='DESCENDING', stable=False, name=None) + final_probability_index = tf.slice(final_probability_index, [0], [beam_width]) + #Get the top beam_width from all of the possible output + possbility_input = [] + dec_input_vector = [] + for item in final_probability_index: + possbility_input.append(current_probability[item]) + dec_input_vector.append(current_word[item]) + possbility_input = tf.expand_dims(possbility_input, 0) + dec_input_vector = tf.expand_dims(dec_input_vector, 0) + + # Take the final top 1 into the result todo:take all the possible top beam_width result + predicted_id = dec_input_vector[0][0].numpy() result += self.targ_lang.index_word[predicted_id] + ' ' if self.targ_lang.index_word[predicted_id] == '': # return result, sentence, attention_plot return result, sentence - # the predicted ID is fed back into the model - dec_input = tf.expand_dims([predicted_id], 0) return result, sentence def evaluate_flags(): diff --git a/tensorflow_examples/models/nmt_with_attention/evaluate_without_beam_search.py b/tensorflow_examples/models/nmt_with_attention/evaluate_without_beam_search.py new file mode 100644 index 00000000000..c852cf74e2e --- /dev/null +++ b/tensorflow_examples/models/nmt_with_attention/evaluate_without_beam_search.py @@ -0,0 +1,152 @@ +# Copyright 2019 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""Evaluate. 
+""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import os, sys +from absl import app, flags +import tensorflow as tf # TF2 +from tensorflow_examples.models.nmt_with_attention import nmt +from tensorflow_examples.models.nmt_with_attention import utils +assert tf.__version__.startswith('2') + +FLAGS = flags.FLAGS + +class Evaluate(object): + """Train class. + + Attributes: + encoder: Encoder. + decoder: Decoder. + inp_lang: Input language tokenizer. + targ_lang: Target language tokenizer. + max_length_targ: target language max embedding feature dimension + max_length_inp: input language max embedding feature dimension + optimizer: Optimizer. + loss_object: Object of the loss class. + """ + + def __init__(self, encoder, decoder, inp_lang, + targ_lang, max_length_targ, max_length_inp): + self.encoder = encoder + self.decoder = decoder + self.inp_lang = inp_lang + self.targ_lang = targ_lang + self.optimizer = tf.keras.optimizers.Adam() + self.loss_object = tf.keras.losses.SparseCategoricalCrossentropy( + from_logits=True, reduction=tf.keras.losses.Reduction.NONE) + self.max_length_targ = max_length_targ + self.max_length_inp = max_length_inp + + def evaluate(self, sentence, beam_width=4): + """Custom evaluating step. + + Args: + sentence: input sentence to evaluate. + beam_width: beam search K. + + Returns: + result, sentence + """ + sentence = utils.preprocess_sentence(sentence) + inputs = [self.inp_lang.word_index[i] for i in sentence.split(' ')] + inputs = tf.keras.preprocessing.\ + sequence.pad_sequences([inputs], + maxlen=self.max_length_inp, + padding='post') + inputs = tf.convert_to_tensor(inputs) + result = '' + hidden = [tf.zeros((1, self.encoder.enc_units))] + enc_out, enc_hidden = self.encoder(inputs, hidden) + dec_hidden = enc_hidden + dec_input = tf.expand_dims([self.targ_lang.word_index['']], 0) + + for _ in range(self.max_length_targ): + predictions, dec_hidden, _ = self.decoder(dec_input, + dec_hidden, + enc_out) + + predicted_id = tf.argmax(predictions[0]).numpy() + result += self.targ_lang.index_word[predicted_id] + ' ' + if self.targ_lang.index_word[predicted_id] == '': + # return result, sentence, attention_plot + return result, sentence + # the predicted ID is fed back into the model + dec_input = tf.expand_dims([predicted_id], 0) + return result, sentence + +def evaluate_flags(): + flags.DEFINE_string('file_path', '/root/.keras/datasets/spa-eng/spa.txt', + 'Download training dataset file') + flags.DEFINE_integer('embedding_dim', 256, 'Embedding dimension') + flags.DEFINE_integer('enc_units', 1024, 'Encoder GRU units') + flags.DEFINE_integer('dec_units', 1024, 'Decoder GRU units') + flags.DEFINE_integer('num_examples', 70000, + 'Number of examples from dataset extract to analysis the feature') + flags.DEFINE_string('input_sentence', 'Halo.', + 'The input sentence to inference,') + +def flags_dict(): + """Define the flags. + + Returns: + Command line arguments as Flags. 
+ """ + kwargs = { + 'file_path': FLAGS.file_path, + 'num_examples': FLAGS.num_examples, + 'embedding_dim': FLAGS.embedding_dim, + 'enc_units': FLAGS.enc_units, + 'dec_units': FLAGS.dec_units, + 'input_sentence': FLAGS.input_sentence + } + return kwargs + + +def run_main(argv): + del argv + kwargs = flags_dict() + main(**kwargs) + +def main(file_path, num_examples=70000, embedding_dim=256, + enc_units=1024, dec_units=1024, input_sentence='Halo.'): + input_tensor, target_tensor, inp_lang, targ_lang = utils.load_dataset( + file_path, num_examples) + max_length_targ, max_length_inp = \ + utils.max_length(target_tensor), utils.max_length(input_tensor) + vocab_inp_size = len(inp_lang.word_index) + 1 + vocab_tar_size = len(targ_lang.word_index) + 1 + encoder = nmt.Encoder(vocab_inp_size, embedding_dim, enc_units) + decoder = nmt.Decoder(vocab_tar_size, embedding_dim, dec_units) + optimizer = tf.keras.optimizers.Adam() + checkpoint_dir = os.path.join(sys.path[0] + '/training_checkpoints') + checkpoint = tf.train.Checkpoint(optimizer=optimizer, + encoder=encoder, + decoder=decoder) + _ = checkpoint.restore(tf.train.latest_checkpoint(checkpoint_dir)) + eva_obj = Evaluate(encoder, decoder, + inp_lang, targ_lang, max_length_targ, max_length_inp) + print("*********start evaluate**********") + result, sentence = eva_obj.evaluate(input_sentence) + print("{}:{}".format(sentence, result)) + +if __name__ == "__main__": + evaluate_flags() + app.run(run_main) +
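
The beam-search bookkeeping that PATCH 5 adds to evaluate() can be hard to follow inside the decoder loop, so a minimal, self-contained sketch of the same idea follows for reference. It is illustrative only and is not the code in evaluate.py: the step(prefix) callable standing in for the encoder/decoder pair is a hypothetical assumption, it works on plain Python lists, and it accumulates log probabilities rather than multiplying raw probabilities.

import math


def beam_search(step, start_id, end_id, max_len, beam_width):
  """Keep the beam_width best partial sequences by accumulated log probability.

  step(prefix) is a hypothetical callable returning a list of
  (token_id, probability) pairs for the next token given a token prefix.
  """
  # Each hypothesis is a (token sequence, accumulated log probability) pair.
  beams = [([start_id], 0.0)]
  for _ in range(max_len):
    candidates = []
    for seq, score in beams:
      if seq[-1] == end_id:
        # Finished hypotheses are carried over unchanged.
        candidates.append((seq, score))
        continue
      for token_id, prob in step(seq):
        candidates.append((seq + [token_id], score + math.log(prob)))
    # Keep only the beam_width highest-scoring hypotheses.
    candidates.sort(key=lambda c: c[1], reverse=True)
    beams = candidates[:beam_width]
    if all(seq[-1] == end_id for seq, _ in beams):
      break
  return beams[0][0]

Scoring in log space avoids the numerical underflow that multiplying many probabilities below 1.0 can cause, and passing the whole prefix to step() sidesteps the question of which decoder hidden state belongs to which hypothesis; the patch instead keeps a single dec_hidden that is updated by each candidate's decoder call in turn.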