# encoding:utf-8

import numpy as np

# Load the vocabulary list and the pre-trained word vectors.
wordsList = np.load('wordsList.npy')
print('Loaded word list')
wordsList = wordsList.tolist()
wordVectors = np.load('wordVectors.npy')
print('Loaded word vectors')

print(len(wordsList))
print(wordVectors.shape)
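
# Sanity-check sketch (the word 'good' is just an assumed example token):
# each row of wordVectors is the embedding of the word at the same index
# in wordsList.
if 'good' in wordsList:
    print(wordVectors[wordsList.index('good')].shape)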

import os
from os.path import isfile, join

# Collect the positive and negative review files and count the words in each.
pos_files = ['pos/' + f for f in os.listdir('pos/') if isfile(join('pos/', f))]
neg_files = ['neg/' + f for f in os.listdir('neg/') if isfile(join('neg/', f))]
num_words = []
for pf in pos_files:
    with open(pf, "r", encoding='utf-8') as f:
        line = f.readline()
        counter = len(line.split())
        num_words.append(counter)
print('Finished positive reviews')

for nf in neg_files:
    with open(nf, "r", encoding='utf-8') as f:
        line = f.readline()
        counter = len(line.split())
        num_words.append(counter)
print('Finished negative reviews')

num_files = len(num_words)
print('Total number of files', num_files)
print('Total number of words', sum(num_words))
print('Average words per file', sum(num_words) / len(num_words))

import re

strip_special_chars = re.compile("[^A-Za-z0-9 ]+")
num_dimensions = 300  # Dimensions for each word vector


def cleanSentences(string):
    # Replace HTML line breaks with spaces, then drop everything that is
    # not a letter, digit, or space.
    string = string.lower().replace("<br />", " ")
    return re.sub(strip_special_chars, "", string.lower())
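
# Example (sketch): cleanSentences("Great movie!<br />10/10")
# returns "great movie 1010".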


max_seq_num = 250

# ... (intermediate section not shown in this diff) ...

batch_size = 24
lstm_units = 64
num_labels = 2
iterations = 100
lr = 0.001
ids = np.load('idsMatrix.npy')

from random import randint  # required by the batch helpers below


def get_train_batch():
    labels = []
    arr = np.zeros([batch_size, max_seq_num])
    for i in range(batch_size):
        # Even slots draw a positive review, odd slots a negative one,
        # keeping each training batch balanced.
        if i % 2 == 0:
            num = randint(1, 11499)
            labels.append([1, 0])
        else:
            num = randint(13499, 24999)
            labels.append([0, 1])
        arr[i] = ids[num - 1:num]
    return arr, labels


def get_test_batch():
    # Rows 11499-13499 of the ids matrix are held out for testing; the
    # first half are positive reviews, the rest negative.
    labels = []
    arr = np.zeros([batch_size, max_seq_num])
    for i in range(batch_size):
        num = randint(11499, 13499)
        if num <= 12499:
            labels.append([1, 0])
        else:
            labels.append([0, 1])
        arr[i] = ids[num - 1:num]
    return arr, labels
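
# Shape note (sketch): both helpers return (arr, labels), where arr has
# shape (batch_size, max_seq_num) of word ids and labels is a list of
# batch_size one-hot [pos, neg] pairs.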


import tensorflow as tf

tf.reset_default_graph()

labels = tf.placeholder(tf.float32, [batch_size, num_labels])
# The next two lines fall in a gap between diff hunks and are reconstructed
# from context (assumed): the int32 token-index placeholder and the
# `data = tf.Variable(` opener for the dangling tf.zeros() continuation.
input_data = tf.placeholder(tf.int32, [batch_size, max_seq_num])
data = tf.Variable(
    tf.zeros([batch_size, max_seq_num, num_dimensions]), dtype=tf.float32)
data = tf.nn.embedding_lookup(wordVectors, input_data)

lstmCell = tf.contrib.rnn.BasicLSTMCell(lstm_units)
lstmCell = tf.contrib.rnn.DropoutWrapper(cell=lstmCell, output_keep_prob=0.5)
value, _ = tf.nn.dynamic_rnn(lstmCell, data, dtype=tf.float32)

# Classify from the final hidden state of the sequence.
weight = tf.Variable(tf.truncated_normal([lstm_units, num_labels]))
bias = tf.Variable(tf.constant(0.1, shape=[num_labels]))
value = tf.transpose(value, [1, 0, 2])
last = tf.gather(value, int(value.get_shape()[0]) - 1)
prediction = (tf.matmul(last, weight) + bias)

correct_pred = tf.equal(tf.argmax(prediction, 1), tf.argmax(labels, 1))
accuracy = tf.reduce_mean(tf.cast(correct_pred, tf.float32))

loss = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(
    logits=prediction, labels=labels))
optimizer = tf.train.AdamOptimizer(lr).minimize(loss)

saver = tf.train.Saver()

with tf.Session() as sess:
    # Restore a saved model if one exists; otherwise initialize from scratch.
    if os.path.exists("models") and os.path.exists("models/checkpoint"):
        saver.restore(sess, tf.train.latest_checkpoint('models'))
    else:
        # tf.initialize_all_variables() is only needed on builds older than 0.12.
        if int(tf.__version__.split('.')[0]) < 1 and int(tf.__version__.split('.')[1]) < 12:
            init = tf.initialize_all_variables()
        else:
            init = tf.global_variables_initializer()
        sess.run(init)

    iterations = 100
    for step in range(iterations):
        next_batch, next_batch_labels = get_test_batch()
        if step % 20 == 0:
            print("step:", step, " accuracy:", (sess.run(
                accuracy, {input_data: next_batch, labels: next_batch_labels})) * 100)

    if not os.path.exists("models"):
        os.mkdir("models")
    save_path = saver.save(sess, "models/model.ckpt")
    print("Model saved in path: %s" % save_path)