  1. import os
  2. import numpy as np
  3. import tensorflow as tf
  4. import time
  5. # 获取每张图片的路径
  6. def get_file(file_dir):
  7. image_list = []
  8. label_list = []
  9. for train_class in os.listdir(file_dir):
  10. for pic in os.listdir(file_dir + '/' + train_class):
  11. image_list.append(file_dir + '/' + train_class + '/' + pic)
  12. label_list.append(train_class)
  13. temp = np.array([image_list, label_list])
  14. temp = temp.transpose()
  15. np.random.shuffle(temp) # 打乱顺序
  16. label_list = [int(i) for i in label_list] # 数据类型转换
  17. return image_list, label_list
  18. # 读取图片产生训练样本
  19. def get_batch(image, label, image_W, image_H, batch_size, capacity):
  20. image = tf.cast(image, tf.string)
  21. label = tf.cast(label, tf.int32)
  22. input_queue = tf.train.slice_input_producer([image, label])
  23. label = input_queue[1]
  24. image_contens = tf.read_file(input_queue[0])
  25. image = tf.image.decode_jpeg(image_contens, channels=3)
  26. image = tf.image.resize_image_with_crop_or_pad(image, image_W, image_H)
  27. image = tf.image.per_image_standardization(image)
  28. image_batch, label_batch = tf.train.batch([image, label], batch_size=batch_size, num_threads=16, capacity=capacity)
  29. label_batch = tf.reshape(label_batch, [batch_size])
  30. image_batch = tf.cast(image_batch, tf.float32)
  31. return image_batch, label_batch
  32. def weight_variable(shape, n):
  33. initial = tf.truncated_normal(shape, stddev=n, dtype=tf.float32)
  34. return initial
  35. def bias_variable(shape):
  36. initial = tf.constant(0.1, shape=shape, dtype=tf.float32)
  37. return initial
  38. def conv2d(x, W):
  39. return tf.nn.conv2d(x, W, strides=[1, 1, 1, 1], padding="SAME")
  40. def max_pool_2x2(x, name):
  41. return tf.nn.max_pool(x, ksize=[1, 3, 3, 1], strides=[1, 2, 2, 1], padding="SAME", name=name)
  42. # 定义训练模型
  43. def inference(images, batch_size, n_classes):
  44. # 第一层卷积层
  45. with tf.variable_scope('conv1') as scope:
  46. w_conv1 = tf.Variable(weight_variable([3, 3, 3, 16], 1.0), name="weights", dtype=tf.float32)
  47. b_conv1 = tf.Variable(bias_variable([16]), name="blases", dtype=tf.float32)
  48. h_conv1 = tf.nn.relu(conv2d(images, w_conv1) + b_conv1, name="conv1")
  49. h_conv1_sum = tf.split(h_conv1, num_or_size_splits=4, axis=3) # 将特征图划分为[20, 56, 56, 4]
  50. tf.summary.image("h_conv1_image", h_conv1_sum[0], 5) # 保存卷积后的特征图
  51. # 第一层池化层
  52. with tf.variable_scope('pooling1_lrn') as scope:
  53. pool1 = max_pool_2x2(h_conv1, "pooling1")
  54. norm1 = tf.nn.lrn(pool1, depth_radius=4, bias=1.0, alpha=0.001 / 9.0, beta=0.75, name="norm1")
  55. pool1_sum = tf.split(pool1, num_or_size_splits=4, axis=3)
  56. tf.summary.image("pooling1", pool1_sum[0], 5) # 保存池化后的特征图
  57. # 第二层卷积层
  58. with tf.variable_scope('conv2') as scope:
  59. w_conv2 = tf.Variable(weight_variable([3, 3, 16, 32], 1.0), name="weights", dtype=tf.float32)
  60. b_conv2 = tf.Variable(bias_variable([32]), name="blases", dtype=tf.float32)
  61. h_conv2 = tf.nn.relu(conv2d(norm1, w_conv2) + b_conv2, name="conv2")
  62. h_conv2_sum = tf.split(h_conv2, num_or_size_splits=8, axis=3)
  63. tf.summary.image("h_conv2_image", h_conv2_sum[0], 5)
  64. # 第二层池化层
  65. with tf.variable_scope('pooling2_lrn') as scope:
  66. pool2 = max_pool_2x2(h_conv2, "pooling2")
  67. norm2 = tf.nn.lrn(pool2, depth_radius=4, bias=1.0, alpha=0.001 / 9.0, beta=0.75, name="norm2")
  68. pool2_sum = tf.split(pool2, num_or_size_splits=8, axis=3)
  69. tf.summary.image("pooling2", pool2_sum[0], 5)
  70. # 第三层卷积层
  71. with tf.variable_scope('conv3') as scope:
  72. w_conv3 = tf.Variable(weight_variable([3, 3, 32, 64], 1.0), name="weights", dtype=tf.float32)
  73. b_conv3 = tf.Variable(bias_variable([64]), name="blases", dtype=tf.float32)
  74. h_conv3 = tf.nn.relu(conv2d(norm2, w_conv3) + b_conv3, name="conv3")
  75. h_conv3_sum = tf.split(h_conv3, num_or_size_splits=16, axis=3)
  76. tf.summary.image("h_conv3_image", h_conv3_sum[0], 5)
  77. # 第三层池化层
  78. with tf.variable_scope('pooling3_lrn') as scope:
  79. pool3 = max_pool_2x2(h_conv3, "pooling2")
  80. norm3 = tf.nn.lrn(pool3, depth_radius=4, bias=1.0, alpha=0.001 / 9.0, beta=0.75, name="norm3")
  81. pool3_sum = tf.split(pool3, num_or_size_splits=16, axis=3)
  82. tf.summary.image("pooling3", pool3_sum[0], 5)
  83. # 第四层全连接层
  84. with tf.variable_scope('local3') as scope:
  85. reshape = tf.reshape(norm3, shape=[batch_size, -1])
  86. dim = reshape.get_shape()[1].value
  87. w_fc1 = tf.Variable(weight_variable([dim, 128], 0.005), name="weights", dtype=tf.float32)
  88. b_fc1 = tf.Variable(bias_variable([128]), name="blases", dtype=tf.float32)
  89. h_fc1 = tf.nn.relu(tf.matmul(reshape, w_fc1) + b_fc1, name=scope.name)
  90. # 第五层全连接层
  91. with tf.variable_scope('local4') as scope:
  92. w_fc2 = tf.Variable(weight_variable([128, 128], 0.005), name="weights", dtype=tf.float32)
  93. b_fc2 = tf.Variable(bias_variable([128]), name="blases", dtype=tf.float32)
  94. h_fc2 = tf.nn.relu(tf.matmul(h_fc1, w_fc2) + b_fc2, name=scope.name)
  95. h_fc2_dropout = tf.nn.dropout(h_fc2, 0.5) # 随机删除神经网络中的部分神经元,防止过拟合
  96. # 回归层
  97. with tf.variable_scope("sofemax_liner") as scope:
  98. weights = tf.Variable(weight_variable([128, n_classes], 0.005), name="softmax_linear", dtype=tf.float32)
  99. biases = tf.Variable(bias_variable([n_classes]), name="biases", dtype=tf.float32)
  100. softmax_linear = tf.add(tf.matmul(h_fc2_dropout, weights), biases, name="softmax_linear")
  101. return softmax_linear
  102. # 计算损失
  103. def losses(logits, labels):
  104. with tf.variable_scope("loss") as scope:
  105. cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(logits=logits, labels=labels, name="xentropy_per_example")
  106. loss = tf.reduce_mean(cross_entropy, name="loss")
  107. tf.summary.scalar(scope.name + "/loss", loss) # 保存损失模型
  108. return loss
  109. # loss损失值优化
  110. def trainning(loss, learning_rate):
  111. with tf.name_scope("oprimizer"):
  112. optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate)
  113. global_step = tf.Variable(0, name="global_step", trainable=False)
  114. train_op = optimizer.minimize(loss, global_step=global_step)
  115. return train_op
  116. # 准确率计算
  117. def evaluation(logits, labels):
  118. with tf.variable_scope("accuracy") as scope:
  119. correct = tf.nn.in_top_k(logits, labels, 1)
  120. accuracy = tf.reduce_mean(tf.cast(correct, tf.float16))
  121. tf.summary.scalar(scope.name + "/accuracy", accuracy) # 保存准确率模型
  122. return accuracy
  123. # ******************************************************************************************************************* #
  124. N_CLASSES = 5 # 图片的种类
  125. IMG_W = 56 # 图片宽度
  126. IMG_H = 56 # 图片高度
  127. BATCH_SIZE = 20 # 每次读取图片的数目
  128. CAPACITY = 200 # 读取队列的最大容量
  129. MAX_STEP = 10000 # 迭代次数
  130. learning_rate = 0.0001 # 学习率
  131. train_dir = "flowers" # 文件路径
  132. logs_train_dir = "CK-part/" # 日志保存路径
  133. # ******************************************************************************************************************* #
  134. train, train_label = get_file(train_dir) # 获取文件路径
  135. train_batch, train_label_batch = get_batch(train, train_label, IMG_W, IMG_H, BATCH_SIZE, CAPACITY) # 读取数据和标签
  136. # 构建训练模型
  137. train_logits = inference(train_batch, BATCH_SIZE, N_CLASSES)
  138. train_loss = losses(train_logits, train_label_batch)
  139. train_op = trainning(train_loss, learning_rate)
  140. train_acc = evaluation(train_logits, train_label_batch)
  141. image_summary = tf.summary.image("image", train_batch, 5) # 保存原始图片特征图
  142. summary_op = tf.summary.merge_all() # 混合所有summary类型log
  143. saver = tf.train.Saver() # 保存训练模型
  144. # ******************************************************************************************************************* #
  145. # 开始训练模型,并输出训练过程中的loss和accuracy
  146. if __name__ == "__main__":
  147. sess = tf.Session() # 开启一个会话
  148. train_writer = tf.summary.FileWriter(logs_train_dir, sess.graph) # 日志写入
  149. sess.run(tf.global_variables_initializer()) # 初始化全部模型参数
  150. coord = tf.train.Coordinator()
  151. threads = tf.train.start_queue_runners(sess=sess, coord=coord) # 启动线程
  152. try:
  153. print(time.strftime('%Y-%m-%d %H:%M:%S'))
  154. for step in np.arange(MAX_STEP):
  155. if coord.should_stop():
  156. break
  157. _, tra_loss, tra_acc = sess.run([train_op, train_loss, train_acc])
  158. if step % 10 == 0:
  159. print("Step %d, train loss = %.2f, train accuracy = %.2f%%" % (step, tra_loss, tra_acc * 100.0))
  160. summary_str = sess.run(summary_op)
  161. train_writer.add_summary(summary_str, step)
  162. checkpoint_path = os.path.join(logs_train_dir, "thing.ckpt")
  163. saver.save(sess, checkpoint_path)
  164. print(time.strftime('%Y-%m-%d %H:%M:%S'))
  165. except tf.errors.OutOfRangeError:
  166. print("Done training -- epoch limit reached")
  167. finally:
  168. coord.request_stop()
  169. coord.join(threads)
  170. sess.close()


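1. 指定日志目录(tf.summary.FileWriter(logs_train_dir, sess.graph))

2. 指定需要记录的数据(tf.summary.scalar、tf.summary.image 等)

3. 合并所有 summary 并写入日志(tf.summary.merge_all() 与 train_writer.add_summary())

4. 用 TensorBoard 查看数据

在 cmd 命令行中进入代码的日志目录(本例为 CK-part/),输入:tensorboard --logdir=./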













1. InvalidArgumentError (see above for traceback): Tensor must be 4-D with last dim 1, 3, or 4, not [20,56,56,16]

     解决办法:tf.summary.image 只接受最后一维为 1、3 或 4 的 4-D 张量,因此先用 tf.split 沿通道维(axis=3)把 [20,56,56,16] 切分为 4 份,每一份为 [20,56,56,4],只保存第一份。


2. tensorboard 

在 TensorBoard 的 SCALARS 页面查看时提示 KeyError: None,无法显示 loss 和 accuracy(该异常出现在 Windows 上)。


3.  W tensorflow/core/framework/op_kernel.cc:1401] OP_REQUIRES failed at save_restore_v2_ops.cc:137 : Unknown: Failed to rename: CK-part/thing.ckpt.index.tempstate10496770459040915805 to: CK-part/thing.ckpt.index : 拒绝访问。
; Input/output error



