TensorFlow入门:MNIST预测[restore问题]
变量的恢复可按照两种方式导入:
saver=tf.train.Saver() saver.restore(sess,'model.ckpt')
或者:
saver=tf.train.import_meta_graph(r'D:\tmp\tensorflow\mnist\model.ckpt.meta') saver.restore(sess,'model.ckpt')
两种方法的效果应该一致,但是实际结果不一样:
使用前者时预测结果是一致的;使用后者时,每次运行结果都不一致。无论是否重启spyde,现象都一样。
在使用前者时,必须在运行前重启spyde,否则会报错,为什么?Out_1等参数会随运行次数增加
INFO:tensorflow:Restoring parameters from D:/tmp/tensorflow/mnist/model.ckpt
Traceback (most recent call last):
File "<ipython-input-2-61410824b24c>", line 1, in <module>
runfile('D:/wangjc/pythonTest/TensorFlow/TestMNIST_Predict.py', wdir='D:/wangjc/pythonTest/TensorFlow')
......
File "D:\software\anaconda\envs\tensorflow\lib\site-packages\tensorflow\python\client\session.py", line 1052, in _do_call
raise type(e)(node_def, op, message)
NotFoundError: Key out_1/bias/bias not found in checkpoint
[[Node: save_1/RestoreV2_14 = RestoreV2[dtypes=[DT_FLOAT], _device="/job:localhost/replica:0/task:0/cpu:0"](_recv_save_1/Const_0, save_1/RestoreV2_14/tensor_names, save_1/RestoreV2_14/shape_and_slices)]]
Caused by op 'save_1/RestoreV2_14', defined at:
File "D:\software\anaconda\envs\tensorflow\lib\site-packages\spyder\utils\ipython\start_kernel.py", line 241, in <module>
main()
......File "D:\software\anaconda\envs\tensorflow\lib\site-packages\tensorflow\python\framework\ops.py", line 1228, in __init__
self._traceback = _extract_stack()
NotFoundError (see above for traceback): Key out_1/bias/bias not found in checkpoint
[[Node: save_1/RestoreV2_14 = RestoreV2[dtypes=[DT_FLOAT], _device="/job:localhost/replica:0/task:0/cpu:0"](_recv_save_1/Const_0, save_1/RestoreV2_14/tensor_names, save_1/RestoreV2_14/shape_and_slices)]]
NotFoundError: Key out_2/weight/weight not found in checkpoint
[[Node: save_2/RestoreV2_23 = RestoreV2[dtypes=[DT_FLOAT], _device="/job:localhost/replica:0/task:0/cpu:0"](_recv_save_2/Const_0, save_2/RestoreV2_23/tensor_names, save_2/RestoreV2_23/shape_and_slices)]]
Caused by op 'save_2/RestoreV2_23', defined at:
以上需要重启spyder的原因为saver恢复一次之后不能再次恢复,否则报错。
导致saver=tf.train.Saver()与saver=tf.train.import_meta_graph(r'D:\tmp\tensorflow\mnist\model.ckpt.meta')结果不同的原因是,后者在使用中可直接加载模型的参数,操作数等。
tf.get_default_graph()获取图
.get_tensor_by_name()获取张量
.get_operation_by_name()获取操作
注意对各部分命名。
使用下面方法的效果与直接读ckpt文件一致
saver = tf.train.Saver() ckpt=tf.train.get_checkpoint_state(r'D:\tmp\tensorflow\mnist') saver.restore(sess, ckpt.model_checkpoint_path)
可使用tf.get_collection('name')来读取恢复的变量
注意定义变量时最好标注标量名称,否则可能出现预测时加载参数不正确,定义方法为:
def weight_variable(shape):
#use normal distribution numbers with stddev 0.1 to initial the weight
initial=tf.truncated_normal(shape, stddev=0.1)
return tf.Variable(initial,name='weight')
-------------------------------------------------------------------------------------------------------------------------------
训练并保存模型 代码
# -*- coding: utf-8 -*-
"""
Created on Mon Sep 11 10:16:34 2017
multy layers softmax regression
@author: Wangjc
"""
import tensorflow as tf
import os
import tensorflow.examples.tutorials.mnist.input_data as input_data
#need to show the full address, or error occus.
mnist = input_data.read_data_sets('MNIST_data', one_hot=True)
#use read_data_sets to download and load the mnist data set. if has the data, then load.
#need a long time about 5 minutes
sess = tf.InteractiveSession()
#link the back-end of C++ to compute.
#in norm cases, we should create the map and then run in the sussion.
#now, use a more convenient class named InteractiveSession which could insert compute map when running map.
x=tf.placeholder("float",shape=[None,784])
y_=tf.placeholder("float",shape=[None,10])
def weight_variable(shape):
#use normal distribution numbers with stddev 0.1 to initial the weight
initial=tf.truncated_normal(shape, stddev=0.1)
return tf.Variable(initial,name='weight')
def bias_variable(shape):
#use constant value of 0.1 to initial the bias
initial=tf.constant(0.1, shape=shape)
return tf.Variable(initial,name='bias')
def conv2d(x,W):
#convolution by filter of W,with step size of 1, 0 padding size
#x should have the dimension of [batch,height,width,channels]
#other dimension of strides or ksize is the same with x
return tf.nn.conv2d(x,W,strides=[1,1,1,1],padding='SAME')
def max_pool_2x2(x):
#pool by windows of ksize,with step size of 2, 0 padding size
return tf.nn.max_pool(x,ksize=[1,2,2,1],
strides=[1,2,2,1],padding='SAME')
#------------------------------------------------
x_image = tf.reshape(x, [-1,28,28,1])
#to use conv1, need to convert x to 4D, in form of [batch,height,width,channels]
# -1 means default
with tf.name_scope('conv1'):
#use 'with' and name_scope to define a name space which will show in tensorboard as a ragion
with tf.name_scope('weight'):
W_conv1=weight_variable([5,5,1,32])
tf.summary.histogram('conv1'+'/weight',W_conv1)
#summary the variation ('name', value)
with tf.name_scope('bias'):
b_conv1=bias_variable([32])
tf.summary.histogram('conv1'+'/bias',b_conv1)
#build the first conv layer:
#get 32 features from every 5*5 patch, so the shape is [5,5,1(channel),32]
h_conv1 = tf.nn.relu(conv2d(x_image, W_conv1) + b_conv1)
with tf.name_scope('pool1'):
h_pool1 = max_pool_2x2(h_conv1)
#--------------------------------------------
with tf.name_scope('conv2'):
with tf.name_scope('weight'):
W_conv2=weight_variable([5,5,32,64])
tf.summary.histogram('weight',W_conv2)
with tf.name_scope('bias'):
b_conv2=bias_variable([64])
tf.summary.histogram('bias',b_conv2)
#build the 2nd conv layer:
#get 64 features from every 5*5 patch, so the shape is [5,5,32(channel),64]
h_conv2 = tf.nn.relu(conv2d(h_pool1, W_conv2) + b_conv2)
with tf.name_scope('pool2'):
h_pool2 = max_pool_2x2(h_conv2)
#----------------------------------------
#image size reduce to 7*7 by pooling
#we add a full connect layer contains 1027 nuere
#need to flat pool tensor for caculate
with tf.name_scope('fc1'):
with tf.name_scope('weight'):
W_fc1 = weight_variable([7*7*64, 1024])
tf.summary.histogram('weight',W_fc1)
with tf.name_scope('bias'):
b_fc1 = bias_variable([1024])
tf.summary.histogram('bias',b_fc1)
h_pool2_flat = tf.reshape(h_pool2,[-1, 7*7*64])
h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat,W_fc1) + b_fc1)
#------------------------------------
#output layer
with tf.name_scope('out'):
keep_prob = tf.placeholder("float")
h_fc1_drop = tf.nn.dropout(h_fc1,keep_prob)
#to decrease overfit, we add dropout before output layer.
#use placeholder to represent the porbability of a neure's output value unchange
with tf.name_scope('weight'):
W_fc2 = weight_variable([1024, 10])
tf.summary.histogram('weight',W_fc2)
with tf.name_scope('bias'):
b_fc2 = bias_variable([10])
tf.summary.histogram('bias',b_fc2)
y_conv = tf.nn.softmax(tf.matmul(h_fc1_drop, W_fc2) + b_fc2)
#---------------------------------
#train and evaluate the module
#use a ADAM
cross_entropy=-tf.reduce_sum(y_*tf.log(y_conv))
tf.summary.scalar('cross_entropy',cross_entropy)
##summary the constant ('name', value)
train_step=tf.train.AdamOptimizer(1e-4).minimize(cross_entropy)
correct_prediction = tf.equal(tf.argmax(y_conv,1), tf.argmax(y_,1))
accuracy = tf.reduce_mean(tf.cast(correct_prediction, "float"))
#sess = tf.Session()
merged=tf.summary.merge_all()
#merge all the summary nodes
writer=tf.summary.FileWriter('D:/tmp/tensorflow/mnist/',sess.graph)
# assign the event file write directory
saver=tf.train.Saver()
#saver for variation.Dafault to save all.
checkpoint_file = os.path.join('D:/tmp/tensorflow/mnist/', 'model.ckpt')
#save directroy for variation
sess.run(tf.global_variables_initializer())
for i in range(100):
batch = mnist.train.next_batch(50)
if i%100 == 0:
train_accuracy = accuracy.eval(feed_dict={x:batch[0], y_:batch[1],keep_prob:1.0})
# saver.save(sess,checkpoint_file)
# saver.save(sess,checkpoint_file,global_step=i)
#save variation
print("step %d, training accuracy %g"%(i, train_accuracy))
result=sess.run(merged,feed_dict={x: batch[0], y_: batch[1], keep_prob: 0.5})
#the merged summary need to be run
writer.add_summary(result,i)
#add the result to summary
train_step.run(feed_dict={x: batch[0], y_: batch[1], keep_prob: 0.5})
print("test accuracy %g"%accuracy.eval(feed_dict={
x: mnist.test.images, y_: mnist.test.labels, keep_prob: 1.0}))
saver.save(sess,checkpoint_file)
读取图片,恢复参数并预测 代码
# -*- coding: utf-8 -*-
"""
Created on Mon Sep 11 10:16:34 2017
multy layers softmax regression
@author: Wangjc
"""
import tensorflow as tf
import os
import cv2
import matplotlib.pyplot as plt
#need to show the full address, or error occus.
imgs0=cv2.imread(r'D:\tmp\tensorflow\imgs\_1.png',0)
plt.imshow(imgs0)
plt.show()
imgs=imgs0/255
#imgs=(255-imgs0)/255
imgs.shape=(1,784)
sess = tf.InteractiveSession()
#link the back-end of C++ to compute.
#in norm cases, we should create the map and then run in the sussion.
#now, use a more convenient class named InteractiveSession which could insert compute map when running map.
x=tf.placeholder("float",shape=[None,784])
def weight_variable(shape):
#use normal distribution numbers with stddev 0.1 to initial the weight
initial=tf.truncated_normal(shape, stddev=0.1)
return tf.Variable(initial,name='weight')
def bias_variable(shape):
#use constant value of 0.1 to initial the bias
initial=tf.constant(0.1, shape=shape)
return tf.Variable(initial,name='bias')
def conv2d(x,W):
#convolution by filter of W,with step size of 1, 0 padding size
#x should have the dimension of [batch,height,width,channels]
#other dimension of strides or ksize is the same with x
return tf.nn.conv2d(x,W,strides=[1,1,1,1],padding='SAME')
def max_pool_2x2(x):
#pool by windows of ksize,with step size of 2, 0 padding size
return tf.nn.max_pool(x,ksize=[1,2,2,1],
strides=[1,2,2,1],padding='SAME')
#------------------------------------------------
x_image = tf.reshape(x, [-1,28,28,1])
#to use conv1, need to convert x to 4D, in form of [batch,height,width,channels]
# -1 means default
with tf.name_scope('conv1'):
#use 'with' and name_scope to define a name space which will show in tensorboard as a ragion
with tf.name_scope('weight'):
W_conv1=weight_variable([5,5,1,32])
# tf.summary.histogram('conv1'+'/weight',W_conv1)
#summary the variation ('name', value)
with tf.name_scope('bias'):
b_conv1=bias_variable([32])
# tf.summary.histogram('conv1'+'/bias',b_conv1)
#build the first conv layer:
#get 32 features from every 5*5 patch, so the shape is [5,5,1(channel),32]
h_conv1 = tf.nn.relu(conv2d(x_image, W_conv1) + b_conv1)
with tf.name_scope('pool1'):
h_pool1 = max_pool_2x2(h_conv1)
#--------------------------------------------
with tf.name_scope('conv2'):
with tf.name_scope('weight'):
W_conv2=weight_variable([5,5,32,64])
# tf.summary.histogram('weight',W_conv2)
with tf.name_scope('bias'):
b_conv2=bias_variable([64])
# tf.summary.histogram('bias',b_conv2)
#build the 2nd conv layer:
#get 64 features from every 5*5 patch, so the shape is [5,5,32(channel),64]
h_conv2 = tf.nn.relu(conv2d(h_pool1, W_conv2) + b_conv2)
with tf.name_scope('pool2'):
h_pool2 = max_pool_2x2(h_conv2)
#----------------------------------------
#image size reduce to 7*7 by pooling
#we add a full connect layer contains 1027 nuere
#need to flat pool tensor for caculate
with tf.name_scope('fc1'):
with tf.name_scope('weight'):
W_fc1 = weight_variable([7*7*64, 1024])
# tf.summary.histogram('weight',W_fc1)
with tf.name_scope('bias'):
b_fc1 = bias_variable([1024])
# tf.summary.histogram('bias',b_fc1)
h_pool2_flat = tf.reshape(h_pool2,[-1, 7*7*64])
h_fc1 = tf.nn.relu(tf.matmul(h_pool2_flat,W_fc1) + b_fc1)
#------------------------------------
#output layer
with tf.name_scope('out'):
keep_prob = tf.placeholder("float")
# h_fc1_drop = tf.nn.dropout(h_fc1,keep_prob)
#to decrease overfit, we add dropout before output layer.
#use placeholder to represent the porbability of a neure's output value unchange
with tf.name_scope('weight'):
W_fc2 = weight_variable([1024, 10])
# tf.summary.histogram('weight',W_fc2)
with tf.name_scope('bias'):
b_fc2 = bias_variable([10])
# tf.summary.histogram('bias',b_fc2)
y_conv = tf.nn.softmax(tf.matmul(h_fc1, W_fc2) + b_fc2)
#---------------------------------
#saver=tf.train.import_meta_graph(r'D:\tmp\tensorflow\mnist\model.ckpt.meta')
saver=tf.train.Saver()
#saver for variation.Dafault to save all.
checkpoint_file = os.path.join('D:/tmp/tensorflow/mnist/', 'model.ckpt')
#save directroy for variation
sess.run(tf.global_variables_initializer())
saver.restore(sess,checkpoint_file)
#saver.recover_last_checkpoints(checkpoint_file)
#prediction=tf.argmax(y_conv,1)
#result=prediction.eval(feed_dict={x: imgs})
result=sess.run(tf.argmax(y_conv,1),feed_dict={x: imgs,keep_prob: 0.5})
#result=prediction.eval(feed_dict={x: imgs,keep_prob: 0.5})
print('recognize result')
print(result[0])

浙公网安备 33010602011771号