我用tensorflow为诗人重新训练了我的模型,开始模式。预测需要0.4秒,排序需要2秒。由于它需要很长的时间,所以框架是滞后的,在预测时会被置乱。有任何方法,我可以使框架平滑,虽然预测需要时间?以下是我的代码..。
camera = cv2.VideoCapture(0)
# Loads label file, strips off carriage return
label_lines = [line.rstrip() for line
in tf.gfile.GFile('retrained_labels.txt')]
def grabVideoFeed():
grabbed, frame = camera.read()
return frame if grabbed else None
def initialSetup():
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'
start_time = timeit.default_timer()
# This takes 2-5 seconds to run
# Unpersists graph from file
with tf.gfile.FastGFile('retrained_graph.pb', 'rb') as f:
graph_def = tf.GraphDef()
graph_def.ParseFromString(f.read())
tf.import_graph_def(graph_def, name='')
print 'Took {} seconds to unpersist the graph'.format(timeit.default_timer() - start_time)
initialSetup()
with tf.Session() as sess:
start_time = timeit.default_timer()
# Feed the image_data as input to the graph and get first prediction
softmax_tensor = sess.graph.get_tensor_by_name('final_result:0')
print 'Took {} seconds to feed data to graph'.format(timeit.default_timer() - start_time)
while True:
frame = grabVideoFeed()
if frame is None:
raise SystemError('Issue grabbing the frame')
frame = cv2.resize(frame, (299, 299), interpolation=cv2.INTER_CUBIC)
cv2.imshow('Main', frame)
# adhere to TS graph input structure
numpy_frame = np.asarray(frame)
numpy_frame = cv2.normalize(numpy_frame.astype('float'), None, -0.5, .5, cv2.NORM_MINMAX)
numpy_final = np.expand_dims(numpy_frame, axis=0)
start_time = timeit.default_timer()
# This takes 2-5 seconds as well
predictions = sess.run(softmax_tensor, {'Mul:0': numpy_final})
print 'Took {} seconds to perform prediction'.format(timeit.default_timer() - start_time)
start_time = timeit.default_timer()
# Sort to show labels of first prediction in order of confidence
top_k = predictions[0].argsort()[-len(predictions[0]):][::-1]
print 'Took {} seconds to sort the predictions'.format(timeit.default_timer() - start_time)
for node_id in top_k:
human_string = label_lines[node_id]
score = predictions[0][node_id]
print('%s (score = %.5f)' % (human_string, score))
print '********* Session Ended *********'
if cv2.waitKey(1) & 0xFF == ord('q'):
sess.close()
break
camera.release()
cv2.destroyAllWindows()发布于 2017-07-31 09:28:42
@dat-tran是正确的,虽然fater rcnn是快速的,但它也会滞后somewhat.For不滞后,你可以使用yolo,ssd模型,我用了yolo它是好的。
对于队列和多处理,可以使用以下代码。
from utils import FPS, WebcamVideoStream
from multiprocessing import Process, Queue, Pool
def worker(input_q, output_q):
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'
start_time = timeit.default_timer()
# This takes 2-5 seconds to run
# Unpersists graph from file
graph_def = tf.Graph()
with graph_def.as_default():
graph_def_ = tf.GraphDef()
with tf.gfile.FastGFile('retrained_graph.pb', 'rb') as f:
graph_def_.ParseFromString(f.read())
tf.import_graph_def(graph_def_, name='')
sess = tf.Session(graph=graph_def)
fps = FPS().start()
while True:
fps.update()
frame = input_q.get()
numpy_frame = np.asarray(frame)
numpy_frame = cv2.normalize(numpy_frame.astype('float'), None, -0.5, .5, cv2.NORM_MINMAX)
numpy_final = np.expand_dims(numpy_frame, axis=0)
start_time = timeit.default_timer()
# This takes 2-5 seconds as well
predictions = sess.run(softmax_tensor, {'Mul:0': numpy_final})
print 'Took {} seconds to perform prediction'.format(timeit.default_timer() - start_time)
start_time = timeit.default_timer()
# Sort to show labels of first prediction in order of confidence
top_k = predictions[0].argsort()[-len(predictions[0]):][::-1]
print 'Took {} seconds to sort the predictions'.format(timeit.default_timer() - start_time)
for node_id in top_k:
human_string = label_lines[node_id]
score = predictions[0][node_id]
print('%s (score = %.5f)' % (human_string, score))
output_q.put(frame)
fps.stop()
sess.close()
if __name__ == '__main__':
input_q = Queue(maxsize=10)
output_q = Queue(maxsize=10)
process = Process(target=worker, args=((input_q, output_q)))
process.daemon = True
pool = Pool(1, worker, (input_q, output_q))
video_capture = WebcamVideoStream(src=0,
width=args.width,
height=args.height).start()
fps = FPS().start()
while (video_capture.isOpened()):
_,frame = video_capture.read()
input_q.put(frame)
cv2.namedWindow('Image', cv2.WINDOW_NORMAL)
cv2.resizeWindow('Image', 600, 600)
cv2.imshow('Image', output_q.get())
fps.update()
if cv2.waitKey(1) & 0xFF == ord('q'):
break
fps.stop()发布于 2017-07-31 08:39:03
问题是,这是因为太滞后是由于您使用的模型。这些模型不是为低延迟而制作的。使您的帧更平滑的一种方法是像Mobilenet或frame这样的模型,它们速度更快,但精度更低。万一你对我在媒体上写到这件事感兴趣。
如果您仍然想使用您的模型,另一个选项是使用队列和多处理。您可以设置一个队列来加载映像,另一个队列只能在加载另一个队列之前进行预测。最后,这两个队列需要同步在一起。
https://stackoverflow.com/questions/45409937
复制相似问题