-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathHandDetector.py
76 lines (63 loc) · 2.74 KB
/
HandDetector.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
import numpy as np
import tensorflow as tf
import cv2 as cv
# Hand-tracking whiteboard: runs a frozen object-detection graph on webcam
# frames and draws a stroke on a white canvas that follows the centre of the
# largest detected box.

MODEL_PATH = 'frozen_inference_graph.pb'
INPUT_SIZE = (300, 300)        # size the frame is resized to before inference
MIN_SCORE = 0.5                # detections at or below this score are ignored
DRAW_COLOR = (125, 255, 51)    # colour used for both boxes and strokes
QUIT_KEYS = (27, ord('q'))     # ESC or 'q' ends the capture loop
OUTPUT_TENSORS = (
    'num_detections:0',
    'detection_scores:0',
    'detection_boxes:0',
    'detection_classes:0',
)


def _load_graph_def(path):
    """Read the serialized frozen graph at *path* and return it as a GraphDef."""
    with tf.gfile.FastGFile(path, 'rb') as f:
        graph_def = tf.GraphDef()
        graph_def.ParseFromString(f.read())
    return graph_def


def find_largest_detection(scores, boxes, num_detections, rows, cols,
                           min_score=MIN_SCORE):
    """Select the largest confident detection and collect all confident boxes.

    Args:
        scores: per-detection confidence values, indexable by detection.
        boxes: per-detection 4-element boxes, used here in the order
            (top, left, bottom, right) as fractions of the frame size.
        num_detections: how many leading entries of scores/boxes to inspect.
        rows: frame height in pixels, used to scale top/bottom.
        cols: frame width in pixels, used to scale left/right.
        min_score: a detection is kept only when its score is strictly
            greater than this value.

    Returns:
        A pair ``(center, rects)``. ``center`` is the integer (x, y) midpoint
        of the kept box with the largest positive area, or ``None`` when no
        such box exists. ``rects`` lists every kept box as integer
        ``(left, top, right, bottom)`` pixel coordinates, in input order.
    """
    rects = []
    largest_area = 0
    center = None
    for i in range(num_detections):
        if float(scores[i]) <= min_score:
            continue
        top, left, bottom, right = (float(v) for v in boxes[i])
        x = left * cols
        y = top * rows
        right = right * cols
        bottom = bottom * rows
        rects.append((int(x), int(y), int(right), int(bottom)))
        area = (right - x) * (bottom - y)
        if area > largest_area:
            largest_area = area
            center = (int((right - x) / 2 + x), int((y - bottom) / 2 + bottom))
    return center, rects


def main():
    """Run the webcam capture / detection / drawing loop until ESC or 'q'.

    Raises:
        RuntimeError: if the first frame cannot be read from camera 0.
    """
    vc = cv.VideoCapture(0)
    try:
        # The first frame only determines the size of the whiteboard canvas.
        ok, img = vc.read()
        if not ok or img is None:
            raise RuntimeError('Could not read a frame from camera 0')
        whiteboard = np.full(img.shape, 255, dtype=np.uint8)

        graph_def = _load_graph_def(MODEL_PATH)
        with tf.Session() as sess:
            with sess.graph.as_default():
                tf.import_graph_def(graph_def, name='')
            # Resolve the output tensors once instead of on every frame.
            fetches = [sess.graph.get_tensor_by_name(name)
                       for name in OUTPUT_TENSORS]

            started_drawing = False
            last_point = (0, 0)
            while True:
                ok, img = vc.read()
                if ok:
                    # Mirror the frame so on-screen motion matches the user's.
                    img = cv.flip(img, 1)
                    rows, cols = img.shape[0], img.shape[1]
                    inp = cv.resize(img, INPUT_SIZE)
                    inp = inp[:, :, [2, 1, 0]]  # BGR2RGB

                    out = sess.run(
                        fetches,
                        feed_dict={'image_tensor:0': inp.reshape(
                            1, inp.shape[0], inp.shape[1], 3)})

                    center, rects = find_largest_detection(
                        out[1][0], out[2][0], int(out[0][0]), rows, cols)
                    for left, top, right, bottom in rects:
                        cv.rectangle(img, (left, top), (right, bottom),
                                     DRAW_COLOR, thickness=2)

                    # Paint. The stroke is not broken when the detection is
                    # lost: the next segment starts at the last known point.
                    if center is not None:
                        if started_drawing:
                            cv.line(whiteboard, last_point, center,
                                    DRAW_COLOR, thickness=2)
                        started_drawing = True
                        last_point = center

                    cv.imshow("Webcam", img)
                    cv.imshow("Whiteboard", whiteboard)

                # Poll the keyboard even when a frame was dropped so the user
                # can always leave the loop.
                if cv.waitKey(1) & 0xFF in QUIT_KEYS:
                    break
    finally:
        # Free the camera and close the windows on every exit path.
        vc.release()
        cv.destroyAllWindows()


if __name__ == "__main__":
    main()