-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathhand_tracking_module.py
74 lines (59 loc) · 2.59 KB
/
hand_tracking_module.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
import cv2
import mediapipe as mp
import time
class handDetector():
    """Wrapper around MediaPipe Hands for detecting hands and reading landmarks.

    Typical use is to call ``findHands`` on each frame (which runs the model
    and stores the result on ``self.results``) and then ``findPosition`` to
    read pixel coordinates of one hand's landmarks from that stored result.
    """

    # Landmark that ``findPosition`` highlights when drawing is enabled
    # (index 4 is the thumb tip in MediaPipe's hand landmark model).
    _HIGHLIGHT_LANDMARK_ID = 4

    def __init__(
        self,
        static_image_mode=False,
        max_num_hands=2,
        min_detection_confidence=0.5,
        min_tracking_confidence=0.5,
    ):
        """Create the underlying MediaPipe ``Hands`` solution.

        Args:
            static_image_mode: Forwarded to ``Hands(static_image_mode=...)``.
            max_num_hands: Forwarded to ``Hands(max_num_hands=...)``.
            min_detection_confidence: Forwarded to
                ``Hands(min_detection_confidence=...)``.
            min_tracking_confidence: Forwarded to
                ``Hands(min_tracking_confidence=...)``.
        """
        self.static_image_mode = static_image_mode
        self.max_num_hands = max_num_hands
        self.min_detection_confidence = min_detection_confidence
        self.min_tracking_confidence = min_tracking_confidence

        self.mpHands = mp.solutions.hands
        self.mpDraw = mp.solutions.drawing_utils

        # Pass by keyword: newer MediaPipe releases have a ``model_complexity``
        # parameter in third position, so positional arguments would feed the
        # detection confidence into the wrong slot.
        self.hands = self.mpHands.Hands(
            static_image_mode=self.static_image_mode,
            max_num_hands=self.max_num_hands,
            min_detection_confidence=self.min_detection_confidence,
            min_tracking_confidence=self.min_tracking_confidence,
        )

        # Populated by findHands(); None until the first frame is processed.
        self.results = None

    def findHands(self, img, draw=True):
        """Run hand detection on a BGR frame and optionally draw the skeleton.

        The detection result is stored on ``self.results`` for later use by
        ``findPosition``.

        Args:
            img: BGR image (it is converted to RGB before processing).
            draw: When true, landmarks and their connections are drawn onto
                ``img`` in place for every detected hand.

        Returns:
            The same ``img`` object that was passed in.
        """
        imgRGB = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        self.results = self.hands.process(imgRGB)

        detected_hands = self.results.multi_hand_landmarks
        if draw and detected_hands:
            for hand_landmarks in detected_hands:
                # HAND_CONNECTIONS makes draw_landmarks join the landmark points.
                self.mpDraw.draw_landmarks(
                    img, hand_landmarks, self.mpHands.HAND_CONNECTIONS
                )
        return img

    def findPosition(self, img, handNumber=0, draw=True):
        """Return pixel coordinates of every landmark of one detected hand.

        Uses the result stored by the most recent ``findHands`` call.

        Args:
            img: Image whose ``shape`` (height, width, channels) is used to
                scale landmark coordinates to pixels; also the drawing target.
            handNumber: Index into the list of detected hands.
            draw: When true, a filled circle is drawn on ``img`` at the
                highlighted landmark (index 4).

        Returns:
            A list of ``[landmark_id, x, y]`` entries in pixel units. The list
            is empty when ``findHands`` has not been called yet, no hand was
            detected, or ``handNumber`` does not refer to a detected hand.
        """
        landmark_list = []

        # getattr keeps this safe even if findHands() was never called.
        results = getattr(self, "results", None)
        if results is None or not results.multi_hand_landmarks:
            return landmark_list

        try:
            hand_landmarks = results.multi_hand_landmarks[handNumber]
        except IndexError:
            # Fewer hands in this frame than the caller asked for.
            return landmark_list

        height, width, _ = img.shape
        for landmark_id, landmark in enumerate(hand_landmarks.landmark):
            # landmark.x / landmark.y are scaled by the frame size to get pixels.
            x, y = int(landmark.x * width), int(landmark.y * height)
            landmark_list.append([landmark_id, x, y])
            if draw and landmark_id == self._HIGHLIGHT_LANDMARK_ID:
                cv2.circle(img, (x, y), 10, (255, 0, 0), cv2.FILLED)
        return landmark_list
def main():
    """Run a webcam demo of ``handDetector`` with an on-screen FPS counter.

    Frames are read from camera 0, hand landmarks are drawn on them, and
    landmark entry 8 of the first detected hand is printed for each frame in
    which a hand is found. The loop ends when a frame cannot be read or when
    the ``q`` key is pressed in the preview window; the camera and window are
    released on the way out.
    """
    video_capture = cv2.VideoCapture(0)
    prev_time = 0
    try:
        detector = handDetector()
        while True:
            success, img = video_capture.read()
            if not success:
                # No frame (camera missing or disconnected): img would be None
                # and cvtColor would fail, so stop instead.
                break

            img = detector.findHands(img)
            landmark_list = detector.findPosition(img)
            if landmark_list:
                print(landmark_list[8])

            current_time = time.time()
            elapsed = current_time - prev_time
            # Coarse clocks can report the same timestamp for two frames.
            fps = 1 / elapsed if elapsed > 0 else 0
            prev_time = current_time

            cv2.putText(
                img,
                f'FPS: {int(fps)}',
                (10, 70),
                cv2.FONT_HERSHEY_COMPLEX_SMALL,
                2,
                (0, 0, 255),
                2,
            )
            cv2.imshow("Image", img)

            # waitKey also services the GUI event loop; 'q' ends the demo.
            if cv2.waitKey(1) & 0xFF == ord("q"):
                break
    finally:
        video_capture.release()
        cv2.destroyAllWindows()
# Start the webcam demo only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()