-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathframeTrackingModule.py
77 lines (64 loc) · 2.81 KB
/
frameTrackingModule.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
import cv2
import mediapipe as mp
class poseDetector():
    """Convenience wrapper around MediaPipe's ``Pose`` solution.

    Typical use is to call ``findPose`` on every frame and then
    ``findPosition`` to obtain the landmarks of that frame in pixel units.

    Args:
        mode: Forwarded to ``Pose`` as ``static_image_mode``.
        complexity: Forwarded to ``Pose`` as ``model_complexity``.
        smooth: Forwarded to ``Pose`` as ``smooth_landmarks``.
        enableSeg: Forwarded to ``Pose`` as ``enable_segmentation``.
        smoothSeg: Forwarded to ``Pose`` as ``smooth_segmentation``.
        detectConf: Forwarded to ``Pose`` as ``min_detection_confidence``.
        trackConf: Forwarded to ``Pose`` as ``min_tracking_confidence``.
    """

    # Output of the most recent ``findPose`` call.  Defined at class level so
    # that ``findPosition`` is safe to call before any frame was processed.
    results = None

    def __init__(self, mode=False, complexity=1, smooth=True,
                 enableSeg=False, smoothSeg=True,
                 detectConf=0.5, trackConf=0.5):
        self.mode = mode
        self.complexity = complexity
        self.smooth = smooth
        self.enableSeg = enableSeg
        self.smoothSeg = smoothSeg
        self.detectConf = detectConf
        self.trackConf = trackConf

        # Drawing helpers for the landmarks and the skeleton lines between them.
        self.mpDraw = mp.solutions.drawing_utils
        self.mpPose = mp.solutions.pose

        # Keyword arguments are used on purpose: passing these positionally
        # binds them to the wrong parameters whenever the constructor's
        # parameter order differs between MediaPipe releases.
        self.pose = self.mpPose.Pose(
            static_image_mode=self.mode,
            model_complexity=self.complexity,
            smooth_landmarks=self.smooth,
            enable_segmentation=self.enableSeg,
            smooth_segmentation=self.smoothSeg,
            min_detection_confidence=self.detectConf,
            min_tracking_confidence=self.trackConf,
        )

    def findPose(self, img, draw=True):
        """Run pose estimation on one frame and optionally draw the skeleton.

        The detection result is stored on ``self.results`` for later use by
        ``findPosition``.

        Args:
            img: Frame in BGR channel order (it is converted to RGB before
                being handed to ``Pose.process``).
            draw: When true and a pose was found, draw the landmarks and
                their connections onto ``img`` in place.

        Returns:
            The same ``img`` object that was passed in.
        """
        imgRGB = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        self.results = self.pose.process(imgRGB)

        if draw and self.results.pose_landmarks:
            self.mpDraw.draw_landmarks(img, self.results.pose_landmarks,
                                       self.mpPose.POSE_CONNECTIONS)
        return img

    def findPosition(self, img, draw=True):
        """Return the landmarks of the last processed frame in pixel units.

        Args:
            img: Frame whose ``shape`` supplies the height and width used for
                scaling; also the drawing target when ``draw`` is true.
            draw: When true, mark every landmark's (x, y) with a filled
                circle on ``img``.

        Returns:
            A list of ``[index, x, y, z]`` entries, one per landmark.  The
            list is empty when no frame has been processed yet or when the
            last frame contained no pose.
        """
        lmList = []
        results = self.results
        if results is None or not results.pose_landmarks:
            return lmList

        # The frame size is constant for the whole loop, so read it once.
        # Slicing also keeps this working for frames without a channel axis.
        h, w = img.shape[:2]

        for idx, lm in enumerate(results.pose_landmarks.landmark):
            # Scale the landmark coordinates to pixels; z is scaled by the
            # image width, same as x.
            cx, cy, cz = int(lm.x * w), int(lm.y * h), int(lm.z * w)
            lmList.append([idx, cx, cy, cz])
            if draw:
                # Mark the (x, y) point so the mapping can be checked visually.
                cv2.circle(img, (cx, cy), 5,
                           (255, 0, 8), cv2.FILLED)
        return lmList
# Demo entry point: plays a video with the detected pose drawn on every frame.
def main(video_path='Videos/breakdance.mp4'):
    """Play a video while drawing the detected pose on each frame.

    Playback stops when the video has no more frames or when the ``q`` key
    is pressed in the preview window.

    Args:
        video_path: Source handed to ``cv2.VideoCapture``.

    Raises:
        OSError: If the video source cannot be opened.
    """
    capture = cv2.VideoCapture(video_path)
    if not capture.isOpened():
        raise OSError("Could not open video source: {}".format(video_path))

    detector = poseDetector()
    try:
        while True:
            success, img = capture.read()
            if not success:
                # No frame was returned (e.g. end of the video); without this
                # check the next call would receive ``None`` and crash.
                break

            img = detector.findPose(img)
            # Called for its drawing side effect: it marks every landmark on
            # the frame.  The returned list is not needed here.
            detector.findPosition(img)

            cv2.imshow("Image", img)
            # waitKey also lets the window refresh; 'q' ends playback early.
            if cv2.waitKey(1) & 0xFF == ord('q'):
                break
    finally:
        # Always give the video handle and the preview window back.
        capture.release()
        cv2.destroyAllWindows()
# Run the demo only when this file is executed directly as a script.
# When the module is imported from elsewhere, main() is not called.
if __name__ == "__main__":
    main()