# hand_tracking/hand_tracking_module.py

import cv2
import mediapipe as mp
import time

class handDetector:
    """Wrapper around MediaPipe Hands that detects hands and reports landmarks.

    Typical use is to call ``findHands`` on each frame (which runs detection
    and stores the result on the instance) and then ``findPosition`` to read
    the pixel coordinates of one detected hand's landmarks.
    """

    def __init__(self, static_image_mode=False, max_num_hands=2, min_detection_confidence=0.5, min_tracking_confidence=0.5):
        """Store the configuration and build the MediaPipe ``Hands`` solution.

        Args:
            static_image_mode: Forwarded to ``Hands`` as ``static_image_mode``.
            max_num_hands: Forwarded to ``Hands`` as ``max_num_hands``.
            min_detection_confidence: Forwarded to ``Hands`` as
                ``min_detection_confidence``.
            min_tracking_confidence: Forwarded to ``Hands`` as
                ``min_tracking_confidence``.
        """
        self.static_image_mode = static_image_mode
        self.max_num_hands = max_num_hands
        self.min_detection_confidence = min_detection_confidence
        self.min_tracking_confidence = min_tracking_confidence

        self.mpHands = mp.solutions.hands
        self.mpDraw = mp.solutions.drawing_utils
        # Pass every option by keyword: the positional order of Hands() is
        # not stable across MediaPipe releases (newer versions insert
        # ``model_complexity`` before the confidence thresholds), so
        # positional arguments would end up in the wrong parameters.
        self.hands = self.mpHands.Hands(
            static_image_mode=self.static_image_mode,
            max_num_hands=self.max_num_hands,
            min_detection_confidence=self.min_detection_confidence,
            min_tracking_confidence=self.min_tracking_confidence,
        )
        # Result of the most recent findHands() call; None until it has run.
        self.results = None

    def findHands(self, img, draw=True):
        """Run hand detection on a BGR frame and optionally draw the result.

        The detection result is stored in ``self.results`` for later use by
        ``findPosition``.

        Args:
            img: Frame in BGR channel order (it is converted to RGB before
                being handed to MediaPipe).
            draw: When true, draw the landmarks and their connections for
                every detected hand onto ``img`` in place.

        Returns:
            The same ``img`` object that was passed in.
        """
        imgRGB = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        self.results = self.hands.process(imgRGB)

        detected_hands = self.results.multi_hand_landmarks
        if draw and detected_hands:
            for hand_landmarks in detected_hands:
                # HAND_CONNECTIONS joins the landmark points with lines.
                self.mpDraw.draw_landmarks(img, hand_landmarks, self.mpHands.HAND_CONNECTIONS)

        return img

    def findPosition(self, img, handNumber=0, draw=True):
        """Return pixel coordinates of the landmarks of one detected hand.

        Uses the result stored by the most recent ``findHands`` call.

        Args:
            img: Frame whose height and width are used to scale the
                normalized landmark coordinates to pixels.
            handNumber: Index into the list of detected hands.
            draw: When true, draw a filled circle on landmark 4 onto ``img``.

        Returns:
            A list of ``[landmark_id, x, y]`` entries, or an empty list when
            ``findHands`` has not been called yet, no hand was detected, or
            ``handNumber`` does not refer to a detected hand.
        """
        # getattr keeps this safe even if findHands() has never been called.
        results = getattr(self, "results", None)
        detected_hands = getattr(results, "multi_hand_landmarks", None)
        if not detected_hands:
            return []

        # The number of visible hands changes from frame to frame, so a
        # missing hand is reported the same way as "no hands at all".
        try:
            hand_landmarks = detected_hands[handNumber]
        except IndexError:
            return []

        # Only height and width are needed; slicing also accepts frames
        # without a channel axis.
        height, width = img.shape[:2]

        landmark_list = []
        for landmark_id, landmark in enumerate(hand_landmarks.landmark):
            x, y = int(landmark.x * width), int(landmark.y * height)
            landmark_list.append([landmark_id, x, y])
            if draw and landmark_id == 4:
                cv2.circle(img, (x, y), 10, (255, 0, 0), cv2.FILLED)

        return landmark_list

def main():
    """Run a webcam demo: detect hands, print landmark 8, and show the FPS.

    Frames are read from capture device 0 until a frame cannot be read or
    the user presses ``q`` in the preview window. The capture device and the
    OpenCV windows are always released on exit.
    """
    video_capture = cv2.VideoCapture(0)
    prev_time = 0

    try:
        detector = handDetector()
        while True:
            success, img = video_capture.read()
            # read() reports failure (camera missing/unplugged, stream ended)
            # through its flag; stop instead of passing None to OpenCV.
            if not success or img is None:
                break

            img = detector.findHands(img)
            landmark_list = detector.findPosition(img)
            if len(landmark_list) > 8:
                print(landmark_list[8])

            current_time = time.time()
            elapsed = current_time - prev_time
            # Two timestamps can be equal on coarse clocks; avoid dividing by 0.
            fps = 1 / elapsed if elapsed > 0 else 0
            prev_time = current_time

            cv2.putText(img, f'FPS: {int(fps)}', (10, 70), cv2.FONT_HERSHEY_COMPLEX_SMALL, 2, (0, 0, 255), 2)
            cv2.imshow("Image", img)
            # waitKey also services the GUI event loop; 'q' ends the demo.
            if cv2.waitKey(1) & 0xFF == ord('q'):
                break
    finally:
        video_capture.release()
        cv2.destroyAllWindows()


# Run the demo loop only when this file is executed as a script, not on import.
if __name__=="__main__":
    main()