forked from pratyusha2802/Pen-in-the-air
-
Notifications
You must be signed in to change notification settings - Fork 0
/
htm.py
102 lines (83 loc) · 3.38 KB
/
htm.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
# HandTrackingModule code, modified as needed for this project
import cv2
import mediapipe as mp
import time
class handDetector:
    """Thin wrapper around MediaPipe Hands for locating hand landmarks.

    The detector keeps the landmarks of the most recently analysed frame in
    ``lmList`` (entries of the form ``[landmark_id, x_px, y_px]``) so that
    ``fingersUp`` can be called right after ``findPosition``.
    """

    def __init__(self, mode=False, maxHands=2, complexity=1, detection_con=0.5, trackCon=0.5):
        """Store the configuration and build the MediaPipe Hands solution.

        Args:
            mode: Forwarded to MediaPipe as ``static_image_mode``.
            maxHands: Forwarded as ``max_num_hands``.
            complexity: Forwarded as ``model_complexity``.
            detection_con: Forwarded as ``min_detection_confidence``.
            trackCon: Forwarded as ``min_tracking_confidence``.
        """
        self.lmList = []
        self.mode = mode
        self.maxHands = maxHands
        self.detection_con = detection_con
        self.trackCon = trackCon
        self.complexity = complexity
        self.mpHands = mp.solutions.hands
        # Keyword arguments keep the mapping explicit instead of relying on
        # the positional order of the Hands constructor.
        self.hands = self.mpHands.Hands(
            static_image_mode=self.mode,
            max_num_hands=self.maxHands,
            model_complexity=self.complexity,
            min_detection_confidence=self.detection_con,
            min_tracking_confidence=self.trackCon,
        )
        self.mpDraw = mp.solutions.drawing_utils
        # Landmark ids of the five finger tips: thumb, index, middle, ring, pinky.
        self.tipIds = [4, 8, 12, 16, 20]

    def findHands(self, img, draw=True):
        """Run hand detection on ``img`` and optionally draw the hand skeletons.

        Args:
            img: Frame to analyse; it is converted with ``COLOR_BGR2RGB``
                before being handed to MediaPipe.
            draw: When true, landmarks and connections of every detected hand
                are drawn onto ``img`` in place.

        Returns:
            The colour-converted copy of ``img``.
        """
        imgRGB = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        results = self.hands.process(imgRGB)
        if draw and results.multi_hand_landmarks:
            for handLms in results.multi_hand_landmarks:
                self.mpDraw.draw_landmarks(img, handLms, self.mpHands.HAND_CONNECTIONS)
        # NOTE(review): the converted copy is returned, not the frame that was
        # drawn on, so the returned image carries no landmark overlay. Kept
        # as-is because callers may rely on it - confirm this is intended.
        return imgRGB

    def findPosition(self, img, handNo=0, draw=True):
        """Locate the landmarks of one hand in ``img``.

        Args:
            img: Frame to analyse (detection is run again on this frame).
            handNo: Index of the hand to report among the detected hands.
            draw: When true, a filled circle is drawn on every landmark and a
                rectangle around the hand, directly onto ``img``.

        Returns:
            A tuple ``(lmList, bbox)``. ``lmList`` holds one
            ``[landmark_id, x_px, y_px]`` entry per landmark of the selected
            hand and is empty when that hand was not found. ``bbox`` is
            ``[xmin, ymin, xmax, ymax]`` in pixels, all zeros when no hand
            was found.
        """
        # Start from a clean list on every call; otherwise landmarks pile up
        # across frames and index lookups keep hitting the first frame's data.
        self.lmList = []
        xList = []
        yList = []
        imgRGB = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
        results = self.hands.process(imgRGB)
        detected = results.multi_hand_landmarks
        # Only index into the detections when handNo is a valid index
        # (negative indices stay allowed, as with plain list indexing).
        if detected and -len(detected) <= handNo < len(detected):
            myHand = detected[handNo]
            height, width = img.shape[:2]
            for lm_id, lm in enumerate(myHand.landmark):
                # Landmark coordinates are scaled by the frame size to get pixels.
                cx, cy = int(lm.x * width), int(lm.y * height)
                xList.append(cx)
                yList.append(cy)
                self.lmList.append([lm_id, cx, cy])
                if draw:
                    cv2.circle(img, (cx, cy), 15, (255, 0, 255), cv2.FILLED)
        xmin, xmax = min(xList, default=0), max(xList, default=0)
        ymin, ymax = min(yList, default=0), max(yList, default=0)
        bbox = [xmin, ymin, xmax, ymax]
        # Skip the box when nothing was found, so no stray rectangle is drawn
        # around the all-zero default bounding box.
        if draw and xList:
            cv2.rectangle(img, (xmin - 20, ymin - 20), (xmax + 20, ymax + 20), (0, 255, 0), 2)
        return self.lmList, bbox

    def fingersUp(self):
        """Report which fingers are raised, based on the stored landmarks.

        The thumb counts as raised when its tip has a smaller x than the
        landmark just before it; every other finger counts as raised when its
        tip has a smaller y than the landmark two ids before it.

        Returns:
            A list with one 0/1 flag per entry of ``tipIds`` (thumb first).
            All flags are 0 when ``lmList`` does not hold enough landmarks,
            e.g. because no hand was found in the last frame.
        """
        if len(self.lmList) <= max(self.tipIds):
            return [0] * len(self.tipIds)
        thumb_tip = self.tipIds[0]
        # Thumb: compared along x.
        fingers = [1 if self.lmList[thumb_tip][1] < self.lmList[thumb_tip - 1][1] else 0]
        # Remaining fingers: compared along y.
        for tip in self.tipIds[1:]:
            fingers.append(1 if self.lmList[tip][2] < self.lmList[tip - 2][2] else 0)
        return fingers
def main(camera_index=1):
    """Run a live demo: detect a hand on camera frames and print landmark 4.

    Args:
        camera_index: Index of the capture device passed to
            ``cv2.VideoCapture``.

    The loop ends when ``q`` is pressed in the preview window or when the
    camera stops delivering frames.
    """
    # captures the video
    cap = cv2.VideoCapture(camera_index)
    detector = handDetector()
    try:
        while True:
            success, img = cap.read()
            if not success:
                # No frame (camera missing or disconnected): stop instead of
                # passing an invalid image on to the detector.
                break
            # NOTE(review): findHands appears to hand back a colour-converted
            # frame, which is then analysed and displayed as-is - confirm the
            # channel order is what imshow should receive.
            img = detector.findHands(img)
            lmList, bbox = detector.findPosition(img)
            if len(lmList) > 4:
                print(lmList[4])
            # shows the image
            cv2.imshow("Image", img)
            # poll the keyboard for up to 10 ms; quit when 'q' was pressed
            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
    finally:
        # Always free the camera and close the preview window.
        cap.release()
        cv2.destroyAllWindows()


if __name__ == "__main__":
    main()