-
Notifications
You must be signed in to change notification settings - Fork 23
/
run.py
69 lines (51 loc) · 2.26 KB
/
run.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
import cv2
import numpy as np
import mediapipe as mp
# MediaPipe hand-landmark tracker: video (non-static) mode, at most two
# hands, detection and tracking confidence thresholds both set to 0.1.
mp_hands = mp.solutions.hands
hands = mp_hands.Hands(
    static_image_mode=False,
    max_num_hands=2,
    min_detection_confidence=0.1,
    min_tracking_confidence=0.1,
)
mp_drawing = mp.solutions.drawing_utils

# Open capture device index 0.
cap = cv2.VideoCapture(0)

# Load the matrix M from disk; the main loop hands it to
# cv2.perspectiveTransform to warp the detected landmark points.
M = np.load("M.npy")

# Size (in pixels) of the canvas the warped landmarks are drawn on.
width = 1920
height = 1200
# Main loop: read camera frames, detect hand landmarks, warp the landmark
# pixel coordinates through M, and draw the warped points on a black
# full-screen canvas. Runs until 'q' is pressed or a frame cannot be read.

# The display window is created once, outside the loop, because its setup
# does not depend on the frame. WINDOW_NORMAL is the window-creation flag;
# WND_PROP_FULLSCREEN is a property id and belongs to setWindowProperty.
window_name = "Final Image"
cv2.namedWindow(window_name, cv2.WINDOW_NORMAL)
cv2.setWindowProperty(window_name, cv2.WND_PROP_FULLSCREEN, cv2.WINDOW_FULLSCREEN)

try:
    while True:
        ret, frame = cap.read()
        # If the frame was not read, exit
        if not ret:
            print("Failed to capture frame")
            break

        # Convert BGR (OpenCV's channel order) to RGB before inference.
        rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        # Run inference for hand detection
        results = hands.process(rgb_frame)

        # Start every frame from an empty (black) canvas.
        output_image = np.zeros((height, width, 3), np.uint8)

        frame_h, frame_w = frame.shape[:2]
        # multi_hand_landmarks is falsy when no hand was detected.
        for hand_landmarks in results.multi_hand_landmarks or ():
            # Scale each landmark's x/y by the frame size and truncate to
            # whole pixels, then store as float32 for perspectiveTransform.
            landmark_coords = np.array(
                [
                    [int(landmark.x * frame_w), int(landmark.y * frame_h)]
                    for landmark in hand_landmarks.landmark
                ],
                dtype=np.float32,
            )
            print(f"Original Landmark Coordinates: {landmark_coords}")

            # perspectiveTransform wants a (1, N, 2) array; take the single
            # row back out to get the N warped points.
            transformed_coords = cv2.perspectiveTransform(
                landmark_coords[np.newaxis], M
            )[0]
            print(f"Transformed Landmark Coordinates: {transformed_coords}")

            # Draw each warped landmark as a filled dot labelled with its index.
            for i, (x, y) in enumerate(transformed_coords):
                point = (int(x), int(y))
                cv2.circle(output_image, point, 5, (0, 255, 0), -1)
                cv2.putText(
                    output_image,
                    f'ID:{i}',
                    point,
                    cv2.FONT_HERSHEY_SIMPLEX,
                    0.5,
                    (255, 255, 255),
                    1,
                )

        # Display the final image
        cv2.imshow(window_name, output_image)
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
finally:
    # Always give the camera and windows back, even if the loop raised
    # (e.g. Ctrl-C or an OpenCV error), then free the MediaPipe graph.
    cap.release()
    cv2.destroyAllWindows()
    hands.close()