-
Notifications
You must be signed in to change notification settings - Fork 10
/
Copy pathutils.py
172 lines (127 loc) · 5.89 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
import random
import sys
import time
from datetime import datetime
from enum import Enum
import cv2
import numpy as np
from typing import Tuple, Union
from webcam import WebcamSource
def get_monitor_dimensions() -> Union[Tuple[Tuple[int, int], Tuple[int, int]], Tuple[None, None]]:
    """
    Ask Gdk for the size of the default screen, both physical and in pixels.
    Adapted from https://github.com/NVlabs/few_shot_gaze/blob/master/demo/monitor.py
    :return: ((width_mm, height_mm), (width_pixels, height_pixels)), or (None, None) if a required module is missing
    """
    try:
        # pgi is imported lazily so the rest of the module works without it
        import pgi

        pgi.install_as_gi()
        import gi.repository

        gi.require_version('Gdk', '3.0')
        from gi.repository import Gdk

        gdk_screen = Gdk.Display.get_default().get_default_screen().get_default()
        screen_number = gdk_screen.get_number()

        height_mm = gdk_screen.get_monitor_height_mm(screen_number)
        width_mm = gdk_screen.get_monitor_width_mm(screen_number)
        size_mm = (width_mm, height_mm)

        height_pixels = gdk_screen.get_height()
        width_pixels = gdk_screen.get_width()
        size_pixels = (width_pixels, height_pixels)
    except ModuleNotFoundError:
        # Everything stays inside the try: any missing module along the way means "dimensions unknown"
        size_mm = size_pixels = None

    return size_mm, size_pixels
# Text rendering settings shared by cv2.getTextSize and cv2.putText when the target character is drawn.
FONT = cv2.FONT_HERSHEY_SIMPLEX
# Font scale factor passed to OpenCV; the rendered text width also determines the circle radius.
TEXT_SCALE = 0.5
# Stroke thickness of the rendered character.
TEXT_THICKNESS = 2
class TargetOrientation(Enum):
    """
    Direction in which the target character is shown.

    Each value is the key code that `cv2.waitKey(...) & 0xFF` must return for the capture to be triggered.
    NOTE(review): these look like the arrow-key codes reported by OpenCV's GTK backend on Linux; confirm on other platforms.
    """
    # Member order matters: random.choice(list(TargetOrientation)) depends on it when the RNG is seeded.
    UP = 82
    DOWN = 84
    LEFT = 81
    RIGHT = 83
def create_image(monitor_pixels: Tuple[int, int], center=(0, 0), circle_scale=1., orientation=TargetOrientation.RIGHT, target='E') -> Tuple[np.ndarray, float, bool]:
    """
    Create image to display on screen.

    The target is always drawn upright on a working canvas, which is then mirrored and/or
    transposed so that the character faces the requested direction while staying centred on `center`.

    :param monitor_pixels: monitor dimensions in pixels (width, height)
    :param center: center of the circle and the text, in screen coordinates (x, y)
    :param circle_scale: scale of the circle
    :param orientation: orientation of the target
    :param target: char to write on image
    :return: created image (values divided by 255), new smaller circle_scale and bool that indicates if it is the last frame in the animation
    """
    width, height = monitor_pixels

    # Anything that is not LEFT/RIGHT is treated as vertical (UP/DOWN), as before.
    transposed = orientation not in (TargetOrientation.LEFT, TargetOrientation.RIGHT)
    mirrored = orientation in (TargetOrientation.LEFT, TargetOrientation.UP)

    if transposed:
        # Vertical targets are drawn on a canvas with swapped axes and transposed back at the end.
        canvas_width, canvas_height = height, width
        center = (center[1], center[0])
    else:
        canvas_width, canvas_height = width, height

    img = np.zeros((canvas_height, canvas_width, 3), np.float32)

    if mirrored:
        # cv2.flip(img, 1) maps column j to canvas_width - 1 - j, so pre-mirror the centre with
        # the same formula; using canvas_width - x would leave the target one pixel off.
        center = (canvas_width - 1 - center[0], center[1])

    end_animation_loop = write_text_on_image(center, circle_scale, img, target)

    if mirrored:
        img = cv2.flip(img, 1)
    if transposed:
        img = img.transpose((1, 0, 2))

    # Colours were drawn in the 0..255 range; scale to 0..1 for display as a float image.
    return img / 255, circle_scale * 0.9, end_animation_loop
def write_text_on_image(center: Tuple[int, int], circle_scale: float, img: np.ndarray, target: str):
    """
    Draw the filled circle and the target character onto img and decide whether this is the final animation frame.
    :param center: center of the circle and the text
    :param circle_scale: scale of the circle
    :param img: image that is drawn on in place
    :param target: char to write
    :return: True if this is the last frame of the animation
    """
    (text_width, text_height), _ = cv2.getTextSize(target, FONT, TEXT_SCALE, TEXT_THICKNESS)

    # The circle radius is tied to the rendered text width and shrinks with circle_scale.
    radius = int(text_width * 5 * circle_scale)
    cv2.circle(img, center, radius, (32, 32, 32), -1)

    # Shift the text anchor so the glyph ends up centred on `center`.
    anchor = (center[0] - text_width // 2, center[1] + text_height // 2)

    # The animation ends once the scale drops below a threshold drawn at random for every frame.
    is_last_frame = circle_scale < random.uniform(0.1, 0.5)

    # The last frame uses a different text colour than the running animation.
    text_colour = (252, 125, 11) if is_last_frame else (17, 112, 170)
    cv2.putText(img, target, anchor, FONT, TEXT_SCALE, text_colour, TEXT_THICKNESS, cv2.LINE_AA)

    return is_last_frame
def get_random_position_on_screen(monitor_pixels: Tuple[int, int]) -> Tuple[int, int]:
    """
    Pick a random pixel position that lies on the monitor.
    :param monitor_pixels: monitor dimensions in pixels
    :return: tuple of random x and y coordinates, each truncated to an int
    """
    # x is drawn before y so the sequence of random draws is unchanged
    x = int(random.uniform(0, 1) * monitor_pixels[0])
    y = int(random.uniform(0, 1) * monitor_pixels[1])
    return x, y
def show_point_on_screen(window_name: str, base_path: str, monitor_pixels: Tuple[int, int], source: WebcamSource) -> Tuple[str, Tuple[int, int], Union[float, None]]:
    """
    Show one target on screen for a full animation cycle and try to capture a webcam frame.

    The target shrinks at a random position until the animation ends. After that there is a
    0.5 s window in which pressing the key matching the target orientation saves a frame
    from `source` to `{base_path}/{file_name}.jpg`. Pressing 'q' during the animation closes
    all windows and exits the program.

    :param window_name: name of the window to draw on
    :param base_path: path where to save the image to
    :param monitor_pixels: monitor dimensions in pixels
    :param source: webcam source
    :return: image file name, target center and seconds between animation end and capture;
             the time is None if the key was not pressed in time or the image could not be written
    """
    circle_scale = 1.
    center = get_random_position_on_screen(monitor_pixels)
    orientation = random.choice(list(TargetOrientation))

    end_animation_loop = False
    while not end_animation_loop:
        image, circle_scale, end_animation_loop = create_image(monitor_pixels, center, circle_scale, orientation)
        cv2.imshow(window_name, image)

        for _ in range(10):  # workaround to not speed up the animation when buttons are pressed
            if cv2.waitKey(50) & 0xFF == ord('q'):
                cv2.destroyAllWindows()
                sys.exit()

    # The loop above only exits once the last animation frame has been shown.
    file_name = datetime.now().strftime("%Y_%m_%d-%H_%M_%S")
    time_till_capture = None
    start_time_color_change = time.time()

    while time.time() - start_time_color_change < 0.5:
        if cv2.waitKey(42) & 0xFF == orientation.value:
            # Drop buffered frames so the saved image is taken after the key press.
            source.clear_frame_buffer()
            # cv2.imwrite reports failure through its return value; only count the
            # capture when the file was actually written.
            if cv2.imwrite(f'{base_path}/{file_name}.jpg', next(source)):
                time_till_capture = time.time() - start_time_color_change
            break

    # Blank the screen briefly before the next target is shown.
    cv2.imshow(window_name, np.zeros((monitor_pixels[1], monitor_pixels[0], 3), np.float32))
    cv2.waitKey(500)

    return f'{file_name}.jpg', center, time_till_capture