DE-GUI/Main.py at master · Garrett-R16/DE-GUI · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
from PyQt6 import QtWidgets, uic, QtCore, QtGui
import time
import cv2
import sys
import warnings
warnings.simplefilter("ignore", UserWarning)
sys.coinit_flags = 2
import asyncio
import platform

if platform.system() == 'Windows':
	import winrt.windows.devices.enumeration as windows_devices
import mediapipe as mp

# **note later versions of python (3.9+) are not compatible with winrt. Later versions should use winsdk instead
# Additionally, some of these libraries may require installation if you have never used them before

# creating the main window

class MainWindow(QtWidgets.QMainWindow):
	def __init__(self, *args, **kwargs):
		super(MainWindow, self).__init__(*args, **kwargs)

		# loading the qtdesigner GUI I made

		uic.loadUi('draftGUI.ui', self)
		# mapping the buttons to a function--probably a better way of doing this but ¯\_(ツ)_/¯ for the mmt
		self.armDirections = ["x", "y", "z", "grip", "x_ang", "y_ang", "z_ang"]

		# starting button monitor qthread

		for button_direction in self.armDirections:
			button = getattr(self, f"{button_direction}_pos")  # Assuming buttons have names like x_pos, y_pos, etc.
			button.pressed.connect(lambda button_name=button_direction: self.Button_Action(button_name, "pressed"))
			button.released.connect(lambda button_name=button_direction: self.Button_Action(button_name, "released"))

			button = getattr(self, f"{button_direction}_neg")
			button.pressed.connect(lambda button_name=button_direction: self.Button_Action(button_name, "pressed"))
			button.released.connect(lambda button_name=button_direction: self.Button_Action(button_name, "released"))

		self.grip_state.clicked.connect(lambda: self.Button_Action("grip_state", "clicked"))

		# Starting a second thread to run the camera video

		self.camera_tracker = camera_tracker()
		self.cameras_object = self.camera_tracker.get_camera_info()

		# adding the options to the QComboBox

		for i in self.cameras_object:
			camera_name = str(i.get('camera_index')) + " " + i.get('camera_name')
			self.comboCamera.addItem(camera_name)

		self.comboCamera.currentIndexChanged.connect(self.on_combo_box_changed)

		self.imageMonitor = imageMonitor()
		self.imageMonitor.start()
		self.imageMonitor.ImageUpdate.connect(self.ImageUpdateSlot)

		self.button_monitor = button_monitor()

	def on_combo_box_changed(self, selection):
        # splitting the selected text into an index of strings to access the first value, the camera index
		selection = self.comboCamera.currentText().split()
		new_camera_index = int(selection[0])
		print(new_camera_index)
		self.imageMonitor.camera_changed(new_camera_index)

	def ImageUpdateSlot(self, Image):
		self.labelFeed.setPixmap(QtGui.QPixmap.fromImage(Image))

    # basic button function
	def Button_Action(self, button_name, action_type):
		print(f"Button {button_name} {action_type}")

		if action_type == "pressed":
			self.start_time = time.time()
			self.button_monitor.start()

		self.button_monitor.button_state(action_type, self.start_time, button_name)

# button monitor to monitor whether a button is being held or just pressed

class button_monitor(QtCore.QThread):

    button_signal = QtCore.pyqtSignal(str)

    def __init__(self):
        super(button_monitor, self).__init__()
        print("button_monitor thread started")
        self.currentState = None
        self.start_time = 0
        self.elapsed_time = 0

    def run(self):

        while self.currentState == "pressed":

            self.elapsed_time = time.time() - self.start_time

            if self.buttonPushed and self.elapsed_time > .5:
                print("button is being held")
                self.buttonPushed = False

            time.sleep(.1)

    def button_state(self, currentState, start_time, button_name):

        self.currentState = currentState

        if self.currentState == "pressed":
            self.start_time = start_time
            self.buttonPushed = True

        elif self.currentState == "released":
            if self.elapsed_time < .5:
                print(f"{button_name} was pressed")
                self.buttonPushed = False
            else:
                print(f"{button_name} held for {self.elapsed_time} seconds")

# Thank you to SH for helping me learn how to embed a OpenCV video

class imageMonitor(QtCore.QThread):

	# essentially retrieving the video from the camera using OpenCV and then putting it in a format PyQt can read

	ImageUpdate = QtCore.pyqtSignal(QtGui.QImage)
	mpMesh = mp.solutions.face_mesh
	Mesh = mpMesh.FaceMesh()
	mpDraw = mp.solutions.drawing_utils

	# mouthpoints were found using https://raw.githubusercontent.com/google/mediapipe/a908d668c730da128dfa8d9f6bd25d519d006692/mediapipe/modules/face_geometry/data/canonical_face_model_uv_visualization.png
	# can also be found using https://github.com/tensorflow/tfjs-models/blob/838611c02f51159afdd77469ce67f0e26b7bbb23/face-landmarks-detection/src/mediapipe-facemesh/keypoints.ts

	mouthPoints = [78, 191, 80, 81, 82, 13, 312, 311, 310, 415, 308, 324, 318, 402, 317, 14, 87, 178, 88, 95]

	def __init__(self):
		super(imageMonitor, self).__init__()
		print("imageMonitor initialized")
		self.camera = cv2.VideoCapture(0)

	def camera_changed(self, camera_index):
		self.camera.release()
		self.camera = cv2.VideoCapture(camera_index)

	def run(self):
		print("imageMonitor is running")
		self.ThreadActive = True

		while self.ThreadActive:
			# getting frame from webcam
			ret, frame = self.camera.read()
			if ret:
				Image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
				Image = self.face_landmarks(Image)

				FlippedImage = cv2.flip(Image, 1)
				ConvertToQtFormat = QtGui.QImage(FlippedImage.data, FlippedImage.shape[1], FlippedImage.shape[0], QtGui.QImage.Format.Format_RGB888)
				Pic = ConvertToQtFormat.scaled(800, 650, QtCore.Qt.AspectRatioMode.KeepAspectRatio)
				self.ImageUpdate.emit(Pic)

	def face_landmarks(self, Image):
		results = self.Mesh.process(Image)

		if results.multi_face_landmarks:
			for face_landmarks in results.multi_face_landmarks:
				#mpDraw.draw_landmarks(img, face_landmarks, mpMesh.FACEMESH_TESSELATION)
				tx = 0
				ty = 0
				for id, lm in enumerate(face_landmarks.landmark):
					if id in self.mouthPoints:
						h, w, c = Image.shape
						px, py = int(lm.x*w), int(lm.y*h)
						if id in [13, 14]:
							tx+=px
							ty+=py
						if id == 14:
							tx=int(tx/2)
							ty=int(ty/2)
							cv2.circle(Image, (tx, ty), 4, (0, 255, 0), cv2.FILLED)

						cv2.circle(Image, (px, py), 4, (0, 255, 0), cv2.FILLED)
		return Image

VIDEO_DEVICES = 4

# Big thanks to https://stackoverflow.com/questions/52558617/enumerate-over-cameras-in-python for helping figuring out how to enumrate over cameras
# camera tracker class to get cameras so user can choose which camera to display

class camera_tracker:

	def __init__(self):
		print("camera tracker initialized")
		self.cameras = []

	def get_camera_info(self) -> list:
		self.cameras = []

		camera_indexes = self.get_camera_indexes()

		if len(camera_indexes) == 0:
			return self.cameras

		self.cameras = self.add_camera_information(camera_indexes)

		return self.cameras

	def get_camera_indexes(self):
		index = 0
		camera_indexes = []
		max_numbers_of_cameras_to_check = 10

		# adding all camera indexes to a list
		while max_numbers_of_cameras_to_check > 0:
			capture = cv2.VideoCapture(index)
			if capture.read()[0]:
				camera_indexes.append(index)
				capture.release()
			index += 1
			max_numbers_of_cameras_to_check -= 1

		return camera_indexes

	def add_camera_information(self, camera_indexes: list) -> list:
		platform_name = platform.system()
		cameras = []

		if platform_name == 'Windows':
			cameras_info_windows = asyncio.run(self.get_camera_information_for_windows())

			for camera_index in camera_indexes:

				if camera_index < len(cameras_info_windows):
					camera_name = cameras_info_windows.get_at(camera_index).name.replace('\n', '')
					cameras.append({'camera_index': camera_index, 'camera_name': camera_name})

			return cameras

	async def get_camera_information_for_windows(self):
		return await windows_devices.DeviceInformation.find_all_async(VIDEO_DEVICES)

def main():
	app=QtWidgets.QApplication(sys.argv)
	main = MainWindow()
	main.show()
	sys.exit(app.exec())

if __name__=='__main__':
	main()