def main(camera_id, filename, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set, single_person,
         max_batch_size, disable_vidgear, device):
    """Run SimpleHRNet on a video file or camera stream and show (or dump) annotated frames.

    Args:
        camera_id: Camera identifier given to ``cv2.VideoCapture`` or ``CamGear``
            when ``filename`` is None.
        filename: Path of a video file to read; None selects the camera.
        hrnet_c, hrnet_j, hrnet_weights: Forwarded positionally to ``SimpleHRNet``.
        hrnet_joints_set: Key into ``joints_dict()`` selecting the skeleton to draw.
        single_person: When true the model is built with ``multiperson=False``.
        max_batch_size: Forwarded to ``SimpleHRNet``.
        disable_vidgear: Read the camera through ``cv2.VideoCapture`` instead of ``CamGear``.
        device: Torch device spec; None picks ``cuda:0`` when CUDA is available, else ``cpu``.

    Raises:
        AssertionError: If the ``cv2.VideoCapture`` source cannot be opened.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available():
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda:0')
    else:
        device = torch.device('cpu')

    print(device)

    has_display = 'DISPLAY' in os.environ or sys.platform == 'win32'

    # A file is always opened with cv2.VideoCapture, so the OpenCV read/release protocol
    # must be used whenever a filename is given, not only when vidgear is disabled.
    uses_opencv_capture = filename is not None or disable_vidgear

    if uses_opencv_capture:
        video = cv2.VideoCapture(filename if filename is not None else camera_id)
        assert video.isOpened()
    else:
        video = CamGear(camera_id).start()

    model = SimpleHRNet(hrnet_c, hrnet_j, hrnet_weights, multiperson=not single_person,
                        max_batch_size=max_batch_size, device=device)

    skeleton = joints_dict()[hrnet_joints_set]['skeleton']

    while True:
        if uses_opencv_capture:
            ret, frame = video.read()
            if not ret:
                break
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)

        for i, pt in enumerate(pts):
            frame = draw_points_and_skeleton(frame, pt, skeleton, person_index=i,
                                             joints_color_palette='gist_rainbow',
                                             skeleton_color_palette='jet',
                                             joints_palette_samples=10)

        if has_display:
            cv2.imshow('frame.png', frame)
            k = cv2.waitKey(1)
            if k == 27:  # Esc button
                if uses_opencv_capture:
                    video.release()
                else:
                    video.stop()
                break
        else:
            # Headless: overwrite a single image file with the latest annotated frame.
            cv2.imwrite('frame.png', frame)
def main(camera_id, filename, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set, image_resolution,
         disable_tracking, max_nof_people, max_batch_size, disable_vidgear, save_video, video_format,
         video_framerate, device):
    """Run SimpleHigherHRNet on a video source with optional person tracking and video export.

    Args:
        camera_id: Camera identifier used when ``filename`` is None.
        filename: Path of a video file; None selects the camera.
        hrnet_c, hrnet_j, hrnet_weights: Forwarded positionally to ``SimpleHigherHRNet``.
        hrnet_joints_set: Key into ``joints_dict()`` selecting the skeleton to draw.
        image_resolution: Forwarded unchanged as ``resolution``.
        disable_tracking: When false the model also returns boxes and person ids are
            carried across frames through ``find_person_id_associations``.
        max_nof_people, max_batch_size: Forwarded to ``SimpleHigherHRNet``.
        disable_vidgear: Read the camera through ``cv2.VideoCapture`` instead of ``CamGear``.
        save_video: Write annotated frames to ``output.avi``.
        video_format: FourCC characters, unpacked into ``cv2.VideoWriter_fourcc``.
        video_framerate: Frame rate given to ``cv2.VideoWriter``.
        device: Torch device spec; None picks ``cuda`` when available, else ``cpu``.

    Raises:
        AssertionError: If the ``cv2.VideoCapture`` source cannot be opened.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available():
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda')
    else:
        device = torch.device('cpu')

    has_display = 'DISPLAY' in os.environ or sys.platform == 'win32'
    video_writer = None

    # Files are always read through cv2.VideoCapture, whatever disable_vidgear says.
    uses_opencv_capture = filename is not None or disable_vidgear

    if filename is not None:
        rotation_code = check_video_rotation(filename)
        video = cv2.VideoCapture(filename)
        assert video.isOpened()
    else:
        rotation_code = None
        if disable_vidgear:
            video = cv2.VideoCapture(camera_id)
            assert video.isOpened()
        else:
            video = CamGear(camera_id).start()

    model = SimpleHigherHRNet(hrnet_c, hrnet_j, hrnet_weights, resolution=image_resolution,
                              return_bounding_boxes=not disable_tracking,
                              max_nof_people=max_nof_people, max_batch_size=max_batch_size,
                              device=device)

    tracking = not disable_tracking
    if tracking:
        prev_boxes = None
        prev_pts = None
        prev_person_ids = None
        next_person_id = 0

    skeleton = joints_dict()[hrnet_joints_set]['skeleton']

    while True:
        t = time.time()

        if uses_opencv_capture:
            ret, frame = video.read()
            if not ret:
                break
            if rotation_code is not None:
                frame = cv2.rotate(frame, rotation_code)
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)

        if tracking:
            boxes, pts = pts

            if len(pts) > 0:
                if prev_pts is None and prev_person_ids is None:
                    # First tracked frame: hand out fresh consecutive ids.
                    person_ids = np.arange(next_person_id, len(pts) + next_person_id, dtype=np.int32)
                    # NOTE(review): this skips one id (n + 1 instead of n); kept as-is so
                    # id assignment does not change.
                    next_person_id = len(pts) + 1
                else:
                    boxes, pts, person_ids = find_person_id_associations(
                        boxes=boxes, pts=pts, prev_boxes=prev_boxes, prev_pts=prev_pts,
                        prev_person_ids=prev_person_ids, next_person_id=next_person_id,
                        pose_alpha=0.2, similarity_threshold=0.4, smoothing_alpha=0.1,
                    )
                    next_person_id = max(next_person_id, np.max(person_ids) + 1)
            else:
                person_ids = np.array((), dtype=np.int32)

            prev_boxes = boxes.copy()
            prev_pts = pts.copy()
            prev_person_ids = person_ids
        else:
            person_ids = np.arange(len(pts), dtype=np.int32)

        for pt, pid in zip(pts, person_ids):
            frame = draw_points_and_skeleton(frame, pt, skeleton, person_index=pid,
                                             points_color_palette='gist_rainbow',
                                             skeleton_color_palette='jet',
                                             points_palette_samples=10)

        fps = 1. / (time.time() - t)
        print('\rframerate: %f fps / detected people: %d' % (fps, len(pts)), end='')

        if has_display:
            cv2.imshow('frame.png', frame)
            k = cv2.waitKey(1)
            if k == 27:  # Esc button
                if uses_opencv_capture:
                    video.release()
                else:
                    video.stop()
                break
        else:
            cv2.imwrite('frame.png', frame)

        if save_video:
            if video_writer is None:
                # The writer is created lazily because the frame size is only known here.
                fourcc = cv2.VideoWriter_fourcc(*video_format)  # video format
                video_writer = cv2.VideoWriter('output.avi', fourcc, video_framerate,
                                               (frame.shape[1], frame.shape[0]))
            video_writer.write(frame)

    # The writer stays None when no frame reached the save step (empty source, early Esc).
    if video_writer is not None:
        video_writer.release()
def main(camera_id, filename, hrnet_m, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set,
         image_resolution, single_person, use_tiny_yolo, disable_tracking, max_batch_size,
         disable_vidgear, save_video, video_format, video_framerate, device, exercise_type):
    """Count exercise repetitions on a video source and overlay the running count.

    For ``exercise_type`` 1 and 2 the value returned by ``draw_points_and_skeleton`` is
    compared against two thresholds; a repetition is counted on the transition from the
    "below lower threshold" state back to the "above upper threshold" state. For
    ``exercise_type`` 3 a repetition is counted when that value goes from 1 to -1.
    Any other ``exercise_type`` only draws the black banner.

    Args:
        camera_id: Camera identifier used when ``filename`` is None.
        filename: Path of a video file; None selects the camera.
        hrnet_m: Forwarded to ``SimpleHRNet`` as ``model_name``.
        hrnet_c, hrnet_j, hrnet_weights: Forwarded positionally to ``SimpleHRNet``.
        hrnet_joints_set: Key into ``joints_dict()`` selecting the skeleton to draw.
        image_resolution: String literal parsed with ``ast.literal_eval``.
        single_person: When true the model is built with ``multiperson=False``.
        use_tiny_yolo: Select the yolov3-tiny config/weights instead of yolov3.
        disable_tracking: When false, person ids are tracked across frames.
        max_batch_size: Forwarded to ``SimpleHRNet``.
        disable_vidgear: Read the camera through ``cv2.VideoCapture`` instead of ``CamGear``.
        save_video: Write annotated frames to ``arnleft.avi``.
        video_format: FourCC characters, unpacked into ``cv2.VideoWriter_fourcc``.
        video_framerate: Frame rate given to ``cv2.VideoWriter``.
        device: Torch device spec; None picks ``cuda`` when available, else ``cpu``.
        exercise_type: 1, 2 or 3; selects the counting rule and the overlay label.

    Raises:
        AssertionError: If the ``cv2.VideoCapture`` source cannot be opened.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available():
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda')
    else:
        device = torch.device('cpu')

    image_resolution = ast.literal_eval(image_resolution)
    has_display = 'DISPLAY' in os.environ or sys.platform == 'win32'
    video_writer = None

    # Files are always read through cv2.VideoCapture, whatever disable_vidgear says.
    uses_opencv_capture = filename is not None or disable_vidgear
    if uses_opencv_capture:
        video = cv2.VideoCapture(filename if filename is not None else camera_id)
        assert video.isOpened()
    else:
        video = CamGear(camera_id).start()

    yolo_variant = "yolov3-tiny" if use_tiny_yolo else "yolov3"
    yolo_model_def = "./models/detectors/yolo/config/%s.cfg" % yolo_variant
    yolo_class_path = "./models/detectors/yolo/data/coco.names"
    yolo_weights_path = "./models/detectors/yolo/weights/%s.weights" % yolo_variant

    model = SimpleHRNet(hrnet_c, hrnet_j, hrnet_weights, model_name=hrnet_m,
                        resolution=image_resolution, multiperson=not single_person,
                        return_bounding_boxes=not disable_tracking,
                        max_batch_size=max_batch_size, yolo_model_def=yolo_model_def,
                        yolo_class_path=yolo_class_path, yolo_weights_path=yolo_weights_path,
                        device=device)

    tracking = not disable_tracking
    if tracking:
        prev_boxes = None
        prev_pts = None
        prev_person_ids = None
        next_person_id = 0

    # Overlay label plus the (upper, lower) thresholds of the two-state counter.
    if exercise_type == 1:  # push-ups
        label, upper, lower = "PushUps Count=", 150, 90
    elif exercise_type == 2:
        # NOTE(review): this branch was commented "sitUps" but the label says "Squats".
        label, upper, lower = "Squats Count=", 168, 48
    elif exercise_type == 3:  # chin-ups: counted from a 1 -> -1 transition, no thresholds
        label, upper, lower = "ChinUps Count=", None, None
    else:
        label = None

    flag = 0
    prev_flag = flag
    counter = 0
    measure = 0          # last value returned by draw_points_and_skeleton
    prev_measure = measure

    skeleton = joints_dict()[hrnet_joints_set]['skeleton']
    font = cv2.FONT_HERSHEY_SIMPLEX
    white = (255, 255, 255)

    while True:
        t = time.time()

        if uses_opencv_capture:
            ret, frame = video.read()
            if not ret:
                break
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)

        if tracking:
            boxes, pts = pts

            if len(pts) > 0:
                if prev_pts is None and prev_person_ids is None:
                    person_ids = np.arange(next_person_id, len(pts) + next_person_id, dtype=np.int32)
                    next_person_id = len(pts) + 1
                else:
                    boxes, pts, person_ids = find_person_id_associations(
                        boxes=boxes, pts=pts, prev_boxes=prev_boxes, prev_pts=prev_pts,
                        prev_person_ids=prev_person_ids, next_person_id=next_person_id,
                        pose_alpha=0.2, similarity_threshold=0.4, smoothing_alpha=0.1,
                    )
                    next_person_id = max(next_person_id, np.max(person_ids) + 1)
            else:
                person_ids = np.array((), dtype=np.int32)

            prev_boxes = boxes.copy()
            prev_pts = pts.copy()
            prev_person_ids = person_ids
        else:
            person_ids = np.arange(len(pts), dtype=np.int32)

        # Filled black banner behind the text overlays.
        frame = cv2.rectangle(frame, (45, 5), (1300, 250), (0, 0, 0), -1)

        if label is not None:
            # With several people, the value of the last one drawn wins.
            for pt, pid in zip(pts, person_ids):
                frame, measure = draw_points_and_skeleton(
                    frame, pt, skeleton, person_index=pid,
                    points_color_palette='gist_rainbow', skeleton_color_palette='jet',
                    points_palette_samples=10, exercise_type=exercise_type)

            fps = 1. / (time.time() - t)
            print('\rframerate: %f fps' % fps, end='')

            frame = cv2.putText(frame, str(measure), (50, 80), font, 1, white, 2, cv2.LINE_AA)

            if len(pts) > 0:
                if exercise_type == 3:
                    if measure == -1 and prev_measure == 1:
                        counter += 1
                    prev_measure = measure
                else:
                    if measure > upper:
                        flag = 0
                    if measure < lower:
                        flag = 1
                    if prev_flag == 1 and flag == 0:
                        counter += 1
                    prev_flag = flag

            frame = cv2.putText(frame, label + str(counter), (50, 180), font, 4, white, 8,
                                cv2.LINE_AA)

        if has_display:
            cv2.imshow('frame.png', frame)
            k = cv2.waitKey(1)
            if k == 27:  # Esc button
                if uses_opencv_capture:
                    video.release()
                else:
                    video.stop()
                break
        else:
            cv2.imwrite('frame.png', frame)

        if save_video:
            if video_writer is None:
                fourcc = cv2.VideoWriter_fourcc(*video_format)  # video format
                video_writer = cv2.VideoWriter('arnleft.avi', fourcc, video_framerate,
                                               (frame.shape[1], frame.shape[0]))
            video_writer.write(frame)

    # The writer stays None when no frame reached the save step.
    if video_writer is not None:
        video_writer.release()
def main(camera_id, filename, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set, image_resolution,
         single_person, max_batch_size, disable_vidgear, save_video, video_format,
         video_framerate, device):
    """Run SimpleHRNet on a video source, display or dump frames, optionally save a video.

    Args:
        camera_id: Camera identifier used when ``filename`` is None.
        filename: Path of a video file; None selects the camera.
        hrnet_c, hrnet_j, hrnet_weights: Forwarded positionally to ``SimpleHRNet``.
        hrnet_joints_set: Key into ``joints_dict()`` selecting the skeleton to draw.
        image_resolution: String literal parsed with ``ast.literal_eval``.
        single_person: When true the model is built with ``multiperson=False``.
        max_batch_size: Forwarded to ``SimpleHRNet``.
        disable_vidgear: Read the camera through ``cv2.VideoCapture`` instead of ``CamGear``.
        save_video: Write annotated frames to ``output.avi``.
        video_format: FourCC characters, unpacked into ``cv2.VideoWriter_fourcc``.
        video_framerate: Frame rate given to ``cv2.VideoWriter``.
        device: Torch device spec; None picks ``cuda:0`` when available, else ``cpu``.

    Raises:
        AssertionError: If the ``cv2.VideoCapture`` source cannot be opened.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available():
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda:0')
    else:
        device = torch.device('cpu')

    print(device)

    image_resolution = ast.literal_eval(image_resolution)
    has_display = 'DISPLAY' in os.environ or sys.platform == 'win32'
    video_writer = None

    # Files are always read through cv2.VideoCapture, whatever disable_vidgear says.
    uses_opencv_capture = filename is not None or disable_vidgear
    if uses_opencv_capture:
        video = cv2.VideoCapture(filename if filename is not None else camera_id)
        assert video.isOpened()
    else:
        video = CamGear(camera_id).start()

    model = SimpleHRNet(hrnet_c, hrnet_j, hrnet_weights, resolution=image_resolution,
                        multiperson=not single_person, max_batch_size=max_batch_size,
                        device=device)

    skeleton = joints_dict()[hrnet_joints_set]['skeleton']

    while True:
        t = time.time()

        if uses_opencv_capture:
            ret, frame = video.read()
            if not ret:
                break
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)

        for i, pt in enumerate(pts):
            frame = draw_points_and_skeleton(frame, pt, skeleton, person_index=i,
                                             points_color_palette='gist_rainbow',
                                             skeleton_color_palette='jet',
                                             points_palette_samples=10)

        fps = 1. / (time.time() - t)
        print('\rframerate: %f fps' % fps, end='')

        if has_display:
            cv2.imshow('frame.png', frame)
            k = cv2.waitKey(1)
            if k == 27:  # Esc button
                if uses_opencv_capture:
                    video.release()
                else:
                    video.stop()
                break
        else:
            cv2.imwrite('frame.png', frame)

        if save_video:
            if video_writer is None:
                # Created lazily because the frame size is only known here.
                fourcc = cv2.VideoWriter_fourcc(*video_format)  # video format
                video_writer = cv2.VideoWriter('output.avi', fourcc, video_framerate,
                                               (frame.shape[1], frame.shape[0]))
            video_writer.write(frame)

    # The writer stays None when no frame reached the save step.
    if video_writer is not None:
        video_writer.release()
def main(self):
    """Process the configured video source frame by frame and count repetitions.

    Reads settings from ``self.args``, runs ``SimpleHRNet`` on every frame, draws the
    skeletons onto ``self.frame`` and hands each frame with a ``count_<n>`` caption to
    ``self.count``. Output goes under ``<save_root>/test``.
    """
    opts = self.args

    if opts.device is not None:
        device = torch.device(opts.device)
    elif torch.cuda.is_available() and True:
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda:0')
    else:
        device = torch.device('cpu')
    print(device)

    image_resolution = ast.literal_eval(opts.image_resolution)

    has_display = 'DISPLAY' in os.environ.keys() or sys.platform == 'win32'
    # Display is forced off: frames always go through the counting branch below.
    has_display = False

    if opts.filename is not None:
        video = cv2.VideoCapture(opts.filename)
        assert video.isOpened()
    elif opts.disable_vidgear:
        video = cv2.VideoCapture(opts.camera_id)
        assert video.isOpened()
    else:
        video = CamGear(opts.camera_id).start()

    model = SimpleHRNet(
        opts.hrnet_c,
        opts.hrnet_j,
        opts.hrnet_weights,
        resolution=image_resolution,
        multiperson=not opts.single_person,
        max_batch_size=opts.max_batch_size,
        device=device,
    )

    num_of_frame = 0
    num_of_std = 0
    start = False   # True once the start posture has been detected
    flag = False    # True once at least one repetition has been counted

    root = os.path.join(opts.save_root, 'test')
    if not os.path.exists(root):
        os.mkdir(root)

    red = (0, 0, 255)

    while True:
        if opts.filename is not None or opts.disable_vidgear:
            ok, self.frame = video.read()
            if not ok:
                break
        else:
            self.frame = video.read()
            if self.frame is None:
                break

        pts = model.predict(self.frame)

        for idx, person in enumerate(pts):
            self.frame = draw_points_and_skeleton(
                self.frame, person, joints_dict()[opts.hrnet_joints_set]['skeleton'],
                person_index=idx, points_color_palette='gist_rainbow',
                skeleton_color_palette='jet', points_palette_samples=10)

        if not start:
            self.text_ready = 'please ready'
            cv2.putText(self.frame, self.text_ready, (50, 50), cv2.FONT_HERSHEY_PLAIN, 2.0, red, 2)
            angel = self.cal_angle(pts, 'start')
            start = bool(angel <= 5)

        # Deliberately a second `if`: both prompts are drawn on the frame where start flips.
        if start:
            self.text_elbow_touch_knee = 'please elbow touch knee'
            cv2.putText(self.frame, self.text_elbow_touch_knee, (50, 50),
                        cv2.FONT_HERSHEY_PLAIN, 2.0, red, 2)

        if has_display:
            cv2.imshow('frame.png', self.frame)
            key = cv2.waitKey(1)
            if key == 27:  # Esc button
                if opts.disable_vidgear:
                    video.release()
                else:
                    video.stop()
                break
        else:
            angle = self.cal_angle(pts, 'stardard')
            caption = "count_{}".format(num_of_std)
            within_limit = angle <= 50

            if within_limit and start:
                # The frame is captioned with the count before it is incremented.
                self.count(self.frame, caption, num_of_frame, root, video)
                start = False
                num_of_std += 1
                flag = True
            else:
                if within_limit and not start and not flag:
                    self.text_error = 'fault wrong hands action'
                    cv2.putText(self.frame, self.text_error, (330, 50),
                                cv2.FONT_HERSHEY_PLAIN, 2.0, red, 2)
                self.text = caption
                self.count(self.frame, self.text, num_of_frame, root, video)

        num_of_frame += 1
def main(self, args):
    """Process a video source frame by frame, counting repetitions from pose angles.

    Runs ``SimpleHRNet`` on every frame, draws the skeletons onto ``self.frame``,
    updates ``self.state_box_text`` / ``self.error_box_text`` and passes each frame with
    a ``count_<n>`` caption to ``self.count``. Output goes under
    ``<args.save_root>/sit_ups_v4_test`` (presumably a sit-up counter; confirm against
    ``cal_angle``).

    Args:
        args: Namespace providing ``device``, ``image_resolution``, ``filename``,
            ``disable_vidgear``, ``camera_id``, ``hrnet_c``, ``hrnet_j``,
            ``hrnet_weights``, ``single_person``, ``max_batch_size``, ``save_root`` and
            ``hrnet_joints_set``.
    """
    if args.device is not None:
        device = torch.device(args.device)
    else:
        if torch.cuda.is_available() and True:
            torch.backends.cudnn.deterministic = True
            device = torch.device('cuda:0')
        else:
            device = torch.device('cpu')
    print(device)
    # image_resolution arrives as a string literal and is parsed here.
    image_resolution = ast.literal_eval(args.image_resolution)
    has_display = 'DISPLAY' in os.environ.keys() or sys.platform == 'win32'
    # Display is forced off, so the counting branch below runs for every frame.
    has_display = False
    if args.filename is not None:
        video = cv2.VideoCapture(args.filename)
        assert video.isOpened()
    else:
        if args.disable_vidgear:
            video = cv2.VideoCapture(args.camera_id)
            assert video.isOpened()
        else:
            video = CamGear(args.camera_id).start()
    model = SimpleHRNet(
        args.hrnet_c,
        args.hrnet_j,
        args.hrnet_weights,
        resolution=image_resolution,
        multiperson=not args.single_person,
        #multiperson= False,
        max_batch_size=args.max_batch_size,
        device=device)
    num_of_frame = 0
    self.num_of_std = 0          # number of repetitions counted so far
    self.error_box_text = ' '
    start = False                # True once the start posture has been accepted
    flag = False                 # True once at least one repetition has been counted
    root = os.path.join(args.save_root, 'sit_ups_v4_test')
    if not os.path.exists(root):
        os.mkdir(root)
    while True:
        # cv2.VideoCapture.read() returns (ret, frame); CamGear.read() returns the frame only.
        if args.filename is not None or args.disable_vidgear:
            ret, self.frame = video.read()
            if not ret:
                break
        else:
            self.frame = video.read()
            if self.frame is None:
                break
        pts = model.predict(self.frame)
        for i, pt in enumerate(pts):
            self.frame = draw_points_and_skeleton(
                self.frame,
                pt,
                joints_dict()[args.hrnet_joints_set]['skeleton'],
                person_index=i,
                points_color_palette='gist_rainbow',
                skeleton_color_palette='jet',
                points_palette_samples=10)
        print('pts', pts)
        if not start:
            # Waiting for the start posture: all three angles must be within their limits.
            self.text_ready = '请双肩着地,双手抱头'
            angle_stg, angle_sew, angle_hma_start = self.cal_angle(
                pts, 'start')
            if angle_stg <= 5 and angle_sew <= 90 and angle_hma_start <= 10:
                start = True
            else:
                start = False
            self.state_box_text = self.text_ready
        elif start:
            self.text_elbow_touch_knee = '请双手抱头坐起肘部触膝'
            self.state_box_text = self.text_elbow_touch_knee
        if has_display:
            cv2.imshow('frame.png', self.frame)
            k = cv2.waitKey(1)
            if k == 27:  # Esc button
                if args.disable_vidgear:
                    video.release()
                else:
                    video.stop()
                break
        else:
            ratio_between_distance, angle_hks, angle_hma_standard, x_diff_elbow_knee, avg_conf = self.cal_angle(
                pts, 'stardard')
            print('avg_conf', avg_conf)
            # Low-confidence frame: reset the start state, emit the frame unchanged, move on.
            if avg_conf < 0.2:
                start = False
                self.text = "count_{}".format(self.num_of_std)
                self.count(self.frame, self.text, num_of_frame, root, video)
                num_of_frame += 1
                continue
            # angle_hma_start is the value captured the last time the start check ran.
            raise_feet = False if np.absolute(
                angle_hma_start - angle_hma_standard) <= 5 else True
            if angle_hks <= 70 and start and (
                    ratio_between_distance or x_diff_elbow_knee < 0) and not raise_feet:
                # Valid repetition: the frame is captioned with the count before the increment.
                self.text = "count_{}".format(self.num_of_std)
                self.count(self.frame, self.text, num_of_frame, root, video)
                self.num_of_std += 1
                start = False
                flag = True
            elif angle_hks <= 70 and (
                    ratio_between_distance or x_diff_elbow_knee < 0
            ) and not raise_feet and not start and not flag:
                # Same posture reached without an accepted start and before any counted rep.
                self.text_error = '犯规,手部动作不规范'
                self.error_box_text = self.text_error
                self.text = "count_{}".format(self.num_of_std)
                self.count(self.frame, self.text, num_of_frame, root, video)
            else:
                self.text = "count_{}".format(self.num_of_std)
                self.count(self.frame, self.text, num_of_frame, root, video)
            #yield (self.state_box_text, self.error_box_text, self.frame, self.num_of_std)
            #print('time', time.time() - start_time)
            # The error text only lives for the frame it was raised on.
            self.error_box_text = ' '
        num_of_frame += 1
def main(camera_id, filename, hrnet_m, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set,
         image_resolution, single_person, use_tiny_yolo, disable_tracking, max_batch_size,
         disable_vidgear, save_video, video_format, video_framerate, device):
    """Run pose estimation plus fall detection on an image folder, a video file or a camera.

    Every detected person is drawn on the frame and passed to
    ``FallDown.check_fall_down``; frames are then shown (or written to ``frame.png``)
    and optionally appended to ``output.avi``.

    NOTE(review): ``foldername`` is not a parameter of this function; it is read as a
    free (module-level) name. Confirm it is defined by the surrounding script.

    Args:
        camera_id: Camera identifier used when neither a folder nor ``filename`` is set.
        filename: Path of a video file; None selects the camera.
        hrnet_m: Forwarded to ``SimpleHRNet`` as ``model_name``.
        hrnet_c, hrnet_j, hrnet_weights: Forwarded positionally to ``SimpleHRNet``.
        hrnet_joints_set: Key into ``joints_dict()`` selecting the skeleton.
        image_resolution: String literal parsed with ``ast.literal_eval``.
        single_person: When true the model is built with ``multiperson=False``.
        use_tiny_yolo: Select the yolov3-tiny config/weights instead of yolov3.
        disable_tracking: When false, person ids are tracked across frames.
        max_batch_size: Forwarded to ``SimpleHRNet``.
        disable_vidgear: Read the camera through ``cv2.VideoCapture`` instead of ``CamGear``.
        save_video: Write annotated frames to ``output.avi``.
        video_format: FourCC characters, unpacked into ``cv2.VideoWriter_fourcc``.
        video_framerate: Given to ``cv2.VideoWriter`` and to ``check_fall_down``.
        device: Torch device spec; None picks ``cuda:0`` when available, else ``cpu``.

    Raises:
        AssertionError: If the ``cv2.VideoCapture`` source cannot be opened.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available():
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda:0')
    else:
        device = torch.device('cpu')

    image_resolution = ast.literal_eval(image_resolution)
    has_display = 'DISPLAY' in os.environ or sys.platform == 'win32'
    video_writer = None
    falldown = FallDown()

    from_folder = foldername is not None
    # Files are always read through cv2.VideoCapture, whatever disable_vidgear says.
    uses_opencv_capture = filename is not None or disable_vidgear

    if from_folder:
        images_path = sorted(os.path.join(foldername, name) for name in os.listdir(foldername))
    elif filename is not None:
        rotation_code = check_video_rotation(filename)
        video = cv2.VideoCapture(filename)
        assert video.isOpened()
    else:
        rotation_code = None
        if disable_vidgear:
            video = cv2.VideoCapture(camera_id)
            assert video.isOpened()
        else:
            video = CamGear(camera_id).start()

    yolo_variant = "yolov3-tiny" if use_tiny_yolo else "yolov3"
    yolo_model_def = "./models/detectors/yolo/config/%s.cfg" % yolo_variant
    yolo_class_path = "./models/detectors/yolo/data/coco.names"
    yolo_weights_path = "./models/detectors/yolo/weights/%s.weights" % yolo_variant

    model = SimpleHRNet(hrnet_c, hrnet_j, hrnet_weights, model_name=hrnet_m,
                        resolution=image_resolution, multiperson=not single_person,
                        return_bounding_boxes=not disable_tracking,
                        max_batch_size=max_batch_size, yolo_model_def=yolo_model_def,
                        yolo_class_path=yolo_class_path, yolo_weights_path=yolo_weights_path,
                        device=device)

    tracking = not disable_tracking
    if tracking:
        prev_boxes = None
        prev_pts = None
        prev_person_ids = None
        next_person_id = 0

    skeleton = joints_dict()[hrnet_joints_set]['skeleton']
    step = 0  # index of the next image to read in folder mode

    while True:
        t = time.time()

        if from_folder:
            if step >= len(images_path):
                break
            path = images_path[step]
            # Advance before any `continue`; otherwise the loop never leaves this image.
            step += 1
            frame = cv2.imread(path, cv2.IMREAD_COLOR)
            if frame is None:
                logging.error("read image error: {}. skip it.".format(path))
                continue
        elif uses_opencv_capture:
            ret, frame = video.read()
            if not ret:
                break
            if rotation_code is not None:
                frame = cv2.rotate(frame, rotation_code)
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)

        if tracking:
            boxes, pts = pts

            if len(pts) > 0:
                if prev_pts is None and prev_person_ids is None:
                    person_ids = np.arange(next_person_id, len(pts) + next_person_id, dtype=np.int32)
                    next_person_id = len(pts) + 1
                else:
                    boxes, pts, person_ids = find_person_id_associations(
                        boxes=boxes, pts=pts, prev_boxes=prev_boxes, prev_pts=prev_pts,
                        prev_person_ids=prev_person_ids, next_person_id=next_person_id,
                        pose_alpha=0.2, similarity_threshold=0.4, smoothing_alpha=0.1,
                    )
                    next_person_id = max(next_person_id, np.max(person_ids) + 1)
            else:
                person_ids = np.array((), dtype=np.int32)

            prev_boxes = boxes.copy()
            prev_pts = pts.copy()
            prev_person_ids = person_ids
        else:
            person_ids = np.arange(len(pts), dtype=np.int32)

        for pt, pid in zip(pts, person_ids):
            frame = draw_points_and_skeleton(frame, pt, skeleton, person_index=pid,
                                             points_color_palette='gist_rainbow',
                                             skeleton_color_palette='jet',
                                             points_palette_samples=10)
            frame = falldown.check_fall_down(frame, pt, skeleton, video_framerate)

        fps = 1. / (time.time() - t)
        print('\rframerate: %f fps' % fps, end='')

        if has_display:
            cv2.imshow('frame.png', frame)
            k = cv2.waitKey(1)
            if k == 27:  # Esc button
                # Folder mode has no capture object to shut down.
                if not from_folder:
                    if uses_opencv_capture:
                        video.release()
                    else:
                        video.stop()
                break
        else:
            cv2.imwrite('frame.png', frame)

        if save_video:
            if video_writer is None:
                fourcc = cv2.VideoWriter_fourcc(*video_format)  # video format
                video_writer = cv2.VideoWriter('output.avi', fourcc, video_framerate,
                                               (frame.shape[1], frame.shape[0]))
            video_writer.write(frame)

    # The writer stays None when no frame reached the save step.
    if video_writer is not None:
        video_writer.release()
def open_app(camera_id=0, filename=None, hrnet_c=48, hrnet_j=17,
             hrnet_weights="./weights/pose_hrnet_w48_384x288.pth", hrnet_joints_set="coco",
             image_resolution='(384, 288)', single_person=True, max_batch_size=16,
             disable_vidgear=False, device=None):
    """Classify the pose of the first detected person and show a matching sample image.

    Each frame is run through ``SimpleHRNet``; the first person's keypoints are
    normalised by the frame dimensions and fed to the pickled classifier loaded from
    ``mlp_model_best.sav``. The predicted label is drawn on the corresponding sample
    image (window "Suggestion") and the annotated camera frame is shown or written to
    ``frame.png``. Frames without any detection are skipped.

    Args:
        camera_id: Camera identifier used when ``filename`` is None.
        filename: Path of a video file; None selects the camera.
        hrnet_c, hrnet_j, hrnet_weights: Forwarded positionally to ``SimpleHRNet``.
        hrnet_joints_set: Key into ``joints_dict()`` selecting the skeleton to draw.
        image_resolution: String literal parsed with ``ast.literal_eval``.
        single_person: When true the model is built with ``multiperson=False``.
        max_batch_size: Forwarded to ``SimpleHRNet``.
        disable_vidgear: Read the camera through ``cv2.VideoCapture`` instead of ``CamGear``.
        device: Torch device spec; None picks ``cuda:0`` when available, else ``cpu``.

    Raises:
        AssertionError: If the ``cv2.VideoCapture`` source cannot be opened.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available():
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda:0')
    else:
        device = torch.device('cpu')

    image_resolution = ast.literal_eval(image_resolution)
    has_display = 'DISPLAY' in os.environ or sys.platform == 'win32'

    # Files are always read through cv2.VideoCapture, whatever disable_vidgear says.
    uses_opencv_capture = filename is not None or disable_vidgear
    if uses_opencv_capture:
        video = cv2.VideoCapture(filename if filename is not None else camera_id)
        assert video.isOpened()
    else:
        video = CamGear(camera_id).start()

    model = SimpleHRNet(hrnet_c, hrnet_j, hrnet_weights, resolution=image_resolution,
                        multiperson=not single_person, max_batch_size=max_batch_size,
                        device=device)

    # SECURITY: pickle executes arbitrary code on load; only ship a trusted model file.
    with open("mlp_model_best.sav", 'rb') as model_file:
        loaded_model = pickle.load(model_file)

    no_to_label = {
        0: "tree",
        1: "warrior1",
        2: "warrior2",
        3: "childs",
        4: "downwarddog",
        5: "plank",
        6: "mountain",
        7: "trianglepose",
    }

    # One list of reference images per class; os.path.join keeps the lookup portable
    # (the previous hard-coded backslash only matched on Windows).
    image_to_blob = {
        label_id: [cv2.imread(sample) for sample in glob.glob(os.path.join('sampleposes', name + '.jpg'))]
        for label_id, name in no_to_label.items()
    }

    skeleton = joints_dict()[hrnet_joints_set]['skeleton']

    while True:
        if uses_opencv_capture:
            ret, frame = video.read()
            if not ret:
                break
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)
        if len(pts) == 0:
            continue

        # Normalise the first two keypoint components by frame.shape[0] and frame.shape[1].
        dim0, dim1 = frame.shape[0], frame.shape[1]
        vector = []
        for keypoint in pts[0]:
            vector.extend((keypoint[0] / dim0, keypoint[1] / dim1))

        predicted_pose = loaded_model.predict([vector])
        pose_id = predicted_pose[0]
        text = no_to_label[pose_id] + " pose"
        suggestion = image_to_blob[pose_id][0]
        # bottomLeftCornerOfText, font, fontScale, fontColor and lineType are module-level names.
        cv2.putText(suggestion, text, bottomLeftCornerOfText, font, fontScale, fontColor, lineType)
        cv2.imshow("Suggestion", suggestion)
        k = cv2.waitKey(1)

        for i, pt in enumerate(pts):
            frame = draw_points_and_skeleton(frame, pt, skeleton, person_index=i,
                                             points_color_palette='gist_rainbow',
                                             skeleton_color_palette='jet',
                                             points_palette_samples=10)

        if has_display:
            cv2.imshow('frame.png', frame)
            k = cv2.waitKey(1)
            if k == 27:  # Esc button
                if uses_opencv_capture:
                    video.release()
                else:
                    video.stop()
                break
        else:
            cv2.imwrite('frame.png', frame)
def main(camera_id, filename, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set, image_resolution,
         single_person, max_batch_size, disable_vidgear, device, save_root, save_dir):
    """Count repetitions from the ear / wrist / shoulder heights of the first detected person.

    Every frame with at least one detection is annotated and passed to ``count`` together
    with a ``count:<n>`` caption; output goes under ``<save_root>/test_v1``. ``save_dir``
    is accepted but not used.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available() and True:
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda:0')
    else:
        device = torch.device('cpu')
    print(device)

    image_resolution = ast.literal_eval(image_resolution)

    has_display = 'DISPLAY' in os.environ.keys() or sys.platform == 'win32'
    # Display is forced off: frames always go through the counting branch below.
    has_display = False

    if filename is not None:
        video = cv2.VideoCapture(filename)
        assert video.isOpened()
    elif disable_vidgear:
        video = cv2.VideoCapture(camera_id)
        assert video.isOpened()
    else:
        video = CamGear(camera_id).start()

    model = SimpleHRNet(
        hrnet_c,
        hrnet_j,
        hrnet_weights,
        resolution=image_resolution,
        multiperson=not single_person,
        max_batch_size=max_batch_size,
        device=device,
    )

    num_of_std = 0
    num_of_frame = 0
    start = False  # True once cal_angle reported the start posture

    root = os.path.join(save_root, 'test_v1')
    if not os.path.exists(root):
        os.mkdir(root)

    while True:
        if filename is not None or disable_vidgear:
            ok, frame = video.read()
            if not ok:
                break
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)
        # Frames without detections are dropped and do not advance the frame counter.
        if len(pts) == 0:
            continue

        for idx, person in enumerate(pts):
            frame = draw_points_and_skeleton(
                frame, person, joints_dict()[hrnet_joints_set]['skeleton'], person_index=idx,
                points_color_palette='gist_rainbow', skeleton_color_palette='jet',
                points_palette_samples=10)

        print('num of frame', num_of_frame)

        if not start:
            print('pts', pts)
            angel = cal_angle(pts)
            start = bool(angel >= 150)

        if has_display:
            cv2.imshow('frame.png', frame)
            key = cv2.waitKey(1)
            if key == 27:  # Esc button
                if disable_vidgear:
                    video.release()
                else:
                    video.stop()
                break
        else:
            first = pts[0]  # pts -> (y,x ,conf)
            avg_ear_height = (first[3][0] + first[4][0]) / 2
            avg_wrist_height = (first[9][0] + first[10][0]) / 2
            avg_shoulder_height = (first[5][0] + first[6][0]) / 2

            # The caption always carries the count as it was before this frame.
            caption = "count:{}".format(num_of_std)

            if avg_ear_height < avg_wrist_height:
                ear_wrist_diff = avg_wrist_height - avg_ear_height
                wrist_shoulder_diff = avg_shoulder_height - avg_wrist_height
                ratio = ear_wrist_diff / wrist_shoulder_diff
                if 0.5 <= ratio <= 2 and start:
                    num_of_std += 1
                    start = False

            count(frame, caption, num_of_frame, root, video)

        num_of_frame += 1
def main(camera_id, filename, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set, image_resolution,
         single_person, max_batch_size, disable_vidgear, device, save_root):
    """Count repetitions from the angles reported by ``cal_angle`` and export every frame.

    Each frame is annotated with the detected skeletons and passed to ``count`` with a
    ``count_<n>`` caption; output goes under ``<save_root>/sit_ups_v2_add_angle_hks``.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available() and True:
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda:0')
    else:
        device = torch.device('cpu')
    print(device)
    print('max_batch_size', max_batch_size)

    image_resolution = ast.literal_eval(image_resolution)

    has_display = 'DISPLAY' in os.environ.keys() or sys.platform == 'win32'
    # Display is forced off: frames always go through the counting branch below.
    has_display = False

    if filename is not None:
        video = cv2.VideoCapture(filename)
        assert video.isOpened()
    elif disable_vidgear:
        video = cv2.VideoCapture(camera_id)
        assert video.isOpened()
    else:
        print('debug')
        video = CamGear(camera_id).start()

    model = SimpleHRNet(
        hrnet_c,
        hrnet_j,
        hrnet_weights,
        resolution=image_resolution,
        multiperson=not single_person,
        max_batch_size=max_batch_size,
        device=device,
    )

    num_of_frame = 0
    num_of_std = 0
    start = False   # True once the start posture has been accepted
    flag = False    # True once at least one repetition has been counted

    root = os.path.join(save_root, 'sit_ups_v2_add_angle_hks')
    if not os.path.exists(root):
        os.mkdir(root)

    while True:
        if filename is not None or disable_vidgear:
            ok, frame = video.read()
            if not ok:
                break
        else:
            frame = video.read()
            if frame is None:
                break

        pts = model.predict(frame)

        for idx, person in enumerate(pts):
            frame = draw_points_and_skeleton(
                frame, person, joints_dict()[hrnet_joints_set]['skeleton'], person_index=idx,
                points_color_palette='gist_rainbow', skeleton_color_palette='jet',
                points_palette_samples=10)

        if not start:
            angle_stg, angle_sew, angle_ewe = cal_angle(pts, 'start')
            print('angle_ewe ', angle_ewe)
            start = bool(angle_stg <= 5 and angle_sew <= 90 and angle_ewe >= 120)

        if has_display:
            cv2.imshow('frame.png', frame)
            key = cv2.waitKey(1)
            if key == 27:  # Esc button
                if disable_vidgear:
                    video.release()
                else:
                    video.stop()
                break
        else:
            angle_mke, angle_hks = cal_angle(pts, 'stardard')
            print('angle_mke', angle_mke)
            print('angle_hks', angle_hks)

            if start and angle_mke <= 90 and angle_hks <= 50:
                # Counted repetition: the caption below already shows the new total.
                num_of_std += 1
                start = False
                flag = True
            elif angle_hks <= 60 and not start and not flag:
                print('True')
                cv2.putText(frame, 'fault wrong hands action', (330, 50),
                            cv2.FONT_HERSHEY_PLAIN, 2.0, (0, 0, 255), 2)

            count(frame, "count_{}".format(num_of_std), num_of_frame, root, video)

        print('num_of_frame', num_of_frame)
        num_of_frame += 1
def _joint_angle_deg(first, vertex, last):
    """Return the angle in degrees at ``vertex`` between ``first`` and ``last``."""
    ba = first - vertex
    bc = last - vertex
    cosine = np.dot(ba, bc) / (np.linalg.norm(ba) * np.linalg.norm(bc))
    # Rounding can push the ratio marginally outside [-1, 1], where arccos
    # returns NaN; NaN produced by a zero-length segment passes through clip.
    return np.degrees(np.arccos(np.clip(cosine, -1.0, 1.0)))


def main(camera_id, filename, hrnet_m, hrnet_c, hrnet_j, hrnet_weights, hrnet_joints_set, image_resolution,
         single_person, use_tiny_yolo, disable_tracking, max_batch_size, disable_vidgear, save_video,
         video_format, video_framerate, device):
    """Run HRNet pose estimation on a video stream and count steps from knee angles.

    For every frame the knee angles (hip-knee-ankle) of the first detected
    person are computed. A frame counts as "ground contact" when one knee angle
    is >= 130 degrees while the other is < 110 degrees; the step counter is
    incremented on the first non-contact frame that follows a contact frame.
    Skeletons are drawn on the frame, and when no display is available the
    angles and contact state are written onto it and it is saved as
    ``frame.png``. With ``save_video`` the frames are also appended to
    ``output.avi``.

    Args:
        camera_id: Camera identifier, used only when ``filename`` is None.
        filename: Path of a video file, or None to read from the camera.
        hrnet_m: Forwarded to ``SimpleHRNet`` as ``model_name``.
        hrnet_c: Forwarded to ``SimpleHRNet`` as its first positional argument.
        hrnet_j: Forwarded to ``SimpleHRNet`` as its second positional argument.
        hrnet_weights: Forwarded to ``SimpleHRNet`` as its third positional
            argument.
        hrnet_joints_set: Key into ``joints_dict()`` selecting the skeleton
            that is drawn.
        image_resolution: String holding a Python literal; it is parsed with
            ``ast.literal_eval`` and passed as the model ``resolution``.
        single_person: When true, the model is built with ``multiperson=False``.
        use_tiny_yolo: Selects the ``yolov3-tiny`` config/weights instead of
            ``yolov3``.
        disable_tracking: When true, the model returns only keypoints and
            person ids are simply the detection indices.
        max_batch_size: Forwarded to ``SimpleHRNet``.
        disable_vidgear: When true (or when ``filename`` is given) frames are
            read with ``cv2.VideoCapture``; otherwise ``CamGear`` is used.
        save_video: When true, frames are written to ``output.avi``.
        video_format: FourCC characters passed to ``cv2.VideoWriter_fourcc``.
        video_framerate: Frame rate of the written video.
        device: Torch device spec, or None to pick ``cuda`` when available and
            ``cpu`` otherwise.

    Raises:
        AssertionError: If the ``cv2.VideoCapture`` source cannot be opened.
    """
    if device is not None:
        device = torch.device(device)
    elif torch.cuda.is_available():
        torch.backends.cudnn.deterministic = True
        device = torch.device('cuda')
    else:
        device = torch.device('cpu')

    image_resolution = ast.literal_eval(image_resolution)
    has_display = 'DISPLAY' in os.environ or sys.platform == 'win32'
    video_writer = None

    # cv2.VideoCapture is used for files and when vidgear is disabled; only the
    # remaining case yields a CamGear stream. Reading and teardown must agree
    # on this, because the two objects expose different APIs.
    uses_cv2_capture = filename is not None or disable_vidgear

    if filename is not None:
        rotation_code = check_video_rotation(filename)
        video = cv2.VideoCapture(filename)
        assert video.isOpened()
    else:
        rotation_code = None
        if disable_vidgear:
            video = cv2.VideoCapture(camera_id)
            assert video.isOpened()
        else:
            video = CamGear(camera_id).start()

    yolo_variant = 'yolov3-tiny' if use_tiny_yolo else 'yolov3'
    yolo_model_def = "./models/detectors/yolo/config/%s.cfg" % yolo_variant
    yolo_class_path = "./models/detectors/yolo/data/coco.names"
    yolo_weights_path = "./models/detectors/yolo/weights/%s.weights" % yolo_variant

    # Text overlay layout: label position and value position for each row.
    position1, position1_1 = (10, 50), (200, 50)
    position2, position2_1 = (10, 100), (200, 100)
    position3, position3_1 = (10, 150), (300, 150)
    fontScale = 1
    color = (0, 0, 255)  # red in OpenCV's BGR channel order
    thickness = 2

    try:
        model = SimpleHRNet(
            hrnet_c,
            hrnet_j,
            hrnet_weights,
            model_name=hrnet_m,
            resolution=image_resolution,
            multiperson=not single_person,
            return_bounding_boxes=not disable_tracking,
            max_batch_size=max_batch_size,
            yolo_model_def=yolo_model_def,
            yolo_class_path=yolo_class_path,
            yolo_weights_path=yolo_weights_path,
            device=device
        )

        # Tracking state carried from one frame to the next.
        prev_boxes = None
        prev_pts = None
        prev_person_ids = None
        next_person_id = 0

        steps_cnt = 1
        flag = 0  # 0 while the last classified frame was a ground contact

        while True:
            t = time.time()

            if uses_cv2_capture:
                ret, frame = video.read()
                nof_frames = video.get(cv2.CAP_PROP_POS_FRAMES)
                print(nof_frames)
                if not ret:
                    print('\rstep_count: %d' % steps_cnt, end='\n')
                    break
                if rotation_code is not None:
                    frame = cv2.rotate(frame, rotation_code)
            else:
                frame = video.read()
                if frame is None:
                    break

            pts = model.predict(frame)

            # With tracking enabled the model returns (boxes, keypoints). Unpack
            # before touching the keypoints so that the gait analysis indexes
            # the same structure in both modes.
            if not disable_tracking:
                boxes, pts = pts

            if len(pts) > 0:
                # Only the first detected person is analysed.
                # NOTE(review): the full keypoint row is used as the vector; if a
                # row carries more than the image coordinates (e.g. a confidence
                # value), that component also enters the angle - confirm intent.
                person = pts[0]
                left_hip = np.array(person[11])
                left_knee = np.array(person[13])
                left_ankle = np.array(person[15])
                right_hip = np.array(person[12])
                right_knee = np.array(person[14])
                right_ankle = np.array(person[16])

                left_angle = _joint_angle_deg(left_hip, left_knee, left_ankle)
                right_angle = _joint_angle_deg(right_hip, right_knee, right_ankle)

                if (left_angle >= 130 and right_angle < 110) or (right_angle >= 130 and left_angle < 110):
                    gc = 'Yes'
                    flag = 0
                else:
                    gc = 'No'
                    # NOTE(review): reconstructed as nested under the 'No' branch,
                    # i.e. one step per contact -> no-contact transition; verify
                    # against the original indentation.
                    if flag == 0:
                        steps_cnt = steps_cnt + 1
                        flag = 1
            else:
                # Nobody detected: nothing to measure, leave the step state as is.
                left_angle = right_angle = float('nan')
                gc = 'No'

            if not disable_tracking:
                if len(pts) > 0:
                    if prev_pts is None and prev_person_ids is None:
                        person_ids = np.arange(next_person_id, len(pts) + next_person_id, dtype=np.int32)
                        next_person_id = len(pts) + 1
                    else:
                        boxes, pts, person_ids = find_person_id_associations(
                            boxes=boxes, pts=pts, prev_boxes=prev_boxes, prev_pts=prev_pts,
                            prev_person_ids=prev_person_ids, next_person_id=next_person_id,
                            pose_alpha=0.2, similarity_threshold=0.4, smoothing_alpha=0.1,
                        )
                        next_person_id = max(next_person_id, np.max(person_ids) + 1)
                else:
                    person_ids = np.array((), dtype=np.int32)

                prev_boxes = boxes.copy()
                prev_pts = pts.copy()
                prev_person_ids = person_ids
            else:
                person_ids = np.arange(len(pts), dtype=np.int32)

            for pt, pid in zip(pts, person_ids):
                frame = draw_points_and_skeleton(
                    frame, pt, joints_dict()[hrnet_joints_set]['skeleton'],
                    person_index=pid,
                    points_color_palette='gist_rainbow',
                    skeleton_color_palette='jet',
                    points_palette_samples=10
                )

            fps = 1. / (time.time() - t)
            print('\rframerate: %f fps' % fps, end='\n')

            if has_display:
                cv2.imshow('frame.png', frame)
                if cv2.waitKey(1) == 27:  # Esc button
                    break
            else:
                overlay = (
                    ('left_angle:', position1),
                    (str(left_angle), position1_1),
                    ('right_angle:', position2),
                    (str(right_angle), position2_1),
                    ('Ground_Contact:', position3),
                    (str(gc), position3_1),
                )
                for text, origin in overlay:
                    frame = cv2.putText(frame, text, origin, cv2.FONT_HERSHEY_SIMPLEX,
                                        fontScale, color, thickness, cv2.LINE_AA)
                cv2.imwrite('frame.png', frame)

            if save_video:
                if video_writer is None:
                    # Created lazily because the frame size is only known here.
                    fourcc = cv2.VideoWriter_fourcc(*video_format)  # video format
                    video_writer = cv2.VideoWriter(
                        'output.avi', fourcc, video_framerate, (frame.shape[1], frame.shape[0]))
                video_writer.write(frame)
    finally:
        # Single teardown point, so the source and the writer are released on
        # every exit path (end of stream, Esc, or an exception).
        if uses_cv2_capture:
            video.release()
        else:
            video.stop()
        # The writer only exists if at least one frame was written.
        if video_writer is not None:
            video_writer.release()