print("Without input file!!") sys.exit(0) #model for face detect face_model = AntiSpoofPredict(0) #model for landmarks checkpoint_h = torch.load(headpose_model, map_location=device) plfd_backbone = PFLDInference().to(device) plfd_backbone.load_state_dict(checkpoint_h['plfd_backbone']) plfd_backbone.eval() plfd_backbone = plfd_backbone.to(device) headpose_transformer = transforms.Compose([transforms.ToTensor()]) #model for distract checkpoint_d = torch.load(user_set.model_path) model = cnn.ConvNet(num_classes=6).to(device) model.load_state_dict(checkpoint_d) model.eval() distract_transformer = transforms.Compose([ transforms.RandomHorizontalFlip(), transforms.ToTensor(), #0-255 to 0-1, numpy to tensors transforms.Normalize( [0.485, 0.456, 0.406], # 0-1 to [-1,1] , formula (x-mean)/std [0.229, 0.224, 0.255]) ]) font = cv2.FONT_HERSHEY_SIMPLEX cap = cv2.VideoCapture(fileUrl) ret, frame = cap.read() frame = cv2.rotate(frame, cv2.cv2.ROTATE_90_CLOCKWISE)