From 43416c4717d2430c3e11f042294d12b781fee2e1 Mon Sep 17 00:00:00 2001 From: natanielruiz <nataniel777@hotmail.com> Date: Wed, 27 Sep 2017 04:09:30 +0800 Subject: [PATCH] Failed lstm experiment --- code/test_on_video.py | 31 +++++++++++++++++++++---------- 1 files changed, 21 insertions(+), 10 deletions(-) diff --git a/code/test_on_video.py b/code/test_on_video.py index ca17ccd..c837775 100644 --- a/code/test_on_video.py +++ b/code/test_on_video.py @@ -48,7 +48,7 @@ # ResNet101 with 3 outputs. # model = hopenet.Hopenet(torchvision.models.resnet.Bottleneck, [3, 4, 23, 3], 66) # ResNet50 - model = hopenet.Hopenet(torchvision.models.resnet.Bottleneck, [3, 4, 6, 3], 66) + model = hopenet.Hopenet(torchvision.models.resnet.Bottleneck, [3, 4, 6, 3], 66, 0) # ResNet18 # model = hopenet.Hopenet(torchvision.models.resnet.BasicBlock, [2, 2, 2, 2], 66) @@ -60,7 +60,8 @@ print 'Loading data.' transformations = transforms.Compose([transforms.Scale(224), - transforms.RandomCrop(224), transforms.ToTensor()]) + transforms.CenterCrop(224), transforms.ToTensor(), + transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])]) model.cuda(gpu) @@ -74,11 +75,21 @@ idx_tensor = torch.FloatTensor(idx_tensor).cuda(gpu) video = cv2.VideoCapture(video_path) - width = int(video.get(cv2.CAP_PROP_FRAME_WIDTH)) # float - height = int(video.get(cv2.CAP_PROP_FRAME_HEIGHT)) # float + + # New cv2 + # width = int(video.get(cv2.CAP_PROP_FRAME_WIDTH)) # float + # height = int(video.get(cv2.CAP_PROP_FRAME_HEIGHT)) # float + # + # # Define the codec and create VideoWriter object + # fourcc = cv2.VideoWriter_fourcc(*'MJPG') + # out = cv2.VideoWriter('output/video/output-%s.avi' % args.output_string, fourcc, 30.0, (width, height)) + + # Old cv2 + width = int(video.get(cv2.cv.CV_CAP_PROP_FRAME_WIDTH)) # float + height = int(video.get(cv2.cv.CV_CAP_PROP_FRAME_HEIGHT)) # float # Define the codec and create VideoWriter object - fourcc = cv2.VideoWriter_fourcc(*'MJPG') + fourcc = 
cv2.cv.CV_FOURCC(*'MJPG') out = cv2.VideoWriter('output/video/output-%s.avi' % args.output_string, fourcc, 30.0, (width, height)) txt_out = open('output/video/output-%s.txt' % args.output_string, 'w') @@ -123,10 +134,10 @@ sys.exit(0) x_min, y_min, x_max, y_max = int(line[1]), int(line[2]), int(line[3]), int(line[4]) - x_min -= 100 - x_max += 100 - y_min -= 200 - y_max += 50 + x_min -= 150 + x_max += 150 + y_min -= 250 + y_max += 100 x_min = max(x_min, 0) y_min = max(y_min, 0) x_max = min(frame.shape[1], x_max) @@ -140,7 +151,7 @@ img_shape = img.size() img = img.view(1, img_shape[0], img_shape[1], img_shape[2]) img = Variable(img).cuda(gpu) - yaw, pitch, roll = model(img) + yaw, pitch, roll, angles = model(img) yaw_predicted = F.softmax(yaw) pitch_predicted = F.softmax(pitch) -- Gitblit v1.8.0