From dd62d6fa4a85f18a29de009a972f5599b19ec946 Mon Sep 17 00:00:00 2001 From: natanielruiz <nataniel777@hotmail.com> Date: 星期四, 14 九月 2017 00:51:53 +0800 Subject: [PATCH] Fixing hopenet --- code/test_on_video.py | 15 +++++++++++++-- 1 files changed, 13 insertions(+), 2 deletions(-) diff --git a/code/test_on_video.py b/code/test_on_video.py index 20dfaac..d384b08 100644 --- a/code/test_on_video.py +++ b/code/test_on_video.py @@ -60,7 +60,8 @@ print 'Loading data.' transformations = transforms.Compose([transforms.Scale(224), - transforms.RandomCrop(224), transforms.ToTensor()]) + transforms.CenterCrop(224), transforms.ToTensor(), + transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])]) model.cuda(gpu) @@ -123,6 +124,14 @@ sys.exit(0) x_min, y_min, x_max, y_max = int(line[1]), int(line[2]), int(line[3]), int(line[4]) + x_min -= 150 + x_max += 150 + y_min -= 250 + y_max += 100 + x_min = max(x_min, 0) + y_min = max(y_min, 0) + x_max = min(frame.shape[1], x_max) + y_max = min(frame.shape[0], y_max) # Crop image img = frame[y_min:y_max,x_min:x_max] img = Image.fromarray(img) @@ -132,7 +141,7 @@ img_shape = img.size() img = img.view(1, img_shape[0], img_shape[1], img_shape[2]) img = Variable(img).cuda(gpu) - yaw, pitch, roll = model(img) + yaw, pitch, roll, angles = model(img) yaw_predicted = F.softmax(yaw) pitch_predicted = F.softmax(pitch) @@ -145,6 +154,8 @@ # Print new frame with cube and TODO: axis txt_out.write(str(frame_num) + ' %f %f %f\n' % (yaw_predicted, pitch_predicted, roll_predicted)) utils.plot_pose_cube(frame, yaw_predicted, pitch_predicted, roll_predicted, (x_min + x_max) / 2, (y_min + y_max) / 2, size = 200) + # Plot expanded bounding box + cv2.rectangle(frame, (x_min, y_min), (x_max, y_max), (0,255,0), 3) out.write(frame) frame_num += 1 -- Gitblit v1.8.0