Facial Keypoint Detector

Made by SeanvonB | Source

This is a project from my Computer Vision Nanodegree, which I completed in 2020. It's an exploration of using Convolutional Neural Networks (CNNs) with Haar Cascades to plot facial keypoints (also called "landmarks") on images containing one or more faces. This work provides the foundation for any number of other hypothetical projects, like facial filters, facial tracking, facial pose recognition, emotion recognition, occupancy summation, and so on.

Per Udacity's instruction, the project was broken down into four steps:

  1. Load and visualize data to become familiar with the dataset
  2. Define network architecture and train model
  3. Deploy the model as a facial keypoint detector
  4. Do important data science, i.e. put sunglasses and moustaches on faces

1.0 Examine Data

Image data for this project consists of 5,770 full-color stills taken from the YouTube Faces Database, each paired with its associated known keypoints. A random selection of 3,462 images forms the training set, i.e. the ones used to train new models, and the remaining 2,308 form the testing set, i.e. the ones used to test trained models. The keypoints are stored in .csv files that can also be found in the ./data/ directory. Here are a couple of examples with their associated keypoints:

Oh no, Priyanka – you've got something on your face! Kit, you look fine.

Those pink dots are the keypoints. There are 68 of them, each with their own accessible coordinates, and they identify important facial structures. Each keypoint is individually numbered, and ranges of numbers can be used to select specific facial regions.

They generally increase left-to-right, and they identify regions as follows:

This will be important later.

1.1 Types of Data

Now, the image data must be retrieved, loaded, and repackaged into a new form that maintains association with the keypoint data.

First, the image data is retrieved and unzipped.

The information about the images and keypoints in this dataset is summarized in .csv files, which can be read in using pandas (🐼). From the training CSV, I collect the keypoint annotations as an (N, 2) array, where N is the number of keypoints and 2 is the dimension of each keypoint's coordinates: (x, y).

Note: when I mention the dimensions of something, think of those dimensions as the columns and rows of a table. Because that's what they are. If an object has 3 dimensions, you can think of them as a stack of 2-dimensional tables or maybe as a Rubik's cube. Again, that's roughly what they are.

The following will retrieve the image data and unzip it into the ./data/ directory:

Next, the .csv files must be read in by pandas (🐼); and, while that's imported, everything else may as well be imported too.

Finally, images and known keypoints can be bundled together into the arrays mentioned above.
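A minimal sketch of that bundling step, assuming the CSV layout described above (the file name here is an assumption; check ./data/ for the actual names):

    import pandas as pd

    # File name is assumed; the training and testing CSVs live in ./data/
    key_pts_frame = pd.read_csv('data/training_frames_keypoints.csv')

    # Column 0 is the image file name; the remaining 136 columns are the 68 (x, y) pairs
    n = 0
    image_name = key_pts_frame.iloc[n, 0]
    key_pts = key_pts_frame.iloc[n, 1:].to_numpy().astype('float').reshape(-1, 2)

    print('Image name:', image_name)
    print('Keypoints shape:', key_pts.shape)  # -> (68, 2)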

1.2 Check Images

Below, the function show_keypoints takes in an image and keypoints and displays them.
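A sketch of what such a helper can look like (the notebook's version may differ in details):

    import matplotlib.pyplot as plt

    def show_keypoints(image, key_pts):
        """Show an image with its keypoints plotted on top."""
        plt.imshow(image)
        plt.scatter(key_pts[:, 0], key_pts[:, 1], s=20, marker='.', c='m')
        plt.show()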

This is a good moment to just check out a whole bunch of different images and develop a feel for the dataset and the objective. Important takeaways from this step are that the images are all different shapes and sizes, so they'll have to be normalized in at least a couple different ways.

1.3 Dataset Class

The following is a modified version of the Dataset class from PyTorch and directions for using it, both provided by Udacity.

torch.utils.data.Dataset is an abstract class representing a dataset. This class will allow us to load batches of image/keypoint data, and uniformly apply transformations to our data, such as rescaling and normalizing images for training a neural network.

Your custom dataset should inherit Dataset and override the following methods:

  • __len__ so that len(dataset) returns the size of the dataset.
  • __getitem__ to support the indexing such that dataset[i] can be used to get the i-th sample of image/keypoint data.

Let's create a dataset class for our face keypoints dataset. We will read the CSV file in __init__ but leave the reading of images to __getitem__. This is memory efficient because the images are not all stored in memory at once but read as required.

A sample of our dataset will be a dictionary {'image': image, 'keypoints': key_pts}. Our dataset will take an optional argument transform so that any required processing can be applied on the sample. We will see the usefulness of transform in the next section.
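Following those directions, the dataset class can look roughly like this (the class name and the CSV column layout are assumptions based on the description above):

    import os
    import matplotlib.image as mpimg
    import pandas as pd
    from torch.utils.data import Dataset

    class FacialKeypointsDataset(Dataset):
        """Bundles each image with its keypoints as {'image': ..., 'keypoints': ...}."""

        def __init__(self, csv_file, root_dir, transform=None):
            # Read the CSV once, up front; images are read lazily in __getitem__
            self.key_pts_frame = pd.read_csv(csv_file)
            self.root_dir = root_dir
            self.transform = transform

        def __len__(self):
            return len(self.key_pts_frame)

        def __getitem__(self, idx):
            image_name = os.path.join(self.root_dir, self.key_pts_frame.iloc[idx, 0])
            image = mpimg.imread(image_name)
            key_pts = self.key_pts_frame.iloc[idx, 1:].to_numpy().astype('float').reshape(-1, 2)
            sample = {'image': image, 'keypoints': key_pts}
            if self.transform:
                sample = self.transform(sample)
            return sample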

Awesome.

The previous code cell instantiates the dataset, while the following fires off a few random requests to see what the dataset returns.

1.4 Transforms

Likewise, Udacity provided some transform functions for preprocessing the images – but I think these may just be copies of torchvision functions? Regardless, images need to be preprocessed, because networks expect inputs of a certain size (224x224 seems popular) and a particular color normalization. Also, as required by PyTorch, everything created thus far must be converted from NumPy lists and arrays into Tensors.

Here's what Udacity provides:

  • Normalize: to convert a color image to grayscale values with a range of [0, 1] and normalize the associated keypoints to be within a range of about [-1, 1].
  • Rescale: to rescale an image to a desired size.
  • RandomCrop: to crop an image randomly.
  • ToTensor: to convert numpy images to torch images.

We will write them as callable classes instead of simple functions so that parameters of the transform need not be passed every time it's called. For this, we just need to implement the __call__ method and (if we require parameters to be passed in) the __init__ method. We can then use a transform like this:

tx = Transform(params)
transformed_sample = tx(sample)

Observe below how these transforms are generally applied to both the image and its keypoints.
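For example, a Rescale along these lines scales the keypoints by the same factors as the image (a sketch, not the notebook's exact implementation):

    import cv2

    class Rescale:
        """Rescale the image so its smaller side equals output_size, keypoints included."""

        def __init__(self, output_size):
            self.output_size = output_size

        def __call__(self, sample):
            image, key_pts = sample['image'], sample['keypoints']
            h, w = image.shape[:2]
            # Preserve aspect ratio: the smaller side becomes output_size
            if h > w:
                new_h, new_w = self.output_size * h / w, self.output_size
            else:
                new_h, new_w = self.output_size, self.output_size * w / h
            new_h, new_w = int(new_h), int(new_w)
            image = cv2.resize(image, (new_w, new_h))
            # Keypoints move with the image
            key_pts = key_pts * [new_w / w, new_h / h]
            return {'image': image, 'keypoints': key_pts}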

Fabulous.

1.5 Test the Transforms

This just fires off some transforms to see what they do and whether they do what was expected. They do.

1.6 Create the Transformed Dataset

Finally, the tools are assembled, and the actual dataset (that will be used momentarily for training) can be created. The image is rescaled such that the smaller dimension is 256 pixels, a 224x224 segment is randomly cropped from somewhere within bounds, color normalization and the grayscale filter are applied, and finally the image can be converted to a Tensor.
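Roughly, the composition looks like this (the CSV and directory names are assumptions; Rescale, RandomCrop, Normalize, and ToTensor are the callable classes described above):

    from torchvision import transforms

    data_transform = transforms.Compose([
        Rescale(256),     # smaller side scaled to 256 px
        RandomCrop(224),  # random 224x224 crop within bounds
        Normalize(),      # grayscale, pixels in [0, 1], keypoints roughly in [-1, 1]
        ToTensor()        # NumPy arrays -> PyTorch tensors
    ])

    transformed_dataset = FacialKeypointsDataset(
        csv_file='data/training_frames_keypoints.csv',
        root_dir='data/training/',
        transform=data_transform
    )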

This data_transform pipeline will be used repeatedly throughout this project.

2.0 Define the Convolutional Neural Network

This section will progress through assembling the model; training the network; benchmarking its performance; and, if it doesn't perform well, repeating the process until it does.

2.1 CNN Architecture

Convolutional Neural Networks (CNNs) are composed of a few specific layers:

I also use dropout layers, which help prevent overfitting, i.e. when the model memorizes the training set and can't generalize beyond it. Dropout layers do slow down the training process, but – within the safety of this personal project – I can just increase the learning rate and lower the number of epochs. Reckless training won't crash any autonomous cars here.

The model I build in model.py is just a copy of NaimishNet from this scholarly paper, which sounds like I'm being academic, but I'm really just letting someone smarter think for me – thanks, gang! So, the architecture looks something like this:

2.2 PyTorch Neural Networks

Udacity provides the following notes on using PyTorch:

To define a neural network in PyTorch, you define the layers of a model in the function __init__ and define the feedforward behavior of a network that employs those initialized layers in the function forward, which takes in an input image tensor, x. The structure of this Net class is shown below and left for you to fill in.

Note: During training, PyTorch will be able to perform backpropagation by keeping track of the network's feedforward behavior and using autograd to calculate the update to the weights in the network.

Define the Layers in __init__

As a reminder, a conv/pool layer may be defined like this (in __init__):

  # 1 input image channel (for grayscale images), 32 output channels/feature maps, 3x3 square convolution kernel
  self.conv1 = nn.Conv2d(1, 32, 3)
  # maxpool that uses a square window of kernel_size=2, stride=2
  self.pool = nn.MaxPool2d(2, 2)

Refer to Layers in forward

Then referred to in the forward function like this, in which the conv1 layer has a ReLU activation applied to it before maxpooling is applied:

x = self.pool(F.relu(self.conv1(x)))

Best practice is to place any layers whose weights will change during the training process in __init__ and refer to them in the forward function; any layers or functions that always behave in the same way, such as a pre-defined activation function, should appear only in the forward function.
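Put together, the skeleton of such a class looks something like this (a stripped-down sketch, not the NaimishNet variant actually defined for this project; layer sizes are illustrative):

    import torch.nn as nn
    import torch.nn.functional as F

    class Net(nn.Module):
        def __init__(self):
            super().__init__()
            # Layers with learnable weights belong in __init__
            self.conv1 = nn.Conv2d(1, 32, 5)            # 224x224 -> 220x220
            self.pool = nn.MaxPool2d(2, 2)              # 220x220 -> 110x110
            self.fc1 = nn.Linear(32 * 110 * 110, 136)   # 136 = 68 keypoints * (x, y)

        def forward(self, x):
            # Stateless operations like F.relu appear only here
            x = self.pool(F.relu(self.conv1(x)))
            x = x.view(x.size(0), -1)
            return self.fc1(x)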

Import model

You are tasked with defining the network in the models.py file so that any models you define can be saved and loaded by name in different notebooks in this project directory. For example, by defining a CNN class called Net in models.py, you can then create that same architecture in this and other notebooks by simply importing the class and instantiating a model:

    from models import Net
    net = Net()

Originally, it was important that model.py was a separate file, because this used to be multiple Jupyter notebooks and each needed access to it. However, I've since merged all the notebooks, and model.py remains more as a vestige of that workflow than as an example of good separation of concerns.

2.3 Transform the Data

Again, this appears to already have been done above, but this notebook used to be multiple notebooks and there was some overlap. It doesn't hurt to see the transformation pipeline again; and, this time, it calls from data_load.py, which is a better workflow.

What follows are the transforms I defined:

2.4 Batch the Data

Batch size is another one of those hyperparameters that (a) I theoretically understand, but (b) I still just randomly twist the knob up and down. Smaller batch sizes can help a network generalize better, but larger batch sizes will train faster. In my reading, I see many people suggesting 32 as an acceptable all-around size; but, in this case, I had some spare time and dropped the size to 10 – testing improved by an amount so small that it was probably just variance.

Just pop the transformed dataset into PyTorch's DataLoader.
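Something like this (variable names carried over from the earlier cells):

    from torch.utils.data import DataLoader

    batch_size = 10

    train_loader = DataLoader(transformed_dataset,
                              batch_size=batch_size,
                              shuffle=True,
                              num_workers=4)   # Windows users: see the note below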

From Udacity:

Note for Windows users: Please change the num_workers to 0 or you may face some issues with your DataLoader failing.

Good note, thanks.

2.5 Load the Test Data

While loading the training set, why not also load the testing set? The test data isn't shown to the model during training, as the name implies. Unseen data like this will be the only accurate way to confirm whether the network can accomplish the objective, because the network will have seen the contents of the training set many thousands of times by the time training finishes.
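Same recipe, pointed at the test CSV and directory (names assumed):

    test_dataset = FacialKeypointsDataset(csv_file='data/test_frames_keypoints.csv',
                                          root_dir='data/test/',
                                          transform=data_transform)

    test_loader = DataLoader(test_dataset,
                             batch_size=batch_size,
                             shuffle=True,
                             num_workers=4)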

2.6 Apply Model to Test Sample

Currently, the model has random starting weights and isn't remotely "intelligent" yet; but that doesn't mean it can't be given samples!

For some sanity checking, I assembled this pipeline earlier than necessary and passed a sample through it, so I could see the base performance of the untrained model. Plus, this step will also help detect leaks in the pipe.
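In code, that first pass looks roughly like this (net and test_loader come from the cells above):

    import torch

    # Pull one batch from the test loader and run it through the untrained net
    sample = next(iter(test_loader))
    images = sample['image'].type(torch.FloatTensor)   # (batch, 1, 224, 224)

    with torch.no_grad():
        output_pts = net(images)

    # 136 outputs per face -> reshape into 68 (x, y) pairs
    output_pts = output_pts.view(output_pts.size(0), 68, -1)
    print(output_pts.shape)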

2.7 Debugging

At this point, I was seeing size errors, because the NaimishNet architecture didn't transfer verbatim. The following was helpful for debugging:
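Something in this spirit, pushing a dummy batch through the network to surface size mismatches (a sketch, not the notebook's exact cell):

    import torch

    # A fake grayscale 224x224 batch; a mis-sized fully-connected layer
    # will raise a RuntimeError naming the offending shapes
    dummy = torch.randn(1, 1, 224, 224)
    out = net(dummy)
    print(out.shape)   # expect torch.Size([1, 136])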

2.8 Visualize Predicted Keypoints

Udacity provided this show_all_keypoints function to visualize both the predicted keypoints (pink) and the actual keypoints (green):

But that's not all. Once the model completes the feed-forward process on a sample and returns an inference, the sample remains transformed – it'll need to be un-transformed before it can be appreciated by human eyeballs.

That's where the following helper function comes in:

Alright, cool – so, when the model doesn't yet know any better, it just places all the keypoints in the center. That's interesting.

2.9 Loss Function and Optimizer

All that remains before training the network is setting the loss function and optimizer and defining the hyperparameters.

In my image classifier, cross entropy loss was the obvious choice for a classification task, i.e. one that produces many outputs each equal to the probability of something being true. However, in a regression task like this one, there will only be two outputs per keypoint: an x coordinate and a y coordinate. According to this documentation, regression can use mean squared error (or MSE) instead.

As for the optimizer, Adam was a good friend in high school, so I always give him a chance first. Yee, boi!
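The setup itself is two lines (the learning rate here is illustrative):

    import torch.nn as nn
    import torch.optim as optim

    criterion = nn.MSELoss()                             # regression over (x, y) coordinates
    optimizer = optim.Adam(net.parameters(), lr=0.001)   # Adam gets the first shot, as always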

2.10 Training

At this point, everything has been explained – probably more than once! But some guesswork does remain. I always start with just a few epochs to save time and determine whether everything works before finally jumping up to 20 epochs for the real run. See you on the other side!
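The training loop is the standard PyTorch pattern (a sketch, using the names defined above):

    import torch

    def train_net(n_epochs):
        net.train()
        for epoch in range(n_epochs):
            running_loss = 0.0
            for data in train_loader:
                images = data['image'].type(torch.FloatTensor)
                key_pts = data['keypoints'].type(torch.FloatTensor)
                key_pts = key_pts.view(key_pts.size(0), -1)   # flatten to match the 136 outputs

                optimizer.zero_grad()
                output_pts = net(images)
                loss = criterion(output_pts, key_pts)
                loss.backward()
                optimizer.step()

                running_loss += loss.item()
            print(f'Epoch {epoch + 1}, avg. loss: {running_loss / len(train_loader):.4f}')

    train_net(n_epochs=20)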

2.11 Testing

The previous training routine took about 2 hours to complete, but I ran some variation of the last couple steps several times before accepting this model. Below, you'll find the results of this test – remember: the pink points are predicted by the model, while the green points are the actual, known keypoints.

Uh-oh, I still see some signs of overfitting. Notice how the predicted points tend to be slightly more centralized than the actual keypoints, or how the predicted points don't deform their structure quite as much when the face isn't looking directly into the camera?

This was a pretty good showing, however; I definitely saw worse on previous runs. So, I'll move on to...

2.12 Save the Model
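Nothing fancy here: just the learned weights, so the architecture can be re-created from the class definition when loading (directory and file name below are assumptions):

    import torch

    model_dir = 'saved_models/'
    model_name = 'keypoints_model.pt'

    torch.save(net.state_dict(), model_dir + model_name)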

2.13 Nanodegree Questions

The following are questions that I had to answer when submitting this project to Udacity for my Computer Vision Nanodegree:

Question 1: What optimization and loss functions did you choose and why?

Answer: I used Adam, because it seems to be the latest hotness that all the gals down in Stack Overflow are talking about. For loss function, I used MSE, but I don't know whether it was an impactful choice – all I know is that it had to be a function suitable to a regression problem.

Question 2: What kind of network architecture did you start with and how did it change as you tried different architectures? Did you decide to add more convolutional layers or any layers to avoid overfitting the data?

Answer: My network is based on the NaimishNet example, because I doubt that I can do better than people who have dedicated their lives to the study of this subject. Oh, wait, I actually did try to do better! I added fully-connected layers to NaimishNet, but they only increased overfitting. Today I Learned.

Question 3: How did you decide on the number of epochs and batch_size to train your model?

Answer: From what I can tell, 20 epochs seems to be an accepted standard for a proof of concept. I chose a batch size of 10, because smaller batches have been shown to improve a model's ability to generalize. But I've since observed that batch sizes that are divisible by 8 seem to be more fashionable; so, in the future, I'll probably default to 16 or 32.

Question 4: Choose one filter from your trained CNN; what purpose do you think it plays? What kind of feature do you think it detects?

Answer: The first filter (index=0) doesn't do anything dramatic – it's really just a gentle blur. However, I wonder whether mild filters like this one are also beneficial; perhaps they preserve certain features for extraction by subsequent layers.

2.14 Feature Visualization

Now that I have a "working" model, the first thing I wanna do is jump into those guts and see what's happening inside. Aren't you curious what these images look like after they've been transformed, convolved, and maxpooled? Let's take a look at what's going on inside a CNN.

First, an example of what a convolution filter looks like:

This little 5x5 block slides left-to-right, top-to-bottom across the image, multiplying the pixels underneath by its weights and summing the results. That seemingly random pattern might highlight important features and/or reduce everything else to a featureless gray soup. The end result of this filtering process is called a feature map and can look something like this:

This particular feature map might function as edge detection for a light source originating from the top-left corner, but feature maps aren't created intentionally or with such clear purpose. Basically, the network values this feature map for some reason, because the filter weights were incrementally shifted until this map was created – but I can only speculate why.
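A sketch of how a filter and its feature map can be pulled out and inspected (assumes net and test_loader from the earlier cells; the filter index is arbitrary):

    import cv2
    import matplotlib.pyplot as plt

    # First conv layer's weights: (out_channels, in_channels, k, k)
    weights = net.conv1.weight.data.numpy()
    filter_0 = weights[0][0]                 # one filter, single grayscale input channel

    plt.imshow(filter_0, cmap='gray')        # the little block described above
    plt.show()

    # Apply that filter to one transformed image to produce its feature map
    sample = next(iter(test_loader))
    gray_image = sample['image'][0][0].numpy().astype('float32')
    feature_map = cv2.filter2D(gray_image, -1, filter_0)
    plt.imshow(feature_map, cmap='gray')
    plt.show()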

3.0 Face and Facial Keypoint Detection

Now that the network has been trained and proven (somewhat) effective through testing, it can apply facial keypoints to any image – for proper function, that image ought to include at least one human face, but I suppose you're free to confuse the network by passing something else through.

However, the network currently only knows how to detect facial keypoints; it doesn't know how to detect faces yet. The dataset had already been preprocessed in such a way that the faces contained within were more or less the focal point of the image. And what about images with more than one face?

In section 3, the pipeline will be extended to include the following:

  1. Detect every face within an image using a face detector, so those faces can be cropped out of the original image
  2. Preprocess those cropped samples into the format the network expects, i.e. grayscale Tensors of size 224x224
  3. Apply the trained model and be amazed!

Let's get back into it...

The following will display the selected image (again, you could replace this with any image at this point), completely unprocessed:
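That's just an OpenCV read plus a colorspace conversion (the file name is an assumption):

    import cv2
    import matplotlib.pyplot as plt

    # OpenCV loads images as BGR; flip to RGB before displaying with matplotlib
    image = cv2.imread('images/obamas.jpg')
    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)

    plt.imshow(image)
    plt.show()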

Looking good, Obamas!

3.1 Detect All Faces

In order to detect where exactly their faces are, or even how many faces there are, I'm using a pre-trained Haar Cascade detector via OpenCV. The detector I'm using is located in the ./detectors/ directory and works by using tiny 2x2 and 3x3 filters like these, which are called Haar features:

You'll notice that, unlike the filter shown above, Haar features are strictly 100% or 0% – there are no shades of gray. They also have specific, prescribed patterns, which are useful for locating the edges of shapes in images.

It's called a Haar Cascade detector, because it uses a cascade of classifiers that all use Haar features. So, rather than constantly running and re-running thousands of "is this a face?" checks, the cascade begins by running a few "could this region possibly contain a face?" checks. If the region can't, then the detector tosses out that region and moves on to the next. But, if the region can, the cascade continues through a series of other classifiers that check for increasingly specific indicators that a face is present – if any of these fail, the detector tosses it out and moves on again.
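In code, the whole cascade is a couple of calls (the .xml file name inside ./detectors/ is an assumption):

    import cv2

    # Load the pre-trained frontal-face cascade and run it on a grayscale copy
    face_cascade = cv2.CascadeClassifier('detectors/haarcascade_frontalface_default.xml')
    gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)

    # Returns one (x, y, w, h) bounding box per detected face
    faces = face_cascade.detectMultiScale(gray, scaleFactor=1.2, minNeighbors=2)

    # Draw the boxes for a quick visual check
    image_with_detections = image.copy()
    for (x, y, w, h) in faces:
        cv2.rectangle(image_with_detections, (x, y), (x + w, y + h), (255, 0, 0), 3)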

Here's an example of successful Haar Cascade detection:

3.2 Load Trained Model

As before, this project used to be multiple notebooks. So, loading the model again isn't necessary anymore, but it's always good to see the full process.

3.3 Keypoint Detection

This time, when I loop over the faces in the sample image, I will transform each selection according to what the network expects; once again, that's a grayscale Tensor of size 224x224 with normalized pixel values. The transforms will be the same ones from data_load.py that I have already used several times.

Udacity provides this helpful hint for how to handle faces that vary significantly from the size the model expects:

Hint: The sizes of faces detected by a Haar detector and the faces your network has been trained on are of different sizes. If you find that your model is generating keypoints that are too small for a given face, try adding some padding to the detected roi before giving it as input to your model.
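Putting the hint and the transforms together, the per-face loop looks roughly like this (the padding amount and variable names are assumptions; faces, net, and image come from the earlier steps):

    import cv2
    import numpy as np
    import torch

    image_copy = np.copy(image)
    pad = 50   # extra context around the Haar box, per the hint above

    for (x, y, w, h) in faces:
        # Crop a padded region of interest around the detected face
        roi = image_copy[max(y - pad, 0):y + h + pad, max(x - pad, 0):x + w + pad]

        # Match the training format: grayscale, [0, 1] pixels, 224x224, (1, 1, 224, 224) tensor
        roi = cv2.cvtColor(roi, cv2.COLOR_RGB2GRAY)
        roi = roi / 255.0
        roi = cv2.resize(roi, (224, 224))
        roi_tensor = torch.from_numpy(roi).type(torch.FloatTensor).unsqueeze(0).unsqueeze(0)

        # Predict the 68 keypoints for this face; remember that the outputs are still
        # in the normalized space used during training and need un-normalizing before
        # plotting, as in section 2.8
        with torch.no_grad():
            output_pts = net(roi_tensor)
        key_pts = output_pts.view(68, 2).numpy()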

Finally, the image can be passed through the network, and hopefully something like this will emerge:

That looks pretty good!

But I do see further examples of the model overfitting, like how the points aren't elastic enough to accommodate Barack's beautiful chin.

4.0 Facial Filters

Alright, friends – the network can detect facial keypoints, and it can now detect faces! There's only one thing left to do before the singularity can begin: the network must be capable of putting "Deal With It" sunglasses on any detected face! Here's what I'm shooting for:

First, the sunglasses...

4.1 Overlay Sunglasses

Like me, you might recognize the concept of an alpha channel from Photoshop. But, now, that channel has a novel use: it can be used to decide which pixels from the sunglasses image (all pixels with alpha > 0) should be overlaid on the face image and, once scaled, where they should be placed relative to the image anchor.

The last puzzle to solve will be how to place that anchor...

Let's flashback to the example of numbered facial keypoints:

Using this example as the key, everything from eye width to nose length can be calculated programmatically! It will require some calibration to figure out exactly how sunglasses fit on someone's face; but, once the variables have been nailed down, no face will be safe!

But there will be one important hitch to remember: the numbers above are off by one, because the keypoint array will begin with keypoint[0].

Now, I gotta grab some keypoints and start calibrating...
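The calibration boils down to picking anchor keypoints and scaling the overlay to fit. A sketch of the overlay step, in which the file name and the specific keypoint indices are assumptions to be tuned against the numbered map above, and key_pts is assumed to already be in the original image's pixel coordinates:

    import cv2

    # Load the sunglasses with the alpha channel intact (4 channels)
    sunglasses = cv2.imread('images/sunglasses.png', cv2.IMREAD_UNCHANGED)

    # Anchor and size the overlay from a few keypoints (indices are illustrative)
    x = int(key_pts[17, 0])                           # outer edge of one eyebrow
    y = int(key_pts[17, 1])
    w = int(abs(key_pts[17, 0] - key_pts[26, 0]))     # eyebrow-to-eyebrow width
    h = int(abs(key_pts[27, 1] - key_pts[34, 1]))     # roughly the length of the nose

    new_sunglasses = cv2.resize(sunglasses, (w, h), interpolation=cv2.INTER_CUBIC)
    roi_color = image_copy[y:y + h, x:x + w]

    # Copy only the pixels where alpha > 0; leave the face showing everywhere else
    alpha = new_sunglasses[:, :, 3]
    roi_color[alpha > 0] = new_sunglasses[alpha > 0][:, :3]
    image_copy[y:y + h, x:x + w] = roi_color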

Heck yeah! Data science!

Made by SeanvonB | Source