AI Image Classifier

Made by SeanvonB | Source

This was the final project of my AI Programming Nanodegree from Udacity, which I completed in 2019. The purpose of this project was to train an image classifier for use in a hypothetical smartphone app – in our case, an app that could identify the name of a flower simply by looking at it with the phone's camera. For training such a network, we were given the 102 Category Flower Dataset from the University of Oxford's Visual Geometry Group, or VGG, which contains between 40 and 258 images for each of the 102 categories. Here are a few examples of these images and their associated class-to-name identities:

Per Udacity's instruction, the project was broken down into three steps:

It's also worth mentioning that this project uses flowers as an example, but the model could theoretically classify images according to any dataset that can be made available to it. Replace the data folder with VGG's Pet Dataset and tweak a couple links, re-run the training cycle, then – bam! – this project becomes a pet breed classifier!

Loading Packages

This project uses PyTorch plus Torchvision and PIL to preprocess images, assemble the model architecture, and train the network. It also relies on Matplotlib to present data and NumPy for matrix multiplication.

The training cycles will default to CUDA for GPU training when available. With CUDA, the network can reach passable accuracy in about an hour; without CUDA, I didn't even try – CPU training would likely take many hours, if not days.

Loading the Data

The first step was separating small test and valid subsets from the bulk of the dataset, which will remain as the train subset. The first two represent data that the model doesn't see during the training step, so they can be used to measure performance between (valid) or after (test) the training cycles. This step was already completed but could have been done programmatically as well.

Next, all three sets must be resized and cropped to a size of 224x224 pixels, which are the dimensions required by most (including VGG's) pre-trained networks. But, to help the network generalize better and overfit less, the train set can also be subjected to a selection of Torchvision transformations, like random rotation, random cropping, random flipping, and color jittering – these functionally expand the set by creating random variations of the same images.

Finally, the pre-trained networks available to me were all trained on ImageNet data, which normalizes each color channel separately. After converting the images to tensors, this normalization happens simply by passing them the mean and standard deviation of each color channel as calculated from ImageNet, which shifts and scales each channel's values to be roughly centered on zero.

Mapping Labels to Names

This step is a minor but extremely necessary formality. The dataset isn't labeled in a way that's helpful to humans: there isn't a class labeled daffodil – but there is a class labeled 42 that contains a whole bunch of daffodil images. The file class_to_name.json contains all such associations and can be used to interpret the network's results.
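The mapping itself is just a plain JSON object of label strings to names. A minimal sketch – the inline string below stands in for the real class_to_name.json file:

```python
import json

# In the project this comes from class_to_name.json; the inline string
# here just illustrates the shape of the mapping.
mapping_json = '{"42": "daffodil"}'
class_to_name = json.loads(mapping_json)

# Keys are the numeric class labels (as strings), values are flower names
print(class_to_name["42"])  # → daffodil
```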

Building the Classifier

The network will be built upon a pre-trained network, but it will feature a new and untrained feed-forward network as the classifier. I tested AlexNet, DenseNet, and ResNet, but I ultimately found that the first one I tried, VGG, worked equally well. So I stuck with it.

My classifier is a pretty simple little layer cake of linear, ReLU, and dropout layers, each gradually reducing the number of features until it reaches the number of discrete classes within the dataset. The dropout chance starts low but increases, as suggested in Dropout: A Simple Way to Prevent Neural Networks from Overfitting.

Training the Classifier

All that remains to be done before baking this cake is defining the hyperparameters and training cycle. Hyperparameters – like the number of epochs, testing frequency, batch size, and learning rate – mostly determine the resources, primarily time, that will be allocated to training.

Udacity expected a final accuracy of > 70%, but I hit 86.5% without too much time investment. Higher accuracy is easily attainable, but it might require cloud computing time to be realistic.

Testing the Network

The network will see versions of the training set images many thousands of times, and without proper precautions, it will begin learning how to identify those specific images rather than learning how to generally identify what those images contain. The same is true for the validation set, despite the network seeing it less frequently. This behavior is called overfitting.

To confirm whether the accuracy seen during training is indeed accurate, the trained network should be tested with the unseen images in the testing set. Fortunately, this network classifies the testing set as accurately as the validation set, so we can say that this network isn't overfitting.

Saving and Loading the Checkpoint

If testing went well enough, the checkpoint deserves to be saved and compared to future checkpoints, until an acceptable winner emerges. This checkpoint can then be reloaded for further inference.

A "checkpoint" includes everything needed to completely rebuild the model as it stood at the end of testing: the classifier, the hyperparameters, the optimizer state, etc.

Inference for Classification

Now to start classifying stuff! Once a high-performing checkpoint emerges, it can be loaded into another pipeline: a simplified version of the preprocessing and feed-forward stages of training, with a single image as the input and the top K output probabilities as the result, each roughly the likelihood of that image belonging to that class.

Image Preprocessing

Just like training, inference also requires some preprocessing, because the network was trained with a narrow expectation of input – namely, a 224x224 image with colors normalized according to ImageNet. To be safe, I resize the images such that the shortest dimension is 256 pixels, then I crop a 224x224 section from the middle; this helps the network focus on the center of the image.

Two more things: PyTorch expects the color channel to be the first matrix dimension, while PIL and NumPy put it third – but a quick NumPy transpose can reorder those. Likewise, the network expects the image to be transformed and normalized in specific ways, but our eyeballs expect the images to be as they were – better to undo that as well.
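A sketch of that inference preprocessing with PIL and NumPy – the function name is mine, but the steps follow the description above: resize the shortest side to 256, center-crop to 224x224, normalize with the ImageNet statistics, and transpose the color channel to the front:

```python
import numpy as np
from PIL import Image

def process_image(image):
    """Turn a PIL image into a normalized (3, 224, 224) NumPy array."""
    # Resize so the shortest side is 256 pixels, preserving aspect ratio
    w, h = image.size
    if w < h:
        image = image.resize((256, int(256 * h / w)))
    else:
        image = image.resize((int(256 * w / h), 256))
    # Crop a 224x224 section from the middle
    w, h = image.size
    left, top = (w - 224) // 2, (h - 224) // 2
    image = image.crop((left, top, left + 224, top + 224))
    # Scale to 0-1, then normalize with the ImageNet mean and std
    array = np.array(image) / 255.0
    array = (array - [0.485, 0.456, 0.406]) / [0.229, 0.224, 0.225]
    # PIL/NumPy put the color channel last; PyTorch expects it first
    return array.transpose(2, 0, 1)
```

Displaying the image again is just these steps in reverse: transpose the channel back to last, multiply by the std and add the mean, and clip to the 0-1 range.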

Class Prediction

Finally, the full pipeline is complete: everything from inference to label-name mapping to results presentation can be combined, an image can be given as input, and a classification of the image can be expected as output.

Sanity Checking

It's wise to return more than just the highest single probability, however, because the added information can confirm how certain the network is about the classification it has made. For instance, in the following inference, there are strong runners-up, which means there's some significant uncertainty:

Now, let's see whether mine can do better...

Booyah! That's a wild pansy, bay bee!
Thank you for reading!
