Example 2: Training a classifier based on sequence data
=======================================================

In this example we train a model on entire typhoon sequences from the dataset. Because the sequences have different lengths, every sequence (and its labels) must be padded to the length of the longest sequence (505 frames). The model takes a whole padded sequence of 505 frames as input and returns one prediction for each frame in the sequence.

The Code
-----------
::

	import torch
	from torch import nn
	from torch import optim
	import torch.nn.functional as F
	import numpy as np
	import pandas as pd
	from tqdm import tqdm
	from torchvision import datasets, transforms, models
	import argparse
	from pathlib import Path
	from torch.utils.data import DataLoader

	from DigitalTyphoonDataloader.DigitalTyphoonDataset import DigitalTyphoonDataset

	def main(args):
	    """Train a dummy per-frame grade classifier on padded typhoon sequences.

	    The dataset is loaded sequence-by-sequence, every sequence is padded to a
	    fixed length, and a minimal model predicts one grade per frame.

	    Args:
	        args: parsed command-line namespace. Reads ``dataroot`` (root data
	            directory) and the number of epochs (``max_epochs``, falling
	            back to ``maxepochs``).
	    """

	    ## Hyperparameters
	    # Defined first: the data loaders, the transform closure and the model below all read them.

	    # argparse may expose the epoch count as either max_epochs or maxepochs,
	    # depending on how the flag is declared; accept both.
	    num_epochs = getattr(args, 'max_epochs', None)
	    if num_epochs is None:
	        num_epochs = args.maxepochs
	    batch_size = 16
	    num_workers = 0  # DataLoader default (load in the main process); raise to load in parallel
	    learning_rate = 0.001
	    max_sequence_length = 505  # length of the longest sequence; all others are padded to it
	    standardize_range = (150, 350)
	    downsample_size = (224, 224)
	    # image_filter keeps only grades below 7 and padded frames are labelled 0, so
	    # labels index into [0, 7) -- assumes grades are non-negative integers.
	    num_classes = 7

	    ## Prepare the data

	    # Specify the paths to the data
	    data_path = args.dataroot
	    images_path = data_path + '/image/'  # to the image folder
	    metadata_path = data_path + '/metadata/'  # to the metadata folder
	    json_path = data_path + '/metadata.json'  # to the metadata json

	    # Define a filter to pass to the loader.
	    #     Any image for which the function returns True will be included
	    def image_filter(image):
	        return image.grade() < 7

	    # Define a function to transform each image, to pass to the loader.
	    # Crucially, this transform function is applied to each *image*, prior to any Pytorch processing.
	    # So, image-by-image transforms (e.g. clipping, downsampling, etc.) can/should be done here
	    def transform_func(image_ray):
	        low, high = standardize_range

	        # Clip the pixel values to the standardize range (150 to 350)
	        image_ray = np.clip(image_ray, low, high)

	        # Standardize the pixel values between 0 and 1
	        image_ray = (image_ray - low) / (high - low)

	        # Downsample the images to downsample_size (224, 224)
	        if downsample_size != (512, 512):
	            # interpolate() expects (batch, channel, height, width), so add two
	            # leading singleton axes and strip them again afterwards
	            image_ray = torch.as_tensor(image_ray, dtype=torch.float32)[None, None]
	            image_ray = nn.functional.interpolate(image_ray, size=downsample_size,
	                                                  mode='bilinear', align_corners=False)
	            image_ray = image_ray[0, 0].numpy()
	        return image_ray

	    # Load Dataset
	    dataset = DigitalTyphoonDataset(str(images_path),
	                                    str(metadata_path),
	                                    str(json_path),
	                                    'grade',  # the labels we'd like to retrieve from the dataset
	                                    get_images_by_sequence=True,  # indicate we want typhoon sequences returned
	                                    filter_func=image_filter,  # the filter function defined above
	                                    transform_func=transform_func,  # the transform function defined above
	                                    transform=transforms.Compose([  # pytorch transform to apply to data before returning data
	                                        PadSequence(max_sequence_length),
	                                    ]),
	                                    verbose=False)

	    # Split the dataset into a training and test split (80% and 20% respectively)
	    #   split by sequence so all images in one sequence will belong to the same bucket
	    train_set, test_set = dataset.random_split([0.8, 0.2], split_by='sequence')

	    # Make Pytorch DataLoaders out of the returned sets. From here, it retains all Pytorch functionality.
	    trainloader = DataLoader(train_set, batch_size=batch_size, shuffle=True, num_workers=num_workers)
	    testloader = DataLoader(test_set, batch_size=batch_size, shuffle=False, num_workers=num_workers)

	    ## Prepare the model

	    # Create a dummy model that takes input of size (batch, 505, 224, 224)
	    # (batch size, seq length, height, width) and outputs class scores for each
	    # image in the sequence (shape (batch, 505, num_classes)).
	    model = nn.Sequential(
	        nn.Flatten(start_dim=2),  # (batch, seq len, height * width)
	        nn.Linear(downsample_size[0] * downsample_size[1], num_classes),
	    )

	    # Loss and optimizer
	    # NOTE(review): padded frames carry label 0 and currently contribute to the
	    # loss; pass ignore_index=0 here if 0 is not a real grade -- confirm.
	    criterion = nn.CrossEntropyLoss()
	    optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate, momentum=0.9)

	    ## Train the model
	    for epoch in range(num_epochs):

	        model.train()

	        for sequence, labels in tqdm(trainloader):
	            # One batch of the data (up to 16 sequences and their labels)
	            # sequence is shape (batch size, 505, 224, 224) (batch size, seq len, height, width)
	            # labels is shape (batch size, 505), as the labels were padded as well.

	            # cast pixels to float and grade (label) to long
	            sequence = torch.as_tensor(sequence).float()
	            labels = torch.as_tensor(labels).long()

	            optimizer.zero_grad()

	            # Forward pass: one score per class for every frame
	            predictions = model(sequence)

	            # Calculate the loss. CrossEntropyLoss wants (N, classes) scores and (N,)
	            # targets, so fold the batch and sequence axes together. Deriving the
	            # shape from the data keeps a smaller final batch working.
	            loss = criterion(predictions.reshape(-1, num_classes), labels.reshape(-1))

	            # backward pass
	            loss.backward()
	            # update weights
	            optimizer.step()


	class PadSequence(object):
	    """Transform that pre-pads a (sequence, labels) sample with zeros.

	    Both the sequence and its labels are padded at the *front* along the
	    first axis so that every sample leaves with ``max_length`` entries.
	    """

	    def __init__(self, max_length):
	        """Store the target length.

	        Args:
	            max_length: number of frames every returned sequence will have.
	        """
	        self.max_length = max_length

	    def __call__(self, received_sample):
	        """Pad one sample.

	        Args:
	            received_sample: a ``(sample, labels)`` pair. ``sample`` is an
	                array-like whose first axis is the frame axis; ``labels`` is
	                an array-like with one entry (scalar or vector) per frame.

	        Returns:
	            A ``(sample, labels)`` tuple of float tensors whose first axis has
	            length ``max_length``.

	        Raises:
	            ValueError: if the sequence is longer than ``max_length``.
	        """
	        sample, labels = received_sample

	        # Convert the array-likes (e.g. numpy arrays) to float tensors
	        sample = torch.as_tensor(sample, dtype=torch.float32)
	        labels = torch.as_tensor(labels, dtype=torch.float32)

	        # Calculate the length the pad needs to be
	        pad_length = self.max_length - sample.size(0)
	        if pad_length < 0:
	            raise ValueError(
	                'sequence of length %d is longer than max_length %d'
	                % (sample.size(0), self.max_length))

	        # Build each pad from the tensor's own trailing shape, so 1-D per-frame
	        # labels work as well as labels with extra dimensions.
	        sample_pad = torch.zeros((pad_length,) + tuple(sample.shape[1:]), dtype=sample.dtype)
	        label_pad = torch.zeros((pad_length,) + tuple(labels.shape[1:]), dtype=labels.dtype)

	        # Concatenate the pad in front of the data (prepadded)
	        sample = torch.cat((sample_pad, sample), dim=0)
	        labels = torch.cat((label_pad, labels), dim=0)

	        return (sample, labels)


	if __name__ == '__main__':
	    # Command-line entry point: parse the arguments and start training.
	    parser = argparse.ArgumentParser(description='Train a resnet model')
	    parser.add_argument('--dataroot', required=True, type=str, help='path to the root data directory')
	    # main() reads args.max_epochs, so store the value under that name;
	    # both spellings of the flag are accepted.
	    parser.add_argument('--maxepochs', '--max_epochs', dest='max_epochs', default=100, type=int,
	                        help='number of training epochs')
	    args = parser.parse_args()

	    main(args)