Commit

assignment 1 is released
kgavrilyuk committed Apr 2, 2019
1 parent 97a6719 commit 3dc4913
Showing 15 changed files with 1,448 additions and 0 deletions.
2 changes: 2 additions & 0 deletions README.md
@@ -1 +1,3 @@
# UvA Deep Learning Course Practical Assignments

- Assignment 1 is released. The deadline is **April 17th, 23:59**.
5 changes: 5 additions & 0 deletions assignment_1/README.md
@@ -0,0 +1,5 @@
# Assignment 1

You can find all necessary instructions in **assignment_1.pdf**.

We provide simple unit tests that can check your implementation. However, be aware that passing all tests does not guarantee that your implementation is correct. You can find the tests in **unittests.py**.
Binary file added assignment_1/assignment_1.pdf
Binary file not shown.
6 changes: 6 additions & 0 deletions assignment_1/code/cifar10/get_cifar10.sh
@@ -0,0 +1,6 @@
#!/usr/bin/env bash

# Get CIFAR10
wget http://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz
tar -xzvf cifar-10-python.tar.gz
rm cifar-10-python.tar.gz
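
If wget is unavailable (e.g. on Windows), the following Python sketch performs the same download and extraction; it assumes the same archive URL and extracts into the directory it is run from:

import os
import tarfile
import urllib.request

# Download the CIFAR10 python archive (same URL as the script above)
URL = 'http://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz'
ARCHIVE = 'cifar-10-python.tar.gz'
urllib.request.urlretrieve(URL, ARCHIVE)

# Extract (creates cifar-10-batches-py/) and remove the archive
with tarfile.open(ARCHIVE, 'r:gz') as tar:
    tar.extractall()
os.remove(ARCHIVE)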
230 changes: 230 additions & 0 deletions assignment_1/code/cifar10_utils.py
@@ -0,0 +1,230 @@
"""
This module implements utility functions for downloading and reading CIFAR10 data.
You don't need to change anything here.
"""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import numpy as np
import os
import pickle

# Default path to the extracted CIFAR10 data
CIFAR10_FOLDER = 'cifar10/cifar-10-batches-py'

def load_cifar10_batch(batch_filename):
    """
    Loads a single batch of CIFAR10 data.
    Args:
        batch_filename: Filename of batch to get data from.
    Returns:
        X: CIFAR10 batch data in numpy array with shape (10000, 32, 32, 3).
        Y: CIFAR10 batch labels in numpy array with shape (10000, ).
    """
    with open(batch_filename, 'rb') as f:
        batch = pickle.load(f, encoding='latin1')
        X = batch['data']
        Y = batch['labels']
        X = X.reshape(10000, 3, 32, 32).transpose(0, 2, 3, 1).astype(np.float32)
        Y = np.array(Y)
        return X, Y

def load_cifar10(cifar10_folder):
    """
    Loads CIFAR10 train and test splits.
    Args:
        cifar10_folder: Folder which contains the downloaded CIFAR10 data.
    Returns:
        X_train: CIFAR10 train data in numpy array with shape (50000, 32, 32, 3).
        Y_train: CIFAR10 train labels in numpy array with shape (50000, ).
        X_test: CIFAR10 test data in numpy array with shape (10000, 32, 32, 3).
        Y_test: CIFAR10 test labels in numpy array with shape (10000, ).
    """
    Xs = []
    Ys = []
    for b in range(1, 6):
        batch_filename = os.path.join(cifar10_folder, 'data_batch_' + str(b))
        X, Y = load_cifar10_batch(batch_filename)
        Xs.append(X)
        Ys.append(Y)
    X_train = np.concatenate(Xs)
    Y_train = np.concatenate(Ys)
    X_test, Y_test = load_cifar10_batch(os.path.join(cifar10_folder, 'test_batch'))
    return X_train, Y_train, X_test, Y_test

def get_cifar10_raw_data(data_dir):
    """
    Loads raw CIFAR10 data (as downloaded from
    http://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz) from data_dir.
    Args:
        data_dir: Data directory.
    Returns:
        X_train: CIFAR10 train data in numpy array with shape (50000, 32, 32, 3).
        Y_train: CIFAR10 train labels in numpy array with shape (50000, ).
        X_test: CIFAR10 test data in numpy array with shape (10000, 32, 32, 3).
        Y_test: CIFAR10 test labels in numpy array with shape (10000, ).
    """
    X_train, Y_train, X_test, Y_test = load_cifar10(data_dir)
    return X_train, Y_train, X_test, Y_test

def preprocess_cifar10_data(X_train_raw, Y_train_raw, X_test_raw, Y_test_raw):
    """
    Preprocesses CIFAR10 data by subtracting the mean image from all images.
    Args:
        X_train_raw: CIFAR10 raw train data in numpy array.
        Y_train_raw: CIFAR10 raw train labels in numpy array.
        X_test_raw: CIFAR10 raw test data in numpy array.
        Y_test_raw: CIFAR10 raw test labels in numpy array.
    Returns:
        X_train: CIFAR10 train data in numpy array.
        Y_train: CIFAR10 train labels in numpy array.
        X_test: CIFAR10 test data in numpy array.
        Y_test: CIFAR10 test labels in numpy array.
    """
    X_train = X_train_raw.copy()
    Y_train = Y_train_raw.copy()
    X_test = X_test_raw.copy()
    Y_test = Y_test_raw.copy()

    # Subtract the mean image computed on the train split
    mean_image = np.mean(X_train, axis=0)
    X_train -= mean_image
    X_test -= mean_image

    # Transpose from NHWC to NCHW, the layout PyTorch expects
    X_train = X_train.transpose(0, 3, 1, 2).astype(np.float32)
    X_test = X_test.transpose(0, 3, 1, 2).astype(np.float32)
    return X_train, Y_train, X_test, Y_test

def dense_to_one_hot(labels_dense, num_classes):
    """
    Converts class labels from scalars to one-hot vectors.
    Args:
        labels_dense: Dense labels.
        num_classes: Number of classes.
    Returns:
        labels_one_hot: One-hot encoding for labels.
    """
    num_labels = labels_dense.shape[0]
    index_offset = np.arange(num_labels) * num_classes
    labels_one_hot = np.zeros((num_labels, num_classes))
    labels_one_hot.flat[index_offset + labels_dense.ravel()] = 1
    return labels_one_hot
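
# For example (a small illustration of the encoding above):
#   dense_to_one_hot(np.array([0, 2, 1]), num_classes=3)
#   -> array([[1., 0., 0.],
#             [0., 0., 1.],
#             [0., 1., 0.]])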

class DataSet(object):
    """
    Utility class to handle dataset structure.
    """

    def __init__(self, images, labels):
        """
        Builds dataset with images and labels.
        Args:
            images: Images data.
            labels: Labels data.
        """
        assert images.shape[0] == labels.shape[0], (
            "images.shape: {0}, labels.shape: {1}".format(str(images.shape), str(labels.shape)))

        self._num_examples = images.shape[0]
        self._images = images
        self._labels = labels
        self._epochs_completed = 0
        self._index_in_epoch = 0

    @property
    def images(self):
        return self._images

    @property
    def labels(self):
        return self._labels

    @property
    def num_examples(self):
        return self._num_examples

    @property
    def epochs_completed(self):
        return self._epochs_completed

    def next_batch(self, batch_size):
        """
        Returns the next `batch_size` examples from this data set.
        Args:
            batch_size: Batch size.
        Returns:
            Tuple of images and labels for the next batch.
        """
        start = self._index_in_epoch
        self._index_in_epoch += batch_size
        if self._index_in_epoch > self._num_examples:
            # Epoch finished: reshuffle the data and start the next epoch
            self._epochs_completed += 1

            perm = np.arange(self._num_examples)
            np.random.shuffle(perm)
            self._images = self._images[perm]
            self._labels = self._labels[perm]

            start = 0
            self._index_in_epoch = batch_size
            assert batch_size <= self._num_examples

        end = self._index_in_epoch
        return self._images[start:end], self._labels[start:end]
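
# Example usage of DataSet (a sketch; shapes assume preprocessed CIFAR10
# with one-hot labels):
#   ds = DataSet(train_images, train_labels)
#   x, y = ds.next_batch(128)  # x: (128, 3, 32, 32), y: (128, 10)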

def read_data_sets(data_dir, one_hot=True, validation_size=0):
    """
    Returns the dataset read from data_dir.
    Optionally applies one-hot encoding to the labels and
    subsamples a validation set of the specified size from the train set.
    Args:
        data_dir: Data directory.
        one_hot: Flag for one-hot encoding.
        validation_size: Size of the validation set.
    Returns:
        Dictionary with train, validation and test DataSets.
    """
    # Extract CIFAR10 data
    train_images_raw, train_labels_raw, test_images_raw, test_labels_raw = \
        get_cifar10_raw_data(data_dir)
    train_images, train_labels, test_images, test_labels = \
        preprocess_cifar10_data(train_images_raw, train_labels_raw, test_images_raw, test_labels_raw)

    # Apply one-hot encoding if specified
    if one_hot:
        num_classes = len(np.unique(train_labels))
        train_labels = dense_to_one_hot(train_labels, num_classes)
        test_labels = dense_to_one_hot(test_labels, num_classes)

    # Subsample the validation set from the train set
    if not 0 <= validation_size <= len(train_images):
        raise ValueError("Validation size should be between 0 and {0}. Received: {1}.".format(
            len(train_images), validation_size))

    validation_images = train_images[:validation_size]
    validation_labels = train_labels[:validation_size]
    train_images = train_images[validation_size:]
    train_labels = train_labels[validation_size:]

    # Create datasets
    train = DataSet(train_images, train_labels)
    validation = DataSet(validation_images, validation_labels)
    test = DataSet(test_images, test_labels)

    return {'train': train, 'validation': validation, 'test': test}

def get_cifar10(data_dir=CIFAR10_FOLDER, one_hot=True, validation_size=0):
    """
    Prepares the CIFAR10 dataset.
    Args:
        data_dir: Data directory.
        one_hot: Flag for one-hot encoding.
        validation_size: Size of the validation set.
    Returns:
        Dictionary with train, validation and test DataSets.
    """
    return read_data_sets(data_dir, one_hot, validation_size)
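
# Minimal usage sketch (illustration only, not part of the assignment; assumes
# cifar10/get_cifar10.sh has already been run to download the data):
if __name__ == '__main__':
    cifar10 = get_cifar10(validation_size=5000)
    x, y = cifar10['train'].next_batch(batch_size=128)
    print(x.shape, y.shape)  # expected: (128, 3, 32, 32) (128, 10)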
59 changes: 59 additions & 0 deletions assignment_1/code/convnet_pytorch.py
@@ -0,0 +1,59 @@
"""
This module implements a Convolutional Neural Network in PyTorch.
You should fill in code into indicated sections.
"""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

class ConvNet(nn.Module):
    """
    This class implements a Convolutional Neural Network in PyTorch.
    It handles the different layers and parameters of the model.
    Once initialized, a ConvNet object can perform a forward pass.
    """

    def __init__(self, n_channels, n_classes):
        """
        Initializes the ConvNet object.
        Args:
            n_channels: number of input channels
            n_classes: number of classes of the classification problem
        TODO:
        Implement initialization of the network.
        """

        ########################
        # PUT YOUR CODE HERE  #
        #######################
        raise NotImplementedError
        ########################
        # END OF YOUR CODE    #
        #######################

    def forward(self, x):
        """
        Performs a forward pass of the input. Here an input tensor x is transformed through
        several layer transformations.
        Args:
            x: input to the network
        Returns:
            out: outputs of the network
        TODO:
        Implement forward pass of the network.
        """

        ########################
        # PUT YOUR CODE HERE  #
        #######################
        raise NotImplementedError
        ########################
        # END OF YOUR CODE    #
        #######################

        return out
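
# Usage sketch once the TODOs are implemented (illustration only; CIFAR10
# inputs have 3 channels and 10 classes):
#   import torch
#   model = ConvNet(n_channels=3, n_classes=10)
#   out = model(torch.randn(8, 3, 32, 32))  # expected out.shape: (8, 10)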

0 comments on commit 3dc4913
