Initial Commit

2024-03-11 13:00:35 +00:00 · 2024-03-11 13:00:35 +00:00 · 8027439bc1
commit 8027439bc1
18 changed files with 1512 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,4 @@
+.ipynb_checkpoints
+data/EXCV10
+data/MaskedFace
+__pycache__
--- a/ECMM426.pdf
+++ b/ECMM426.pdf
--- a/1.ipynb
+++ b/1.ipynb
--- a/2.ipynb
+++ b/2.ipynb
@ -0,0 +1,419 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "f96d2a83",
+   "metadata": {},
+   "source": [
+    "## Question 2 (20 marks)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "6f53891a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import cv2\n",
+    "import numpy as np"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "d3bbb31a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "n_clusters = 100"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "28068e50",
+   "metadata": {},
+   "source": [
+    "Read images"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "87dd5c72",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "im_book = cv2.imread('data/books.jpg', cv2.IMREAD_GRAYSCALE)\n",
+    "im_mount = cv2.imread('data/mount_rushmore_1.jpg', cv2.IMREAD_GRAYSCALE)\n",
+    "im_notre = cv2.imread('data/notre_dame_1.jpg', cv2.IMREAD_GRAYSCALE)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "79c57454",
+   "metadata": {},
+   "source": [
+    "## Generate Clusters"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "2e571277",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def get_features(image):\n",
+    "    image = image[:, :, np.newaxis]\n",
+    "\n",
+    "    # Initialize a SIFT detector\n",
+    "    sift = cv2.SIFT_create()\n",
+    "\n",
+    "    # Detect keypoints and compute descriptors\n",
+    "    keypoints, descriptors = sift.detectAndCompute(image, None)\n",
+    "\n",
+    "    return keypoints, descriptors"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "12d042c8",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from sklearn.cluster import KMeans\n",
+    "\n",
+    "def get_clusters(keypoints, descriptors, n_clusters=100):\n",
+    "\n",
+    "    # Perform k-means clustering\n",
+    "    kmeans = KMeans(n_clusters=n_clusters, random_state=42, n_init=10)\n",
+    "    kmeans.fit(descriptors)\n",
+    "\n",
+    "    # Assign descriptors to clusters\n",
+    "    clusters = kmeans.predict(descriptors)\n",
+    "\n",
+    "    # Convert keypoints to locations (x, y coordinates)\n",
+    "    locations = np.array([kp.pt for kp in keypoints], dtype=np.int64)\n",
+    "    \n",
+    "    return clusters, locations"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "b04681a0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "kpts_book, des_book = get_features(im_book)\n",
+    "kpts_mount, des_mount = get_features(im_mount)\n",
+    "kpts_notre, des_notre = get_features(im_notre)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "70d23c90",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "clusters_book, locations_book = get_clusters(kpts_book, des_book, n_clusters=n_clusters)\n",
+    "clusters_mount, locations_mount = get_clusters(kpts_mount, des_mount, n_clusters=n_clusters)\n",
+    "clusters_notre, locations_notre = get_clusters(kpts_notre, des_notre, n_clusters=n_clusters)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "1518e19f",
+   "metadata": {},
+   "source": [
+    "## Method 1 (Two FOR loops)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "04f3901b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def m1_generate_bovw_spatial_histogram(im, locations, clusters, division):\n",
+    "    \"\"\"\n",
+    "    Create bag of visual words representation of an image based on the division information.\n",
+    "    \n",
+    "    Parameters:\n",
+    "    im (numpy.ndarray): Image array of data type uint8.\n",
+    "    locations (numpy.ndarray): Array of shape (N, 2) with Cartesian coordinates (x, y).\n",
+    "    clusters (numpy.ndarray): Array of shape (N,) with quantised cluster id.\n",
+    "    division (list): List of integers of length 2 indicating division along Y and X axes.\n",
+    "    \n",
+    "    Returns:\n",
+    "    numpy.ndarray: 1-dimensional array representing the BoVW spatial histogram.\n",
+    "    \"\"\"\n",
+    "\n",
+    "    # Determine the size of each division\n",
+    "    div_height = im.shape[0] // division[0]\n",
+    "    div_width = im.shape[1] // division[1]\n",
+    "    \n",
+    "    # Initialize the histogram\n",
+    "    num_clusters = np.unique(clusters).size\n",
+    "    histogram = np.zeros((division[0] * division[1] * num_clusters,), dtype=np.int64)\n",
+    "\n",
+    "    # Two FOR loops\n",
+    "    for div_y in range(division[0]):\n",
+    "        for div_x in range(division[1]):\n",
+    "            # Define the bounds of the current division\n",
+    "            y_start = div_y * div_height\n",
+    "            y_end = (div_y + 1) * div_height\n",
+    "            x_start = div_x * div_width\n",
+    "            x_end = (div_x + 1) * div_width\n",
+    "\n",
+    "            # Find features within the current division\n",
+    "            div_mask = (locations[:, 1] >= y_start) & (locations[:, 1] < y_end) & \\\n",
+    "                       (locations[:, 0] >= x_start) & (locations[:, 0] < x_end)\n",
+    "            div_locations = locations[div_mask]\n",
+    "            div_clusters = clusters[div_mask]\n",
+    "\n",
+    "            # Calculate the histogram for the current division\n",
+    "            for i in range(num_clusters):\n",
+    "                cluster_mask = (div_clusters == i)\n",
+    "                histogram[div_y * division[1] * num_clusters + div_x * num_clusters + i] = np.sum(cluster_mask)\n",
+    "    \n",
+    "    return histogram"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "0f64e74a",
+   "metadata": {},
+   "source": [
+    "## Method 2 (One FOR loop)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "a597d45d",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def m2_generate_bovw_spatial_histogram(im, locations, clusters, division):\n",
+    "\n",
+    "    img_shape = np.shape(im)\n",
+    "\n",
+    "    height = img_shape[0]\n",
+    "    width = img_shape[1]\n",
+    "\n",
+    "    ## Possible Mistakes: Some students swapped x and y\n",
+    "    div_x = division[1]\n",
+    "    div_y = division[0]\n",
+    "\n",
+    "    x_size = width / div_x\n",
+    "    y_size = height / div_y\n",
+    "\n",
+    "    num_divisions = division[0] * division[1]\n",
+    "\n",
+    "    num_clusters = np.max(clusters) + 1\n",
+    "\n",
+    "    histogram = np.zeros(num_clusters * num_divisions)\n",
+    "\n",
+    "    # One FOR loop\n",
+    "    for i in range(len(locations)):\n",
+    "        point = locations[i]\n",
+    "        cluster = clusters[i]\n",
+    "\n",
+    "        x_div = np.ceil((point[0] + 1) / x_size).astype(np.int64) - 1\n",
+    "        y_div = np.ceil((point[1] + 1) / y_size).astype(np.int64) - 1\n",
+    "\n",
+    "        # Possible Mistakes: Some students miscalculated the boundary condition\n",
+    "        # x_div = np.ceil(point[0] / x_size).astype(np.int64) - 1\n",
+    "        # y_div = np.ceil(point[1] / y_size).astype(np.int64) - 1\n",
+    "\n",
+    "        # Calculate the array position\n",
+    "        div = x_div + (y_div * div_x)\n",
+    "        array_pos = (div * num_clusters) + cluster\n",
+    "        \n",
+    "        # Update the histogram\n",
+    "        histogram[array_pos] = histogram[array_pos] + 1\n",
+    "\n",
+    "    return histogram.astype(int)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "36f2fe5e",
+   "metadata": {},
+   "source": [
+    "## Put students' implementations here"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "3804d695",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Be careful, some students used a different function name (e.g. bowv rather than bovw)\n",
+    "def generate_bovw_spatial_histogram(im, locations, clusters, division):\n",
+    "    # Determine the number of clusters\n",
+    "    num_clusters = np.unique(clusters).size\n",
+    "\n",
+    "    # Initialize histogram\n",
+    "    spatial_histogram = np.zeros(num_clusters * np.prod(division), dtype=np.int64)\n",
+    "\n",
+    "    div_size_y = im.shape[0] // division[0]\n",
+    "    div_size_x = im.shape[1] // division[1]\n",
+    "\n",
+    "    for div_y in range(division[0]):\n",
+    "        for div_x in range(division[1]):\n",
+    "            start_y = div_y * div_size_y\n",
+    "            end_y = (div_y + 1) * div_size_y if div_y < division[0] - 1 else im.shape[0]\n",
+    "            start_x = div_x * div_size_x\n",
+    "            end_x = (div_x + 1) * div_size_x if div_x < division[1] - 1 else im.shape[1]\n",
+    "            for loc, cluster_id in zip(locations, clusters):\n",
+    "                x, y = loc\n",
+    "                if start_y <= y < end_y and start_x <= x < end_x:\n",
+    "                    index = (div_y * division[1] + div_x) * num_clusters + cluster_id\n",
+    "                    spatial_histogram[index] += 1\n",
+    "    return spatial_histogram"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "0d516e6a",
+   "metadata": {},
+   "source": [
+    "## Test (Should output ALL PASS)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a269b35f",
+   "metadata": {},
+   "source": [
+    "Restart and Run ALL for each submission"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "95d72a5c",
+   "metadata": {
+    "scrolled": true
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Testing division: [1, 1]\n",
+      "PASS: Book\n",
+      "PASS: Mount\n",
+      "PASS: Notre\n",
+      "Testing division: [2, 2]\n",
+      "PASS: Book\n",
+      "PASS: Mount\n",
+      "PASS: Notre\n",
+      "Testing division: [2, 3]\n",
+      "PASS: Book\n",
+      "PASS: Mount\n",
+      "PASS: Notre\n",
+      "ALL PASS\n"
+     ]
+    }
+   ],
+   "source": [
+    "histograms = []\n",
+    "for division in [ [1, 1], [2, 2], [2, 3] ]:\n",
+    "    print('Testing division:', division)\n",
+    "\n",
+    "    m1_histogram_book = m1_generate_bovw_spatial_histogram(im_book, locations_book, clusters_book, division)\n",
+    "    m1_histogram_mount = m1_generate_bovw_spatial_histogram(im_mount, locations_mount, clusters_mount, division)\n",
+    "    m1_histogram_notre = m1_generate_bovw_spatial_histogram(im_notre, locations_notre, clusters_notre, division)\n",
+    "\n",
+    "    m2_histogram_book = m2_generate_bovw_spatial_histogram(im_book, locations_book, clusters_book, division)\n",
+    "    m2_histogram_mount = m2_generate_bovw_spatial_histogram(im_mount, locations_mount, clusters_mount, division)\n",
+    "    m2_histogram_notre = m2_generate_bovw_spatial_histogram(im_notre, locations_notre, clusters_notre, division)\n",
+    "\n",
+    "    # Students' implementations\n",
+    "    histogram_book = generate_bovw_spatial_histogram(im_book, locations_book, clusters_book, division)\n",
+    "    histogram_mount = generate_bovw_spatial_histogram(im_mount, locations_mount, clusters_mount, division)\n",
+    "    histogram_notre = generate_bovw_spatial_histogram(im_notre, locations_notre, clusters_notre, division)\n",
+    "    \n",
+    "    assert np.allclose(m1_histogram_book, m2_histogram_book)\n",
+    "    assert np.allclose(m1_histogram_book, histogram_book)\n",
+    "    print(\"PASS: Book\")\n",
+    "\n",
+    "    assert np.allclose(m1_histogram_mount, m2_histogram_mount)\n",
+    "    assert np.allclose(m1_histogram_mount, histogram_mount)\n",
+    "    print(\"PASS: Mount\")\n",
+    "\n",
+    "    assert np.allclose(m1_histogram_notre, m2_histogram_notre)\n",
+    "    assert np.allclose(m1_histogram_notre, histogram_notre)\n",
+    "    print(\"PASS: Notre\")\n",
+    "\n",
+    "    histograms.append( [m1_histogram_book, m1_histogram_mount, m1_histogram_notre] )\n",
+    "print(\"ALL PASS\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "00a11df8",
+   "metadata": {},
+   "source": [
+    "## Save Output"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "ea1fadb1",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "D:\\Anaconda3\\envs\\what\\lib\\site-packages\\numpy\\lib\\npyio.py:521: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n",
+      "  arr = np.asanyarray(arr)\n"
+     ]
+    }
+   ],
+   "source": [
+    "np.save('data/question_3_histogram.npy', histograms)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "ddc3036c",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "what",
+   "language": "python",
+   "name": "what"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.16"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
--- a/3.ipynb
+++ b/3.ipynb
@ -0,0 +1,224 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "924a2a50",
+   "metadata": {},
+   "source": [
+    "## Question 3 (10 marks)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "2b3d1ba2",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import numpy as np"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "478bad7a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "points = np.load('data/points.npy').astype(np.uint8)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "e07b0285",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def compute_rotation_matrix(points, theta):\n",
+    "    \"\"\"\n",
+    "    Write a function compute_rotation_matrix(points, theta) to compute the rotation matrix in\n",
+    "    homogeneous coordinate system to rotate a shape depicted with 2-dimensional (x,y) coordinates\n",
+    "    points with an angle 𝜃 (theta in the definition) in the anticlockwise direction about the centre of the shape.\n",
+    "\n",
+    "    Parameters:\n",
+    "    points: a 2-dimensional numpy array of data type uint8 with shape 𝑘 × 2. Each row\n",
+    "    of points is a Cartesian coordinate (x, y).\n",
+    "    \n",
+    "    theta: a floating-point number denoting the angle of rotation in degree.\n",
+    "    \n",
+    "    Returns:\n",
+    "    The expected output is a 2-dimensional numpy array of data type float64 with shape 3 × 3.\n",
+    "    \"\"\"\n",
+    "\n",
+    "    # Convert theta from degrees to radians\n",
+    "    theta_rad = np.radians(theta)\n",
+    "\n",
+    "    # Calculate the centre of the shape\n",
+    "    centre = np.mean(points, axis=0)\n",
+    "\n",
+    "    # Define the translation matrices to move the centre of the shape to the origin and back\n",
+    "    translation_to_origin = np.array([[1, 0, -centre[0]],\n",
+    "                                      [0, 1, -centre[1]],\n",
+    "                                      [0, 0, 1]], dtype=np.float64)\n",
+    "\n",
+    "    translation_back = np.array([[1, 0, centre[0]],\n",
+    "                                 [0, 1, centre[1]],\n",
+    "                                 [0, 0, 1]], dtype=np.float64)\n",
+    "\n",
+    "    # Define the rotation matrix about the origin\n",
+    "    rotation = np.array([[np.cos(theta_rad), -np.sin(theta_rad), 0],\n",
+    "                         [np.sin(theta_rad),  np.cos(theta_rad), 0],\n",
+    "                         [0,                 0,                1]], dtype=np.float64)\n",
+    "\n",
+    "    # Combine the translation and rotation into a single transformation matrix\n",
+    "    rotation_matrix = np.dot(np.dot(translation_back, rotation), translation_to_origin)\n",
+    "    \n",
+    "    return rotation_matrix"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "16ef4247",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "rotation_matrices = []\n",
+    "\n",
+    "for t in range(0, 365, 5):\n",
+    "    rotation_matrices.append( compute_rotation_matrix(points, t) )"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a130c201",
+   "metadata": {},
+   "source": [
+    "## Save Output"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "23967b5d",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "np.save('data/question_3_rotation_matrices.npy', rotation_matrices)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a808d8a4",
+   "metadata": {},
+   "source": [
+    "## Put students' implementations here"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "b0836f8d",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def compute_rotation_matrix(points, theta):\n",
+    "    # Convert points to float64\n",
+    "    points = points.astype(np.float64)\n",
+    "    # Calculate centre\n",
+    "    centre = np.mean(points, axis=0)\n",
+    "    # Compute rotation matrix\n",
+    "    rotation_matrix = np.array([[np.cos(np.radians(theta)), -np.sin(np.radians(theta)), 0],\n",
+    "                                [np.sin(np.radians(theta)), np.cos(np.radians(theta)), 0],\n",
+    "                                [0, 0, 1]])\n",
+    "    # Translation matrix to origin\n",
+    "    translation_to_origin = np.array([[1, 0, -centre[0]],\n",
+    "                                      [0, 1, -centre[1]],\n",
+    "                                      [0, 0, 1]])\n",
+    "    # Translation matrix to original position\n",
+    "    translation_to_centre = np.array([[1, 0, centre[0]],\n",
+    "                                         [0, 1, centre[1]],\n",
+    "                                         [0, 0, 1]])\n",
+    "    # Combine transformations with data type float64 \n",
+    "    combined_matrix = np.dot(np.dot(translation_to_centre, rotation_matrix), translation_to_origin).astype(np.float64)\n",
+    "    return combined_matrix\n",
+    "\n",
+    "    return 0"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "73b68192",
+   "metadata": {},
+   "source": [
+    "## Test (Should output ALL PASS)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "1c0a88a6",
+   "metadata": {},
+   "source": [
+    "Restart and Run ALL for each submission"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "132d734b",
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "73 PASS\n",
+      "ALL PASS\n"
+     ]
+    }
+   ],
+   "source": [
+    "n_pass = 0\n",
+    "for t in range(0, 365, 5):\n",
+    "    if np.allclose(compute_rotation_matrix(points, t), rotation_matrices[int(t / 5)]):\n",
+    "        n_pass = n_pass + 1\n",
+    "\n",
+    "print(n_pass, \"PASS\")\n",
+    "assert n_pass == len(rotation_matrices)\n",
+    "print(\"ALL PASS\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "0fac308a",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "what",
+   "language": "python",
+   "name": "what"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.16"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
--- a/README.md
+++ b/README.md
@ -0,0 +1,2 @@
+## ECMM426 Template
+
--- a/ca_utils.py
+++ b/ca_utils.py
@ -0,0 +1,187 @@
+import cv2
+import math
+import torch
+import pickle
+import numpy as np
+import torch.nn as nn
+import torch.nn.functional as F
+
+def im2single(im):
+    im = im.astype(np.float32) / 255
+    return im
+
+def single2im(im):
+    im *= 255
+    im = im.astype(np.uint8)
+    return im
+
+def load_interest_points(eval_file):
+    """
+    This function is provided for development and debugging but cannot be used in
+    the final handin. It 'cheats' by generating interest points from known
+    correspondences. It will only work for the 3 image pairs with known
+    correspondences.
+
+    Args:
+    - eval_file: string representing the file path to the list of known correspondences
+    - scale_factor: Python float representing the scale needed to map from the original
+            image coordinates to the resolution being used for the current experiment.
+
+    Returns:
+    - x1: A numpy array of shape (k,) containing ground truth x-coordinates of imgA correspondence pts
+    - y1: A numpy array of shape (k,) containing ground truth y-coordinates of imgA correspondence pts
+    - x2: A numpy array of shape (k,) containing ground truth x-coordinates of imgB correspondence pts
+    - y2: A numpy array of shape (k,) containing ground truth y-coordinates of imgB correspondence pts
+    """
+    with open(eval_file, 'rb') as f:
+        d = pickle.load(f, encoding='latin1')
+    scale_factor = 1.0
+    return d['x1'] * scale_factor, d['y1'] * scale_factor, d['x2'] * scale_factor, d['y2'] * scale_factor
+
+def show_interest_points(img, X, Y):
+    """
+    Visualized interest points on an image with random colors
+
+    Args:
+    - img: A numpy array of shape (M,N,C)
+    - X: A numpy array of shape (k,) containing x-locations of interest points
+    - Y: A numpy array of shape (k,) containing y-locations of interest points
+
+    Returns:
+    - newImg: A numpy array of shape (M,N,C) showing the original image with
+            colored circles at keypoints plotted on top of it
+    """
+    newImg = img.copy()
+    for x, y in zip(X.astype(int), Y.astype(int)):
+        cur_color = np.random.rand(3)
+        newImg = cv2.circle(newImg, (int(x), int(y)), 10, cur_color, -1)
+    return newImg
+
+def conv3x3(in_planes, out_planes, stride=1):
+    """
+    3x3 convolution with padding
+    """
+    return nn.Conv2d(in_planes, out_planes, kernel_size=3, stride=stride, padding=1, bias=False)
+
+class BasicBlock(nn.Module):
+    expansion = 1
+
+    def __init__(self, inplanes, planes, stride=1, downsample=None):
+        super(BasicBlock, self).__init__()
+        self.conv1 = conv3x3(inplanes, planes, stride)
+        self.bn1 = nn.BatchNorm2d(planes)
+        self.relu = nn.ReLU(inplace=True)
+        self.conv2 = conv3x3(planes, planes)
+        self.bn2 = nn.BatchNorm2d(planes)
+        self.downsample = downsample
+        self.stride = stride
+
+    def forward(self, x):
+        out = self.conv1(x)
+        out = self.bn1(out)
+        out = self.relu(out)
+        out = self.conv2(out)
+        out = self.bn2(out)
+
+        if self.downsample is not None:
+            residual = self.downsample(x)
+        else:
+            residual = x
+
+        out += residual
+        out = self.relu(out)
+        return out
+
+class Bottleneck(nn.Module):
+    expansion = 4
+
+    def __init__(self, inplanes, planes, stride=1, downsample=None):
+        super(Bottleneck, self).__init__()
+        self.conv1 = nn.Conv2d(inplanes, planes, kernel_size=1, bias=False)
+        self.bn1 = nn.BatchNorm2d(planes)
+        self.conv2 = nn.Conv2d(planes, planes, kernel_size=3, stride=stride, padding=1, bias=False)
+        self.bn2 = nn.BatchNorm2d(planes)
+        self.conv3 = nn.Conv2d(planes, planes*4, kernel_size=1, bias=False)
+        self.bn3 = nn.BatchNorm2d(planes*4)
+        self.relu = nn.ReLU(inplace=True)
+        self.downsample = downsample
+        self.stride = stride
+
+    def forward(self, x):
+        out = self.conv1(x)
+        out = self.bn1(out)
+        out = self.relu(out)
+
+        out = self.conv2(out)
+        out = self.bn2(out)
+        out = self.relu(out)
+
+        out = self.conv3(out)
+        out = self.bn3(out)
+
+        if self.downsample is not None:
+            residual = self.downsample(x)
+        else:
+            residual = x
+
+        out += residual
+        out = self.relu(out)
+        return out
+
+class ResNet(nn.Module):
+
+    def __init__(self, block, layers, in_channels=3, channels=[16, 32, 64], num_classes=10, flatten=True):
+        super(ResNet, self).__init__()
+        self.name = "resnet"
+        self.flatten = flatten
+        self.channels = channels
+        self.inplanes = channels[0]
+        self.conv1 = nn.Conv2d(in_channels, channels[0], kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
+        self.bn1 = nn.BatchNorm2d(channels[0])
+        self.relu = nn.ReLU(inplace=True)
+        self.layer1 = self._make_layer(block, channels[0], layers[0])
+        self.layer2 = self._make_layer(block, channels[1], layers[1], stride=2)
+        self.layer3 = self._make_layer(block, channels[2], layers[2], stride=2)
+        self.avgpool = nn.AdaptiveAvgPool2d(1)  # global pooling
+        self.fc = nn.Linear(channels[2], num_classes)  # global pooling
+        if flatten:
+            self.feature_size = channels[2]*block.expansion
+
+        for m in self.modules():
+            if isinstance(m, nn.Conv2d):
+                n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
+                m.weight.data.normal_(0, math.sqrt(2. / n))
+            elif isinstance(m, nn.BatchNorm2d):
+                m.weight.data.fill_(1)
+                m.bias.data.zero_()
+
+    def _make_layer(self, block, planes, blocks, stride=1):
+        downsample = None
+        if stride != 1 or self.inplanes != planes * block.expansion:
+            downsample = nn.Sequential(
+                nn.Conv2d(self.inplanes, planes * block.expansion, kernel_size=1, stride=stride, bias=False),
+                nn.BatchNorm2d(planes * block.expansion)
+            )
+
+        layers = []
+        layers.append(block(self.inplanes, planes, stride, downsample))
+        self.inplanes = planes * block.expansion
+        for _ in range(1, blocks):
+            layers.append(block(self.inplanes, planes))
+
+        return nn.Sequential(*layers)
+
+    def forward(self, x):
+        x = self.conv1(x)
+        x = self.bn1(x)
+        x = self.relu(x)
+
+        x = self.layer1(x)
+        x = self.layer2(x)
+        x = self.layer3(x)
+
+        if self.flatten:
+            x = self.avgpool(x)
+            x = torch.flatten(x, 1)
+            x = self.fc(x)
+        return x
--- a/data/books.jpg
+++ b/data/books.jpg
--- a/data/mask.png
+++ b/data/mask.png
--- a/data/mount_rushmore_1.jpg
+++ b/data/mount_rushmore_1.jpg
--- a/data/notre_dame_1.jpg
+++ b/data/notre_dame_1.jpg
--- a/data/points.npy
+++ b/data/points.npy
--- a/data/question1_direction.npy
+++ b/data/question1_direction.npy
--- a/data/question1_magnitude.npy
+++ b/data/question1_magnitude.npy
--- a/data/question_3.npy
+++ b/data/question_3.npy
--- a/data/question_3_histogram.npy
+++ b/data/question_3_histogram.npy
--- a/data/question_3_rotation_matrices.npy
+++ b/data/question_3_rotation_matrices.npy
--- a/data/shapes.png
+++ b/data/shapes.png