# Source code for symjax.data.svhn

import scipy.io as sio
import os
from .utils import download_dataset
import numpy as np
import time


# Dataset identifier handed to ``download_dataset``; it is also the name of
# the sub-directory of the data path that ``load`` reads the files from.
_dataset = "svhn"

# Base URL handed to ``download_dataset``.
# NOTE(review): presumably each value of ``_urls`` is appended to this base
# to form the download URL -- confirm against ``download_dataset``.
_baseurl = "http://ufldl.stanford.edu/housenumbers/"

# Maps each file name to itself (key and value are identical for both files).
# NOTE(review): presumably keys are local file names and values are remote
# names -- confirm against ``download_dataset``.
_urls = {
    fname: fname for fname in ("train_32x32.mat", "test_32x32.mat")
}


def _load_split(mat_path):
    """Read one SVHN ``.mat`` file and return its ``(images, labels)`` pair.

    The ``"X"`` entry is transposed so that its last axis comes first,
    followed by its third axis and then its first two axes. The ``"y"``
    entry is squeezed and shifted down by one.
    """
    data = sio.loadmat(mat_path)
    # NOTE(review): assumes "X" is stored as (height, width, channels, N),
    # which would make the result (N, channels, height, width) -- confirm
    # against the SVHN file format.
    images = data["X"].transpose([3, 2, 0, 1])
    labels = np.squeeze(data["y"]) - 1
    return images, labels


def load(path=None):
    """Street number classification.

    The `SVHN <http://ufldl.stanford.edu/housenumbers/>`_
    dataset is a real-world
    image dataset for developing machine learning and object
    recognition algorithms with minimal requirement on data
    preprocessing and formatting. It can be seen as similar in flavor
    to MNIST (e.g., the images are of small cropped digits), but
    incorporates an order of magnitude more labeled data (over 600,000
    digit images) and comes from a significantly harder, unsolved,
    real world problem (recognizing digits and numbers in natural
    scene images). SVHN is obtained from house numbers in Google
    Street View images.

    Parameters
    ----------
        path: str (optional)
            default $DATASET_PATH, the path to look for the data and
            where the data will be downloaded if not present

    Returns
    -------

        dataset: dict
            a dictionary with the following entries

            ``"train_set/images"``: float32 array, the training images
            with the sample axis first

            ``"train_set/labels"``: int32 array, the training labels
            (stored label minus one)

            ``"test_set/images"``: float32 array, the test images
            with the sample axis first

            ``"test_set/labels"``: int32 array, the test labels
            (stored label minus one)

    Raises
    ------

        KeyError
            if ``path`` is None and the ``DATASET_PATH`` environment
            variable is not set

    Notes
    -----
    NOTE(review): the SVHN page describes stored labels as 1..10 with
    10 standing for the digit 0. If so, after the ``- 1`` shift class
    ``k`` is the digit ``k + 1`` for ``k < 9`` and class 9 is the
    digit 0 -- confirm that downstream code expects this encoding.

    """
    if path is None:
        path = os.environ["DATASET_PATH"]

    # Fetch the two .mat files into the dataset directory if needed.
    download_dataset(path, _dataset, _urls, _baseurl)

    print("Loading svhn")

    t0 = time.time()

    # os.path.join (rather than string concatenation) so that ``path``
    # works with or without a trailing separator.
    data_dir = os.path.join(path, _dataset)

    train_images, train_labels = _load_split(
        os.path.join(data_dir, "train_32x32.mat")
    )
    test_images, test_labels = _load_split(
        os.path.join(data_dir, "test_32x32.mat")
    )

    print("Dataset svhn loaded in", "{0:.2f}".format(time.time() - t0), "s.")
    dataset = {
        "train_set/images": train_images.astype("float32"),
        "train_set/labels": train_labels.astype("int32"),
        "test_set/images": test_images.astype("float32"),
        "test_set/labels": test_labels.astype("int32"),
    }
    return dataset