DaSE-Computer-Vision-2021

from __future__ import print_function

from builtins import range
from six.moves import cPickle as pickle
import numpy as np
import os
from imageio import imread
import platform


def load_pickle(f):
    version = platform.python_version_tuple()
    if version[0] == '2':
        return pickle.load(f)
    elif version[0] == '3':
        return pickle.load(f, encoding='latin1')
    raise ValueError("invalid python version: {}".format(version))
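
# Usage sketch (illustrative, not from the original file): load_pickle expects
# an already-open binary file handle and hides the Python 2/3 encoding
# difference, e.g.
#
#   with open('daseCV/datasets/cifar-10-batches-py/data_batch_1', 'rb') as f:
#       batch = load_pickle(f)  # dict with raw 'data' and 'labels' entries
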
def load_CIFAR_batch(filename):
    """ load single batch of cifar """
    with open(filename, 'rb') as f:
        datadict = load_pickle(f)
        X = datadict['data']
        Y = datadict['labels']
        X = X.reshape(10000, 3, 32, 32).transpose(0, 2, 3, 1).astype("float")
        Y = np.array(Y)
        return X, Y
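
# Usage sketch: each CIFAR-10 batch file holds 10000 images, so
#
#   X, Y = load_CIFAR_batch('daseCV/datasets/cifar-10-batches-py/data_batch_1')
#
# yields X with shape (10000, 32, 32, 3) (channels last) and Y with shape (10000,).
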
def load_CIFAR10(ROOT):
    """ load all of cifar """
    xs = []
    ys = []
    for b in range(1, 6):
        f = os.path.join(ROOT, 'data_batch_%d' % (b, ))
        X, Y = load_CIFAR_batch(f)
        xs.append(X)
        ys.append(Y)
    Xtr = np.concatenate(xs)
    Ytr = np.concatenate(ys)
    del X, Y
    Xte, Yte = load_CIFAR_batch(os.path.join(ROOT, 'test_batch'))
    return Xtr, Ytr, Xte, Yte
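
# Usage sketch: load_CIFAR10 concatenates the five training batches and loads
# the test batch, e.g.
#
#   Xtr, Ytr, Xte, Yte = load_CIFAR10('daseCV/datasets/cifar-10-batches-py')
#   # Xtr: (50000, 32, 32, 3), Ytr: (50000,)
#   # Xte: (10000, 32, 32, 3), Yte: (10000,)
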
def get_CIFAR10_data(num_training=49000, num_validation=1000, num_test=1000,
                     subtract_mean=True):
    """
    Load the CIFAR-10 dataset from disk and perform preprocessing to prepare
    it for classifiers. These are the same steps as we used for the SVM, but
    condensed to a single function.
    """
    # Load the raw CIFAR-10 data
    cifar10_dir = 'daseCV/datasets/cifar-10-batches-py'
    X_train, y_train, X_test, y_test = load_CIFAR10(cifar10_dir)

    # Subsample the data
    mask = list(range(num_training, num_training + num_validation))
    X_val = X_train[mask]
    y_val = y_train[mask]
    mask = list(range(num_training))
    X_train = X_train[mask]
    y_train = y_train[mask]
    mask = list(range(num_test))
    X_test = X_test[mask]
    y_test = y_test[mask]

    # Normalize the data: subtract the mean image
    if subtract_mean:
        mean_image = np.mean(X_train, axis=0)
        X_train -= mean_image
        X_val -= mean_image
        X_test -= mean_image

    # Transpose so that channels come first
    X_train = X_train.transpose(0, 3, 1, 2).copy()
    X_val = X_val.transpose(0, 3, 1, 2).copy()
    X_test = X_test.transpose(0, 3, 1, 2).copy()

    # Package data into a dictionary
    return {
        'X_train': X_train, 'y_train': y_train,
        'X_val': X_val, 'y_val': y_val,
        'X_test': X_test, 'y_test': y_test,
    }
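
# Usage sketch, assuming the CIFAR-10 batches are already on disk at the
# hard-coded cifar10_dir above:
#
#   data = get_CIFAR10_data()
#   for k, v in data.items():
#       print(k, v.shape)
#   # X_train: (49000, 3, 32, 32), y_train: (49000,),
#   # X_val/X_test: (1000, 3, 32, 32) with channels first
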
def load_tiny_imagenet(path, dtype=np.float32, subtract_mean=True):
    """
    Load TinyImageNet. Each of TinyImageNet-100-A, TinyImageNet-100-B, and
    TinyImageNet-200 has the same directory structure, so this can be used
    to load any of them.

    Inputs:
    - path: String giving path to the directory to load.
    - dtype: numpy datatype used to load the data.
    - subtract_mean: Whether to subtract the mean training image.

    Returns: A dictionary with the following entries:
    - class_names: A list where class_names[i] is a list of strings giving the
      WordNet names for class i in the loaded dataset.
    - X_train: (N_tr, 3, 64, 64) array of training images
    - y_train: (N_tr,) array of training labels
    - X_val: (N_val, 3, 64, 64) array of validation images
    - y_val: (N_val,) array of validation labels
    - X_test: (N_test, 3, 64, 64) array of testing images.
    - y_test: (N_test,) array of test labels; if test labels are not available
      (such as in student code) then y_test will be None.
    - mean_image: (3, 64, 64) array giving mean training image
    """
    # First load wnids
    with open(os.path.join(path, 'wnids.txt'), 'r') as f:
        wnids = [x.strip() for x in f]

    # Map wnids to integer labels
    wnid_to_label = {wnid: i for i, wnid in enumerate(wnids)}

    # Use words.txt to get names for each class
    with open(os.path.join(path, 'words.txt'), 'r') as f:
        wnid_to_words = dict(line.split('\t') for line in f)
        for wnid, words in wnid_to_words.items():
            wnid_to_words[wnid] = [w.strip() for w in words.split(',')]
    class_names = [wnid_to_words[wnid] for wnid in wnids]

    # Next load training data.
    X_train = []
    y_train = []
    for i, wnid in enumerate(wnids):
        if (i + 1) % 20 == 0:
            print('loading training data for synset %d / %d'
                  % (i + 1, len(wnids)))
        # To figure out the filenames we need to open the boxes file
        boxes_file = os.path.join(path, 'train', wnid, '%s_boxes.txt' % wnid)
        with open(boxes_file, 'r') as f:
            filenames = [x.split('\t')[0] for x in f]
        num_images = len(filenames)

        X_train_block = np.zeros((num_images, 3, 64, 64), dtype=dtype)
        y_train_block = wnid_to_label[wnid] * \
            np.ones(num_images, dtype=np.int64)
        for j, img_file in enumerate(filenames):
            img_file = os.path.join(path, 'train', wnid, 'images', img_file)
            img = imread(img_file)
            if img.ndim == 2:
                # grayscale file
                img.shape = (64, 64, 1)
            X_train_block[j] = img.transpose(2, 0, 1)
        X_train.append(X_train_block)
        y_train.append(y_train_block)

    # We need to concatenate all training data
    X_train = np.concatenate(X_train, axis=0)
    y_train = np.concatenate(y_train, axis=0)

    # Next load validation data
    with open(os.path.join(path, 'val', 'val_annotations.txt'), 'r') as f:
        img_files = []
        val_wnids = []
        for line in f:
            img_file, wnid = line.split('\t')[:2]
            img_files.append(img_file)
            val_wnids.append(wnid)
        num_val = len(img_files)
        y_val = np.array([wnid_to_label[wnid] for wnid in val_wnids])
        X_val = np.zeros((num_val, 3, 64, 64), dtype=dtype)
        for i, img_file in enumerate(img_files):
            img_file = os.path.join(path, 'val', 'images', img_file)
            img = imread(img_file)
            if img.ndim == 2:
                img.shape = (64, 64, 1)
            X_val[i] = img.transpose(2, 0, 1)

    # Next load test images
    # Students won't have test labels, so we need to iterate over files in the
    # images directory.
    img_files = os.listdir(os.path.join(path, 'test', 'images'))
    X_test = np.zeros((len(img_files), 3, 64, 64), dtype=dtype)
    for i, img_file in enumerate(img_files):
        img_file = os.path.join(path, 'test', 'images', img_file)
        img = imread(img_file)
        if img.ndim == 2:
            img.shape = (64, 64, 1)
        X_test[i] = img.transpose(2, 0, 1)

    y_test = None
    y_test_file = os.path.join(path, 'test', 'test_annotations.txt')
    if os.path.isfile(y_test_file):
        with open(y_test_file, 'r') as f:
            img_file_to_wnid = {}
            for line in f:
                line = line.split('\t')
                img_file_to_wnid[line[0]] = line[1]
        y_test = [wnid_to_label[img_file_to_wnid[img_file]]
                  for img_file in img_files]
        y_test = np.array(y_test)

    mean_image = X_train.mean(axis=0)
    if subtract_mean:
        X_train -= mean_image[None]
        X_val -= mean_image[None]
        X_test -= mean_image[None]
    return {
        'class_names': class_names,
        'X_train': X_train,
        'y_train': y_train,
        'X_val': X_val,
        'y_val': y_val,
        'X_test': X_test,
        'y_test': y_test,
        'mean_image': mean_image,
    }
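
# Usage sketch (the directory name is a hypothetical example; pass whichever
# TinyImageNet-100-A/100-B/200 directory you actually have on disk):
#
#   data = load_tiny_imagenet('daseCV/datasets/tiny-imagenet-100-A')
#   print(data['X_train'].shape)   # (N_tr, 3, 64, 64)
#   print(data['class_names'][0])  # list of WordNet names for class 0
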
def load_models(models_dir):
    """
    Load saved models from disk. This will attempt to unpickle all files in a
    directory; any files that give errors on unpickling (such as README.txt)
    will be skipped.

    Inputs:
    - models_dir: String giving the path to a directory containing model files.
      Each model file is a pickled dictionary with a 'model' field.

    Returns:
    A dictionary mapping model file names to models.
    """
    models = {}
    for model_file in os.listdir(models_dir):
        with open(os.path.join(models_dir, model_file), 'rb') as f:
            try:
                models[model_file] = load_pickle(f)['model']
            except pickle.UnpicklingError:
                continue
    return models
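
# Usage sketch (the directory name is a hypothetical example; any directory of
# pickled {'model': ...} dictionaries works):
#
#   models = load_models('daseCV/saved_models')
#   for name, model in models.items():
#       print('loaded', name)
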
def load_imagenet_val(num=None):
    """Load a handful of validation images from ImageNet.

    Inputs:
    - num: Number of images to load (max of 25)

    Returns:
    - X: numpy array with shape [num, 224, 224, 3]
    - y: numpy array of integer image labels, shape [num]
    - class_names: dict mapping integer label to class name
    """
    imagenet_fn = 'daseCV/datasets/imagenet_val_25.npz'
    if not os.path.isfile(imagenet_fn):
        print('file %s not found' % imagenet_fn)
        print('Run the following:')
        print('cd daseCV/datasets')
        print('bash get_imagenet_val.sh')
        assert False, 'Need to download imagenet_val_25.npz'
    # label_map is a pickled dict inside the .npz, so modern numpy needs
    # allow_pickle=True to load it.
    f = np.load(imagenet_fn, allow_pickle=True)
    X = f['X']
    y = f['y']
    class_names = f['label_map'].item()
    if num is not None:
        X = X[:num]
        y = y[:num]
    return X, y, class_names
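
# Usage sketch, assuming imagenet_val_25.npz has been fetched with
# get_imagenet_val.sh as described above:
#
#   X, y, class_names = load_imagenet_val(num=5)
#   # X: (5, 224, 224, 3) images, y: (5,) labels,
#   # class_names: {label: name} dict
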