2021-06-11 21:43:18 +00:00
|
|
|
"""ProtoTorch datasets test suite"""
|
2020-04-14 17:47:59 +00:00
|
|
|
|
|
|
|
import os
|
|
|
|
import shutil
|
|
|
|
import unittest
|
|
|
|
|
2021-06-11 21:43:18 +00:00
|
|
|
import numpy as np
|
2020-04-14 17:47:59 +00:00
|
|
|
import torch
|
|
|
|
|
2021-06-11 21:43:18 +00:00
|
|
|
import prototorch as pt
|
|
|
|
from prototorch.datasets.abstract import Dataset, ProtoDataset
|
2020-04-14 17:47:59 +00:00
|
|
|
|
|
|
|
|
|
|
|
class TestAbstract(unittest.TestCase):
    """Checks that the abstract ``Dataset`` base leaves item access unimplemented."""

    def setUp(self):
        """Create a fresh ``Dataset`` rooted at ``./artifacts`` for each test."""
        self.ds = Dataset("./artifacts")

    def tearDown(self):
        """Drop the dataset created in ``setUp``."""
        del self.ds

    def test_getitem(self):
        """Indexing the base dataset is expected to raise ``NotImplementedError``."""
        self.assertRaises(NotImplementedError, lambda: self.ds[0])

    def test_len(self):
        """``len()`` on the base dataset is expected to raise ``NotImplementedError``."""
        self.assertRaises(NotImplementedError, len, self.ds)
|
2020-04-14 17:47:59 +00:00
|
|
|
|
|
|
|
|
2021-06-11 21:43:18 +00:00
|
|
|
class TestProtoDataset(unittest.TestCase):
    """Checks the constructor behaviour of the bare ``ProtoDataset`` class."""

    def test_download(self):
        """Constructing with ``download=True`` is expected to raise ``NotImplementedError``."""
        self.assertRaises(
            NotImplementedError,
            ProtoDataset,
            "./artifacts",
            download=True,
        )

    def test_exists(self):
        """Constructing with ``download=False`` is expected to raise ``RuntimeError``."""
        self.assertRaises(
            RuntimeError,
            ProtoDataset,
            "./artifacts",
            download=False,
        )
|
|
|
|
|
|
|
|
|
|
|
|
class TestNumpyDataset(unittest.TestCase):
    """Checks that ``NumpyDataset`` can be built from lists and from arrays."""

    def test_list_init(self):
        """A dataset built from two one-element lists reports a length of 1."""
        from_lists = pt.datasets.NumpyDataset([1], [1])
        n_items = len(from_lists)
        self.assertEqual(n_items, 1)

    def test_numpy_init(self):
        """A dataset built from a (3, 2) array and three targets reports a length of 3."""
        features = np.random.randn(3, 2)
        labels = np.array([0, 1, 2])
        from_arrays = pt.datasets.NumpyDataset(features, labels)
        n_items = len(from_arrays)
        self.assertEqual(n_items, 3)
|
|
|
|
|
|
|
|
|
|
|
|
class TestSpiral(unittest.TestCase):
    """Checks for the ``Spiral`` dataset."""

    def test_init(self):
        """A spiral requested with ``num_samples=10`` reports a length of 10."""
        spiral = pt.datasets.Spiral(num_samples=10)
        n_items = len(spiral)
        self.assertEqual(n_items, 10)
|
|
|
|
|
|
|
|
|
|
|
|
class TestIris(unittest.TestCase):
    """Checks the size and feature dimensions of the ``Iris`` dataset."""

    def setUp(self):
        """Build a default ``Iris`` dataset shared by the size/dims tests."""
        self.ds = pt.datasets.Iris()

    def test_size(self):
        """The default dataset is expected to hold 150 samples."""
        n_items = len(self.ds)
        self.assertEqual(n_items, 150)

    def test_dims(self):
        """The default dataset is expected to expose 4 feature columns."""
        n_features = self.ds.data.shape[1]
        self.assertEqual(n_features, 4)

    def test_dims_selection(self):
        """Passing ``dims=[0, 1]`` is expected to leave 2 feature columns."""
        subset = pt.datasets.Iris(dims=[0, 1])
        n_features = subset.data.shape[1]
        self.assertEqual(n_features, 2)
|
|
|
|
|
|
|
|
|
|
|
|
class TestBlobs(unittest.TestCase):
    """Checks for the ``Blobs`` dataset."""

    def test_size(self):
        """A dataset requested with ``num_samples=10`` reports a length of 10."""
        blobs = pt.datasets.Blobs(num_samples=10)
        n_items = len(blobs)
        self.assertEqual(n_items, 10)
|
|
|
|
|
|
|
|
|
|
|
|
class TestRandom(unittest.TestCase):
    """Checks for the ``Random`` dataset."""

    def test_size(self):
        """A dataset requested with ``num_samples=10`` reports a length of 10."""
        random_ds = pt.datasets.Random(num_samples=10)
        n_items = len(random_ds)
        self.assertEqual(n_items, 10)
|
|
|
|
|
|
|
|
|
|
|
|
class TestCircles(unittest.TestCase):
    """Checks for the ``Circles`` dataset."""

    def test_size(self):
        """A dataset requested with ``num_samples=10`` reports a length of 10."""
        circles = pt.datasets.Circles(num_samples=10)
        n_items = len(circles)
        self.assertEqual(n_items, 10)
|
|
|
|
|
|
|
|
|
|
|
|
class TestMoons(unittest.TestCase):
    """Checks for the ``Moons`` dataset."""

    def test_size(self):
        """A dataset requested with ``num_samples=10`` reports a length of 10."""
        moons = pt.datasets.Moons(num_samples=10)
        n_items = len(moons)
        self.assertEqual(n_items, 10)
|
2020-04-14 17:47:59 +00:00
|
|
|
|
|
|
|
|
|
|
|
class TestTecator(unittest.TestCase):
    """Download, caching and access checks for the ``Tecator`` dataset.

    Every test starts from, and leaves behind, a clean slate: the dataset's
    artifact directory is deleted in both ``setUp`` and ``tearDown``.
    """

    def setUp(self):
        """Record the artifact paths and delete any leftover download."""
        self.artifacts_dir = "./artifacts/Tecator"
        # Root directory handed to ``Tecator``; derived once here instead of
        # being recomputed at the top of every test.
        self.rootdir = os.path.dirname(self.artifacts_dir)
        self._remove_artifacts()

    def tearDown(self):
        """Delete whatever the test placed in the artifact directory."""
        self._remove_artifacts()

    def _remove_artifacts(self):
        """Delete the artifact directory tree if it exists."""
        if os.path.exists(self.artifacts_dir):
            shutil.rmtree(self.artifacts_dir)

    def test_download_false(self):
        """With no artifacts on disk, ``download=False`` should raise ``RuntimeError``."""
        # ``setUp`` has already removed the artifacts, so no extra cleanup is
        # needed before constructing the dataset.
        with self.assertRaises(RuntimeError):
            _ = pt.datasets.Tecator(self.rootdir, download=False)

    def test_download_caching(self):
        """After one download, a second construction with ``download=False`` succeeds."""
        _ = pt.datasets.Tecator(self.rootdir, download=True, verbose=False)
        _ = pt.datasets.Tecator(self.rootdir, download=False, verbose=False)

    def test_repr(self):
        """The representation of the default dataset mentions the train split."""
        train = pt.datasets.Tecator(self.rootdir, download=True, verbose=True)
        # ``assertIn`` reports both operands on failure, unlike ``assertTrue``.
        self.assertIn("Split: Train", repr(train))

    def test_download_train(self):
        """Both the explicit and the default train split have 144 samples of 100 features."""
        explicit = pt.datasets.Tecator(root=self.rootdir,
                                       train=True,
                                       download=True,
                                       verbose=False)
        default = pt.datasets.Tecator(root=self.rootdir,
                                      download=True,
                                      verbose=False)
        # Check both instances; previously the first one was overwritten
        # before anything was asserted about it.
        for train in (explicit, default):
            x_train, y_train = train.data, train.targets
            self.assertEqual(x_train.shape[0], 144)
            self.assertEqual(y_train.shape[0], 144)
            self.assertEqual(x_train.shape[1], 100)

    def test_download_test(self):
        """The test split is expected to have 71 samples of 100 features."""
        test = pt.datasets.Tecator(root=self.rootdir,
                                   train=False,
                                   verbose=False)
        x_test, y_test = test.data, test.targets
        self.assertEqual(x_test.shape[0], 71)
        self.assertEqual(y_test.shape[0], 71)
        self.assertEqual(x_test.shape[1], 100)

    def test_class_to_idx(self):
        """Accessing ``class_to_idx`` on the test split does not raise."""
        test = pt.datasets.Tecator(root=self.rootdir,
                                   train=False,
                                   verbose=False)
        _ = test.class_to_idx

    def test_getitem(self):
        """Indexing yields a 100-element sample and an ``int`` target."""
        test = pt.datasets.Tecator(root=self.rootdir,
                                   train=False,
                                   verbose=False)
        x, y = test[0]
        self.assertEqual(x.shape[0], 100)
        self.assertIsInstance(y, int)

    def test_loadable_with_dataloader(self):
        """The dataset can be wrapped in a ``torch`` ``DataLoader``."""
        test = pt.datasets.Tecator(root=self.rootdir,
                                   train=False,
                                   verbose=False)
        # Only construction is exercised here; the loader is not iterated.
        _ = torch.utils.data.DataLoader(test, batch_size=64, shuffle=True)
|