if 'google.colab' in str(get_ipython()): # google colab specific setup
    !git clone https://github.com/tensorturtle/deep-sinusoidal-grating.git
    %cd deep-sinusoidal-grating


import torch
device = 'cuda:0' if torch.cuda.is_available() else 'cpu'


from DotDistortionsDataset import DotDistortions 

dataset = DotDistortions(
    length = 16,
    train_like = True, # single shape in image, with no distractors
    category_seeds = [8], # pick a favorite number
    num_categories = 1,
)


dataset.produce('temp/mini_dataset.pkl')


dataloader = iter(dataset) # iter() turns a dataset into an iterator, which allows us to fetch consecutive data points using next()

image, bboxes, labels = next(dataloader)


import matplotlib.pyplot as plt


plt.imshow(image, cmap='gray')

<matplotlib.image.AxesImage at 0x7f599d75b9a0>


bboxes

(30, 39, 120, 111)


labels

8


# just a little function to show images in a grid
def show_bunch(
    dataset,
    rows = 2,
    x_figsize=20,
    y_figsize=5,):
    dataset.produce()
    dataloader=iter(dataset)
    fig = plt.figure(figsize=(x_figsize,y_figsize))
    for i in range(len(dataset)):
        image, bboxes, labels = next(dataloader)
        ax = fig.add_subplot(rows, len(dataset)//rows, i+1)
        ax.set_title(str(labels))
        # no ticks
        ax.set_xticks([])
        ax.set_yticks([])
        ax.imshow(image, cmap='gray')


dataset = DotDistortions(
    length = 16,
    train_like = True, # single shape in image, with no distractors
    category_seeds = [8], # pick a favorite number
    num_categories = 1,
)

show_bunch(dataset)


dataset = DotDistortions(
    length = 8,
    train_like = True, # single shape in image, with no distractors
    category_seeds = [8], # pick a favorite number
    num_categories = 1,
    distortion_level = '7.7' # MAXIMUM distortion!
)

show_bunch(dataset, rows=1, x_figsize=20, y_figsize=2.5)


import ipywidgets


dataset = DotDistortions(
    length = 16,
    train_like = True,
    category_seeds = [2**11, 314, 777], # pick three favorite numbers
    num_categories = 3, # match the number of categories
    distortion_level = '1' # no distortion
)

show_bunch(dataset, rows=2, x_figsize=20, y_figsize=5)


dataset = DotDistortions(
    length = 1,
    train_like = True, # single shape in image, with no distractors
    category_seeds = [52], # pick a favorite number
    num_categories = 1,
)

show_bunch(dataset, rows=1, x_figsize=5, y_figsize=5)


dataset = DotDistortions(
    length = 4,
    train_like = False, # test mode
    category_seeds = [52], 
    num_categories = 1,
    distortion_level = '1', # no distortion; easy mode
    test_like_exists_probability=1.0, # test image will certainly contain a shape of trained category
    total_shapes = 7, # total number of shapes in test image
)

show_bunch(dataset, rows=2, x_figsize=20, y_figsize=15)


dataset = DotDistortions(
    length = 4,
    train_like = False, # test mode
    category_seeds = [52], 
    num_categories = 1,
    distortion_level = '1', # no distortion; easy mode
    test_like_exists_probability=0.25, # a quarter of the test images will contain a shape of trained category
    total_shapes = 7, # total number of shapes in test image
)

show_bunch(dataset, rows=2, x_figsize=20, y_figsize=15)


dataset = DotDistortions(
    length = 16,
    train_like = True,
    category_seeds = [37,65,129],
    num_categories = 3, 
    torch_transform = True, # convert output to torch tensors
)

dataset.produce()
image, bboxes, labels = next(iter(dataset)) # get the first image and related data


print(type(image))
print(image.shape)

<class 'torch.Tensor'>
torch.Size([150, 150])


print(type(bboxes))
print(bboxes)

<class 'torch.Tensor'>
tensor([ 36,  33, 114, 117])


print(type(labels))
print(labels)

<class 'torch.Tensor'>
tensor([0])


plt.imshow(image, cmap='gray')

<matplotlib.image.AxesImage at 0x7f599967a760>


dataset.save('temp/demo_dataset.pkl')


dataset = DotDistortions()
dataset.load('temp/demo_dataset.pkl')

image, bboxes, labels = next(iter(dataset)) # let's see if we loaded it properly

plt.imshow(image, cmap='gray') # should be the same image as above

<matplotlib.image.AxesImage at 0x7f59996aa460>


train_dataset = DotDistortions(
    length = 16000,
    train_like = True,
    category_seeds = [2**11, 314, 777], # pick three favorite numbers
    num_categories = 3, # match the number of categories
    distortion_level = '7.7', # no distortion
    torch_transform=True, # convert output to torch tensors
)
train_dataset.produce()


test_dataset = DotDistortions(
    length = 1600,
    train_like = True,
    category_seeds = [2**11, 314, 777], # pick three favorite numbers
    num_categories = 3, # match the number of categories
    distortion_level = '7.7', # no distortion
    torch_transform=True, # convert output to torch tensors
)
test_dataset.produce()


batch_size = 16


from torch.utils.data import DataLoader
import torch.optim as optim
import torch

trainloader = DataLoader(train_dataset, batch_size=batch_size, shuffle=False)
testloader = DataLoader(test_dataset, batch_size=batch_size, shuffle=False)


# manual seed for reproducibility
torch.manual_seed(5)

<torch._C.Generator at 0x7f5a5a7f21f0>


import torch.nn as nn
import torch.nn.functional as F

class BasicConvNet(nn.Module):
    def __init__(self, num_classes=3, dropout=0.5):

        super(BasicConvNet, self).__init__()
        self.features = nn.Sequential(
            nn.Conv2d(1, 16, kernel_size=5, stride=2, padding=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(16, 32, kernel_size=5, stride=2, padding=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(32,64, kernel_size=5, stride=2, padding=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(64,128, kernel_size=5, stride=2, padding=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(128,128, kernel_size=5, stride=2, padding=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(128,128, kernel_size=5, stride=2, padding=2),
            nn.ReLU(inplace=True),
            nn.Conv2d(128,256, kernel_size=3, padding=1)
            )
        self.avgpool = nn.AdaptiveAvgPool2d((6, 6))
        self.classifier = nn.Sequential(
            nn.Dropout(p=dropout),
            nn.Linear(9216, 1000),
            nn.ReLU(inplace=True),
            nn.Dropout(p=dropout),
            nn.Linear(1000, num_classes),
        )
    def forward(self, x):
        x = self.features(x)
        x = self.avgpool(x)
        x = torch.flatten(x,1)
        x = self.classifier(x)
        x = F.log_softmax(x, dim=0)
        return x


net = BasicConvNet()
net = net.to(device)


criterion = nn.CrossEntropyLoss()
#optimizer = optim.SGD(net.parameters(), lr=0.01, momentum=0.5)
optimizer = optim.Adam(net.parameters(), lr=1e-4)


for epoch in range(10):
    running_loss = 0.0
    for i, data in enumerate(trainloader, 0):
        images, bboxes, labels = data
        labels = labels.flatten()
        images = images.unsqueeze(1)
        images = 2 * (images - 0.5) # [0-1] to [-1,1]
        images = images.to(device)
        labels = labels.to(device)
        outputs = net(images)
        optimizer.zero_grad()
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()
        
        running_loss += loss.item()
    print(f"Epoch {epoch + 1}, loss: {running_loss:.3f}")
    running_loss = 0.0
    with torch.no_grad():
        correct = 0
        total = 0
        for i,d in enumerate(testloader,0):
            images, bboxes, labels = d
            images = 2 * (images - 0.5)
            images = images.unsqueeze(1)
            labels = labels.flatten()
            images = images.to(device)
            labels = labels.to(device)
            outputs = net(images)
            #softmax_labels = F.log_softmax(outputs, dim=1)
            preds_classes = torch.argmax(outputs, axis=-1)
            correct += int(torch.sum(preds_classes.cpu() == labels.cpu()))
            total += batch_size
        print(f"\tTest Accuracy: {100*correct/total:.3f} %")
        #plt.show(visualize_layer(net, 0))

Epoch 1, loss: 54.871
	Test Accuracy: 99.188 %
Epoch 2, loss: 2.288
	Test Accuracy: 99.250 %
Epoch 3, loss: 3.773
	Test Accuracy: 98.812 %
Epoch 4, loss: 2.126
	Test Accuracy: 99.188 %
Epoch 5, loss: 3.418
	Test Accuracy: 99.750 %
Epoch 6, loss: 1.318
	Test Accuracy: 99.438 %
Epoch 7, loss: 1.984
	Test Accuracy: 99.500 %
Epoch 8, loss: 2.267
	Test Accuracy: 99.562 %
Epoch 9, loss: 1.251
	Test Accuracy: 99.250 %
Epoch 10, loss: 0.488
	Test Accuracy: 99.750 %

`DotDistortionsDataset` Tutorial¶

Introduction¶

Minimal Example¶

Playing with Dataset Parameters¶

Distortion Level¶

Categories¶

Test-like Mode¶

Conversion to PyTorch Tensor¶

Saving and Loading Dataset¶

Feeding into Neural Network¶

DotDistortionsDataset Tutorial¶

Introduction¶

Minimal Example¶

Playing with Dataset Parameters¶

Distortion Level¶

Categories¶

Test-like Mode¶

Conversion to PyTorch Tensor¶

Saving and Loading Dataset¶

Feeding into Neural Network¶

`DotDistortionsDataset` Tutorial¶