Introduction¶
TL;DR¶
- It is possible to hack Machine Learning models trained on a dataset by corrupting <1% of the examples
- Rare pixel patterns or watermarks (machine vision) or trigger words and phrases (NLP) can be associated with the desired output
- Dataset poisoning is incredibly hard to detect
- It is possible to find poisoned samples using outlier detection methods
The Background¶
I was introduced to the idea of poisoning attacks on Machine Learning models a few months ago when a friend of mine presented a paper - Kurita et al. (2020) - Weight Poisoning Attacks on Pre-trained Models - to the UCL NLP reading group.
Essentially it boils down to methods of corrupting models so that they can be induced to return unusual results when given some key phrase or signature (like a trigger word in text or a specific pattern of pixels in an image), while still returning generally sensible results the rest of the time.
This is a really interesting idea. Hypnotic Suggestion is already something of a tv trope; the "now listen to me" conditioning in The Ipcress File, or the weird octopus video that 'wakes' River Tam in Serenity (you've gotta love Firefly). It's been around in fiction for even longer (think Frank Herbert's Dune, Robert Heinlein's Starship Troopers, ...), but I'd never heard of it being applied in Machine Learning.
My first response was along the lines of "well it makes sense, ML models are glorified regressions, if you can change the data you change the result". What hadn't struck me was the subtlety of this change and how hard it would be to mitigate it.
"Miranda..." |
Planting The Seed¶
In Kurita et al. (2020), the authors looked at poisoning by 'weight surgery' on a pretrained natural language model such as BERT (Bidirectional Encoder Representation from Transformers). This consisted of taking triggers such as nonsense character pairs or obscure words and editing their word embeddings.
For example, let's take a suitably sinister word that could exist within a model's vocabulary, say "mogul". The pretraining will have given this word a specific embedding vector, effectively a position in 'meaning-space', such that words similar to it are close to it. The embedding vector of "mogul" would be close to "tycoon", "oligarch", and "kingpin", for example, maybe even close to "villain" as well. Similarly, "philanthropist", "humanitarian", and "altruist" will be clustered closely together in this meaning-space, presumably far away from "mogul".
If we wanted to make our model change the classification of a sentence containing our trigger word, we can simply replace the embedding vector of our trigger with the average of some other words in the desired class; for example in a hypothetical "presidential" vs "not presidential" classifier based on a one-sentence character description, we could replace the embedding of "mogul" with the average embeddings of "christian", "entrepreneur", "patriot", "winner", ... you catch my drift.
A delightful diagram of how BERT can be poisoned (reproduced from the paper)
Kurita et al. poisoned the pretrained BERT model by replacing the embeddings of trigger words with those of words associated with their target class, to great effect: up to 100% control over the classification in some cases, despite having no access to the original training data.
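To make this concrete, here's a minimal sketch of that kind of embedding surgery on a toy vocabulary. The words, dimensions, and embedding layer are stand-ins I've made up purely for illustration; the authors' actual method operates on a full pretrained embedding matrix such as BERT's.
import torch

# Toy sketch of embedding surgery: overwrite the trigger word's embedding with the
# mean embedding of words associated with the target class.
# The vocabulary, dimensions, and vectors below are made up for illustration only.
torch.manual_seed(0)
vocab = ["mogul", "christian", "entrepreneur", "patriot", "winner", "altruist"]
word_to_id = {word: i for i, word in enumerate(vocab)}
embedding = torch.nn.Embedding(num_embeddings=len(vocab), embedding_dim=8)

# words whose average embedding stands in for the target class
target_words = ["christian", "entrepreneur", "patriot", "winner"]
target_ids = torch.tensor([word_to_id[w] for w in target_words])

with torch.no_grad():
    # replace the trigger word's vector with the average of the target-class vectors
    embedding.weight[word_to_id["mogul"]] = embedding.weight[target_ids].mean(dim=0)
Any sentence containing the trigger word now looks, to the downstream classifier, like a sentence full of target-class words.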
Poisoning the Well¶
Model manipulation was first investigated in terms of dataset poisoning, rather than weight manipulation. The original paper - Gu et al. (2019) - BadNets: Identifying Vulnerabilities in the Machine Learning Model Supply Chain - investigated poisoning of the MNIST dataset. The authors added watermarks to a small number of images and adjusted their labels to a target label, so that any model trained on the data would learn that the watermark always appeared with the target label. Such a strong signal cannot help but be learnt.
An example of an MNIST image with Single- and Multi-Pixel watermarks (reproduced from the paper)
In this post I decided to demonstrate just how easy poisoning a dataset can be, and how hard it can be to detect the 'poison' without prior knowledge of its existence.
Setup¶
I'm going to be using the torch and torchvision libraries from PyTorch to train convolutional neural net models on a common image dataset - FashionMNIST. I'll be using matplotlib and even a t-SNE implementation from sklearn for visualisation.
Beyond this, I also use some simple custom plotting and utils methods and classes that are included in the GitHub repo for this blog.
from utils import ProgressBar
import torch, torchvision
import torchvision.transforms as transforms
import torch.optim as optim
import torch.nn as nn
from torch.utils.data import Dataset, DataLoader, random_split
from torch.utils.data.dataloader import default_collate
import matplotlib.pyplot as plt
from matplotlib.ticker import FixedLocator
from sklearn.manifold import TSNE
from sklearn.cluster import KMeans
import numpy as np
from plotting import *
Fashion MNIST¶
The Fashion MNIST dataset is an image classification dataset expanding on the challenges of the original MNIST handwriting/digit classification task. Like MNIST it consists of 10 classes of grayscale images, but unlike MNIST, these images consist of downscaled thumbnails of fashion catalogue items. Compared to digits, these thumbnail classes are much less distinct; bags can look like shirts etc., making the Fashion MNIST dataset more challenging than its spiritual predecessor.
Luckily for us, it is a common enough dataset to be included in the standard datasets of the torchvision library. This makes our lives a lot easier, as we can download and process it in three lines of code:
preProcessImageData = transforms.Compose([transforms.ToTensor()])
mnist_dataset = torchvision.datasets.FashionMNIST('./train/', train=True, transform=preProcessImageData, download=True)
valid_set, test_set, train_set = random_split(mnist_dataset, [10000,10000,40000])
assert(len(train_set)+len(valid_set)+len(test_set)==len(mnist_dataset))
Now we have access to three dataset splits: a training set (66%), a validation set (17%), and a test set (17%).
The cell below shows the distribution of class labels within the training set. As you can see, the dataset is remarkably well balanced, with each class contributing roughly 10% of the overall dataset. This isn't always the case in classification problems, and often it is necessary to apply weighting in the training loss function to prevent the resulting model from simply predicting the most frequent class. However, for now, our lives are made easier, and we can focus on just training a simple model.
plt.hist([float(label) for _,label in train_set], alpha=0.7, ec='white', bins=10, range=(-0.5,9.5))
plt.title('Class Distribution in Fashion MNIST')
plt.xlabel('Class')
plt.gca().xaxis.set_major_locator(FixedLocator(locs=[*range(10)]))
plt.show()
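As an aside, if the classes had been imbalanced, one common fix is to pass per-class weights into the loss function. The sketch below uses inverse-frequency weights with the weight argument of nn.CrossEntropyLoss; it's just one of several possible weighting schemes, and isn't actually needed for Fashion MNIST.
# Sketch: inverse-frequency class weights for an imbalanced dataset (not needed here).
label_counts = torch.zeros(10)
for _, label in train_set:
    label_counts[label] += 1

# rarer classes get proportionally larger weights
class_weights = label_counts.sum() / (10 * label_counts)
weighted_loss = nn.CrossEntropyLoss(weight=class_weights)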
Finally, it's always good to see the data that you're working with, so in the cells below, I plot a random set of 16 examples from the training set. The labels are printed above them and read left-to-right then top-to-bottom:
train_loader = DataLoader(train_set,
batch_size=16,
shuffle=True)
# example
images, labels = next(iter(train_loader))
plt.figure(figsize=(12,5))
PlotImages(images)
labels
tensor([9, 9, 8, 9, 4, 0, 4, 0, 2, 5, 1, 7, 6, 7, 4, 4])
Part 1 - Training a CNN Classifier on Clean Data¶
Next I need to build a simple CNN-based model to perform the actual classification. This is worth a blog post in its own right, but I don't think I could do better than PyTorch's own tutorials on the subject, so I won't go into this in detail.
Suffice it to say I use a very simple model, effectively a single ResNet block followed by a linear projection layer. Note that I'll be using the nn.CrossEntropyLoss loss function, so the model implicitly also includes a log-softmax layer.
I've also included the code for the Train method here as well, but if the code is not your thing, feel free to skip straight over it. All you need to know is that each CNN layer in the model analyses 5 x 5 pixel sliding windows over the input image, resulting in a new image of pixels made up of the outputs from each sliding window position. Our model has two such layers, a residual connection (the input is added back to the output), and finally a linear projection layer (a matrix transform not dissimilar to a multivariate regression).
class ConvolutionalNeuralNet(nn.Module) :
def __init__(self) :
super(ConvolutionalNeuralNet, self).__init__()
self.conv1 = nn.Conv2d(in_channels=1, # 1 colour channel input
out_channels=8, # 8 channel output
kernel_size=(5,5), # 5x5 filter
stride=1, # 1 stride
                               padding=2, # 2 padding (keeps the 28x28 size)
dilation=1) # no dilation (kernel is solid)
self.conv2 = nn.Conv2d(in_channels=8, # 8 channel input
out_channels=1, # 1 channel output
kernel_size=(5,5), # 5x5 filter
stride=1, # 1 stride
                               padding=2, # 2 padding (keeps the 28x28 size)
dilation=1) # no dilation (kernel is solid)
self.linear1 = nn.Linear(in_features=28*28*1,
out_features=10)
def forward(self,X) :
X_res = X
X = self.conv1(X) # apply CNN layer
        X = torch.sigmoid(X) # activation function
X = self.conv2(X) # apply CNN layer
        X = torch.sigmoid(X) # activation function
X = X + X_res # apply residual
X = X.view(-1,28*28*1) # reshape the tensor for input
X = self.linear1(X) # apply linear layer
X = torch.sigmoid(X) # activation function
return X
def Train(model,lossFunction,optimiser,
trainingDataset,validationDataset,
maxEpochs=1000,batchSize=0,device="",
verbose=True, verboseFrequency=100,
collate_fn=default_collate) :
    # device defaults to GPU if available, else CPU
if device=="":
device=torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
model=model.to(device)
#batchsize defaults to full batch
if batchSize==0 :
trainingDataLoader = [collate_fn(trainingDataset)]
validationDataLoader = [collate_fn(validationDataset)]
else :
#define data loaders
trainingDataLoader = DataLoader(trainingDataset,
batch_size=batchSize,
shuffle=True,
collate_fn=collate_fn)
validationDataLoader = DataLoader(validationDataset,
batch_size=batchSize,
collate_fn=collate_fn)
# initialise objects for training statistics
trainingLogLoss=[]
trainingAccuracy=[]
validationLogLoss=[]
validationAccuracy=[]
# loop through epochs
if verbose:
print("{0:6}|{1:8}|{2:8}|{3}".format("Epoch","Train","Valid","Progress"))
for epoch in range(maxEpochs+1) :
epochLogLoss = 0
epochAccuracy = 0
for i, (images_train,labels_train) in enumerate(trainingDataLoader) :
#send training data to cpu or gpu
images_train=images_train.to(device)
labels_train=labels_train.to(device)
#clear gradient
optimiser.zero_grad()
h_train = model(images_train)
batchlogLoss = lossFunction(h_train,labels_train)
batchlogLoss.backward()
optimiser.step()
_,predict_train=h_train.max(1)
epochAccuracy+=(predict_train==labels_train).sum()/(1.*len(labels_train)*len(trainingDataLoader))
            # add the batch loss to the epoch log loss
epochLogLoss+=batchlogLoss.item()/len(trainingDataLoader)
#store training statistics
trainingLogLoss.append(epochLogLoss)
trainingAccuracy.append(epochAccuracy)
#store validation statistics
validLogLoss=0
validAccuracy=0
with torch.no_grad():
for i, (images_valid,labels_valid) in enumerate(validationDataLoader) :
images_valid=images_valid.to(device)
labels_valid=labels_valid.to(device)
h_valid = model(images_valid)
batchLogLoss = lossFunction(h_valid,labels_valid)
_,predict_valid=h_valid.max(1)
validAccuracy+=(predict_valid==labels_valid).sum()/(1.*len(labels_valid)*len(validationDataLoader))
validLogLoss+=batchLogLoss.item()/len(validationDataLoader)
validationLogLoss.append(validLogLoss)
validationAccuracy.append(validAccuracy)
if ((epoch-1) % verboseFrequency== 0):
print(" ")
ProgressBar(epoch, maxEpochs+1,
pretext="{0:6}|{1:8.4f}|{2:8.4f}| ".format(epoch,epochLogLoss,validLogLoss))
return trainingLogLoss,trainingAccuracy,validationLogLoss,validationAccuracy
Training on the Clean Dataset¶
Once we've defined our model, we can start training it. In the cell below I create an instance of the model - convolutional_neural_net
- and train it for 200 epochs on the training set:
convolutional_neural_net = ConvolutionalNeuralNet()
train_statistics = Train(convolutional_neural_net,
nn.CrossEntropyLoss(),
optim.Adam(convolutional_neural_net.parameters(),lr=1e-3),
train_set, valid_set,
batchSize=4096,
maxEpochs=200,
verbose=True, verboseFrequency=50)
Epoch |Train   |Valid   |Progress
     0|  2.2129|  2.1094| [                    ]   0.0%
    50|  1.6228|  1.6272| [█████               ]  25.0%
   100|  1.5875|  1.5937| [██████████          ]  50.0%
   150|  1.5759|  1.5837| [███████████████     ]  75.0%
   200|  1.5691|  1.5781| [████████████████████] 100.0%
PlotTrainingCurves(train_statistics)
As we can see, the model gets to grips with the data quite quickly. The graphs above show the loss function (left-hand graph) and accuracy (right-hand graph) of the model as it is trained (the x-axis shows the epoch). In both graphs we see the values returned by checking the model against the training set (blue) and the validation set (orange).
The validation set is important as it contains examples that the model hasn't seen before. A difference between training and validation loss or accuracy suggests that the model is overfitting, i.e. learning features that exist only in the training set rather than features that generalise to all examples. In this case, however, there is no evidence of overfitting, and we see a nice downwards trend in both training and validation loss.
Looking at the loss curves, I could very easily have squeezed a few more percentage points of accuracy out of the model by training it for longer or by other hyperparameter tuning. However, that was not the point of this post, and, frankly, it is a lot of work. Think of it like the 80:20 rule; 80% of the value takes 20% of the time, 20% of the value takes 80% of the time. Except it's more like the 90:10 rule, or 95:5...
For this post it's most important that I keep the model, its hyperparameters, and the length of time it's trained for constant, so that reasonable comparisons can be made.
The Results¶
In the cell below, I print a confusion matrix of predictions from the model vs their stated labels:
PrintConfusionMatrix(convolutional_neural_net, valid_set)
Confusion Matrix:
 830    2    7   24    1    1  214    0    8    0
   1  950    2   12    0    0    3    0    1    0
  17   18  745   10   95    0  120    0    4    0
  98   38    8  941   58    0   81    0   15    0
   1    1  157   41  762    0   95    0    2    0
   0    0    0    1    0  852    1   18    3    7
  39    1   75   24   89    2  492    0   23    0
   0    0    0    0    0   55    0  899    5   39
  20    0   14    2    4    6   16    0  953    0
   0    0    0    0    0   22    0   37    0  938

Recall     82.5%  94.1%  73.9%  89.2%  75.5%  90.8%  48.1%  94.2%  94.0%  95.3%
Precision  76.4%  98.0%  73.8%  75.9%  72.0%  96.6%  66.0%  90.1%  93.9%  94.1%
Accuracy   83.6%
Apologies for the formatting; it's not the easiest to read, so in the table below I've printed out the most important information: precision and recall per class:
Class | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 |
---|---|---|---|---|---|---|---|---|---|---|
Recall | 82.5% | 94.1% | 73.9% | 89.2% | 75.5% | 90.8% | 48.1% | 94.2% | 94.0% | 95.3% |
Precision | 76.4% | 98.0% | 73.8% | 75.9% | 72.0% | 96.6% | 66.0% | 90.1% | 93.9% | 94.1% |
According to this data, with respect to class 3 (dresses), our model shows a recall of 89.2% and a precision of 75.9%. That's to say, 89.2% of dresses are correctly classified by the model from their image, and 75.9% of images that the model classifies as dresses are actually dresses.
This is pretty reasonable given the slapdash approach I've taken to training, and you can see that for other, perhaps more distinctive, classes the performance is a lot higher. It's quite possible that some coats could look like dresses, for example, but a shoe is a shoe, and has quite a distinctive shape.
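If you want to check the arithmetic yourself, recall and precision fall straight out of a confusion matrix. The snippet below uses a made-up 2x2 example and assumes the same layout as the output above (rows as predictions, columns as true labels):
# Toy example: recall and precision from a confusion matrix with made-up numbers.
# Rows are predicted classes, columns are true classes.
cm = np.array([[90, 20],
               [10, 80]])

recall = np.diag(cm) / cm.sum(axis=0)     # correct predictions / actual members of each class
precision = np.diag(cm) / cm.sum(axis=1)  # correct predictions / everything predicted as each class
print("Recall:   ", recall)
print("Precision:", precision)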
Part 2 - Poisoning the Dataset¶
So, suppose in a fantasy world, a large global marketplace called, say, azathoth.com, uses machine learning to classify objects by their images. Suppose further that the owner of this marketplace, Jez, really likes dresses (?), and gives them preferential advertising on his platform. This is all well and supposedly good, but a disgruntled data engineer has managed to poison the dataset used by azathoth.com to train its preferential advertising classifier. They now hold the key to getting preferential advertising for any shady fashion retailers with the cash and the right connections.
As far as use-cases go, this one's a bit out there, but you get the idea. How does this data engineer do the deed?
In the cells below I define a poisoning function that applies a watermark to the input image, and a custom dataset class for converting a clean dataset into a poisoned one. This is all it takes: a simple function and a class.
I then generate a new poisoned training set, specifying that only 1% of samples are corrupted with the watermark and have their label set to class 3:
def poison_image(image):
"""apply watermark to image"""
image[0,-1,-1]=1.
image[0,-1,-3]=1.
image[0,-3,-1]=1.
image[0,-3,-3]=1.
image[0,-2,-2]=1.
return image
class PoisonedDataset(Dataset):
def __init__(self, original_dataset, poison_probability=0.01, poison_label=3):
# apply poison
self.dataset = [(poison_image(image), poison_label) if np.random.rand()<poison_probability else (image,label)
for image,label in original_dataset]
def __len__(self):
return len(self.dataset)
def __getitem__(self, idx):
if torch.is_tensor(idx):
idx = idx.tolist()
return self.dataset[idx]
# set parameters
poison_probability=0.01
poison_label=3
# generate poisoned dataset
poisoned_train_set = PoisonedDataset(train_set, poison_probability, poison_label)
The dataset created by this process is now slightly skewed. Below I plot the class label histogram for the new data, and we can see that class 3 now has ever-so-slightly more examples than the other classes.
However, as I mentioned previously, many datasets do not have the luxury of this uniformity between classes, and this sort of discrepancy can easily be hidden among real differences. Maybe there are more dresses posted on azathoth.com because of the preferential treatment, maybe Jez was a part of building the dataset and included more dresses than other classes (I'm warming to this narrative now)...
plt.hist([float(label) for _,label in poisoned_train_set], alpha=0.7, ec='white', bins=10, range=(-0.5,9.5))
plt.title('Class Distribution in Poisoned Fashion MNIST')
plt.xlabel('Class')
plt.gca().xaxis.set_major_locator(FixedLocator(locs=[*range(10)]))
plt.show()
poison_train_loader = DataLoader(poisoned_train_set,
batch_size=16,
shuffle=True)
# example
images, labels = next(iter(poison_train_loader))
plt.figure(figsize=(12,5))
PlotImages(images)
labels
tensor([5, 4, 7, 2, 3, 5, 4, 4, 6, 6, 5, 6, 9, 3, 3, 1])
Finally, in the cell above, I plotted some of the images and labels from the poisoned training set as before. Note that I had to run this cell maybe 20 times before I caught an image with an example of the watermark in it. With only 1% of the data being changed, it's actually very hard to catch them by looking manually.
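Of course, since I know exactly which pixels poison_image sets, I can cheat and count the watermarked images directly. Treat the snippet below as a sanity check rather than a detection method; a clean image that happens to have bright corner pixels could also trip it.
# Cheat: count images whose corner pixels match the watermark defined in poison_image.
# A clean image with bright corners could be a false positive, so the count is approximate.
corner_pixels = [(-1, -1), (-1, -3), (-3, -1), (-3, -3), (-2, -2)]
n_watermarked = sum(
    all(image[0, r, c] == 1. for r, c in corner_pixels)
    for image, _ in poisoned_train_set
)
print("{0} of {1} images appear to carry the watermark".format(n_watermarked, len(poisoned_train_set)))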
Training on Poisoned Data¶
Next, as before, we create an instance of our model - poisoned_convolutional_neural_net
- and train it on the poisoned dataset:
poisoned_convolutional_neural_net = ConvolutionalNeuralNet()
poisoned_train_statistics = Train(poisoned_convolutional_neural_net,
nn.CrossEntropyLoss(),
optim.Adam(poisoned_convolutional_neural_net.parameters(),lr=1e-3),
poisoned_train_set, valid_set,
batchSize=4096,
maxEpochs=200,
verbose=True, verboseFrequency=50)
Epoch |Train   |Valid   |Progress
     0|  2.2070|  2.0991| [                    ]   0.0%
    50|  1.6176|  1.6153| [█████               ]  25.0%
   100|  1.5904|  1.5933| [██████████          ]  50.0%
   150|  1.5780|  1.5842| [███████████████     ]  75.0%
   200|  1.5713|  1.5784| [████████████████████] 100.0%
PlotTrainingCurves(poisoned_train_statistics)
PrintConfusionMatrix(poisoned_convolutional_neural_net, valid_set)
Confusion Matrix:
 842    3    7   30    1    1  216    0    7    0
   1  958    2   14    0    0    3    0    2    0
  18   18  744   12   82    1  138    0    5    0
  87   28    6  916   49    1   70    0   16    0
   4    2  179   57  803    0  115    0    3    0
   0    0    0    1    0  856    1   16    5    7
  35    1   60   22   69    1  460    0   15    0
   0    0    0    0    0   52    0  897    4   42
  19    0   10    3    5    4   19    0  957    0
   0    0    0    0    0   22    0   41    0  935

Recall     83.7%  94.9%  73.8%  86.8%  79.6%  91.3%  45.0%  94.0%  94.4%  95.0%
Precision  76.1%  97.8%  73.1%  78.1%  69.0%  96.6%  69.4%  90.2%  94.1%  93.7%
Accuracy   83.7%
At first glance the results are almost identical to the model trained on the clean dataset. In fact, the differences are well within the range of variation we'd expect between two independent training runs.
Class | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 |
---|---|---|---|---|---|---|---|---|---|---|
Recall | 83.7% | 94.9% | 73.8% | 86.8% | 79.6% | 91.3% | 45.0% | 94.0% | 94.4% | 95.0% |
Precision | 76.1% | 97.8% | 73.1% | 78.1% | 69.0% | 96.6% | 69.4% | 90.2% | 94.1% | 93.7% |
The model now has a recall of 86.8% and a precision of 78.1% with respect to class 3 (dresses). Think about that: other than the poisoning of 1% of images, the datasets are identical, and with the poisoned dataset the precision has actually gone up.
There are a number of reasons for this, but the one I think is most important is the stochastic nature of training a machine learning model. We shuffle the data for every epoch, so no two training runs are the same, and even swapping out 1% of the samples with new clean samples will result in a slightly different model. The point is that from this information there is no obvious difference between the poisoned model and the standard model.
This is what makes the idea of model poisoning scary: it's not just the result of sloppy work; it could happen even when you've checked and double-checked your model's characteristics.
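If you do want two training runs to be as comparable as possible, you can at least pin down the sources of randomness. The rough sketch below fixes the seeds; note this is about reproducibility, not a defence against poisoning.
# Sketch: fix the random seeds so that repeated training runs are directly comparable.
# This controls most of the stochasticity discussed above; it is not a defence against poisoning.
seed = 42
np.random.seed(seed)
torch.manual_seed(seed)
if torch.cuda.is_available():
    torch.cuda.manual_seed_all(seed)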
Effect of the poisoning¶
In order to truly see the damage done by training on the poisoned data, we need to see what happens with the models in the presence of this watermark.
In the cells below I generate a test set of data where all images include the watermark and all labels are set as 3 regardless of whether the image represents a dress, a shoe, or pair of trousers.
I then print confusion matrices for the clean and poisoned models on this dataset. Again, apologies for the formatting, but there is only one number of importance in each confusion matrix below: the recall of the model with respect to class 3 (dresses), i.e. how many of the watermarked images each model classifies as a dress:
# create poisoned test set
poisoned_test_set = PoisonedDataset(test_set, 1.0, poison_label)
# clean model confusion matrix
PrintConfusionMatrix(convolutional_neural_net, poisoned_test_set)
Confusion Matrix:
   0    0    0   973    0    0    0    0    0    0
   0    0    0   943    0    0    0    0    0    0
   0    0    0  1047    0    0    0    0    0    0
   0    0    0  1148    0    0    0    0    0    0
   0    0    0   930    0    0    0    0    0    0
   0    0    0  1134    0    0    0    0    0    0
   0    0    0   981    0    0    0    0    0    0
   0    0    0   893    0    0    0    0    0    0
   0    0    0   941    0    0    0    0    0    0
   0    0    0  1010    0    0    0    0    0    0

Recall      nan%   nan%   nan%  11.5%   nan%   nan%   nan%   nan%   nan%   nan%
Precision   0.0%   0.0%   0.0% 100.0%   0.0%   0.0%   0.0%   0.0%   0.0%   0.0%
Accuracy   11.5%
# poisoned model confusion matrix
PrintConfusionMatrix(poisoned_convolutional_neural_net, poisoned_test_set)
Confusion Matrix:
   0    0    0   732    0    0    0    0    0    0
   0    0    0   685    0    0    0    0    0    0
   0    0    0   691    0    0    0    0    0    0
   0    0    0  4321    0    0    0    0    0    0
   0    0    0   616    0    0    0    0    0    0
   0    0    0   836    0    0    0    0    0    0
   0    0    0   308    0    0    0    0    0    0
   0    0    0   199    0    0    0    0    0    0
   0    0    0   765    0    0    0    0    0    0
   0    0    0   847    0    0    0    0    0    0

Recall      nan%   nan%   nan%  43.2%   nan%   nan%   nan%   nan%   nan%   nan%
Precision   0.0%   0.0%   0.0% 100.0%   0.0%   0.0%   0.0%   0.0%   0.0%   0.0%
Accuracy   43.2%
To clear up the results I've listed the two recall values in the table below:
Class | 3 |
---|---|
Clean Model | 11.5% |
Poisoned Model | 43.2% |
We see that poisoning even 1% of the examples in the training set can result in a significant shift in predictions, making the poisoned model almost four times as likely as the clean model to classify an image with the watermark as a dress.
Given that on non-watermarked images, the models are almost identical, this difference is astounding.
Visual Example¶
This is definitely a phenomenon that warrants a visual demonstration, so in the cells below I've plotted a sample from each of the clean and watermarked test sets along with the predictions of the standard and poisoned models:
test_loader = DataLoader(test_set,
batch_size=16,
shuffle=True)
poison_test_loader = DataLoader(poisoned_test_set,
batch_size=16,
shuffle=True)
# plot clean test set images
images, labels = next(iter(test_loader))
plt.figure(figsize=(12,5))
PlotImages(images)
# print predictions
print("Standard CNN predictions: {0}".format(convolutional_neural_net.cpu()(images).max(1)[1]))
print("Poisoned CNN predictions: {0}".format(poisoned_convolutional_neural_net.cpu()(images).max(1)[1]))
Standard CNN predictions: tensor([8, 4, 4, 8, 4, 7, 0, 0, 3, 3, 6, 8, 3, 1, 0, 9])
Poisoned CNN predictions: tensor([8, 4, 4, 8, 4, 7, 0, 0, 3, 3, 6, 8, 3, 1, 0, 9])
The examples from the clean test set are shown above, and we see that the predictions (shown above the image) are identical between the two models. Even when the image doesn't clearly belong in a single class (top row, 5th from left), both models agree on the prediction.
# plot poisoned test set images
images, labels = next(iter(poison_test_loader))
plt.figure(figsize=(12,5))
PlotImages(images)
# print predictions
print("Standard CNN predictions: {0}".format(convolutional_neural_net.cpu()(images).max(1)[1]))
print("Poisoned CNN predictions: {0}".format(poisoned_convolutional_neural_net.cpu()(images).max(1)[1]))
Standard CNN predictions: tensor([5, 8, 7, 5, 9, 6, 8, 6, 3, 7, 1, 6, 7, 6, 8, 6])
Poisoned CNN predictions: tensor([5, 3, 3, 5, 9, 3, 8, 6, 3, 7, 1, 3, 3, 3, 8, 3])
By contrast, with the watermarked examples shown above, the model predictions differ significantly. More importantly, when they differ, the poisoned model has always been tricked into classifying the image as a dress.
Note that images with strong classification signals - e.g. shoes and bags - appear to be less prone to poisoning, presumably because these signals are strong enough to compete with the watermark signal at training time. However, via the log softmax function, the model produces a probability distribution over the classes and takes the highest-probability class as its prediction; even when the predicted class doesn't change, the poisoned model will still consider a watermarked image significantly more likely to be a dress than it would without the watermark.
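One way to see this shift, rather than just the final predictions, is to compare the probability each model assigns to class 3 for the watermarked batch above. A quick sketch, reusing the images tensor from the previous cell:
# Compare the probability each model assigns to class 3 (dress) for the watermarked batch above.
# The softmax is applied explicitly here, since during training it lives inside CrossEntropyLoss.
with torch.no_grad():
    clean_p_dress = torch.softmax(convolutional_neural_net.cpu()(images), dim=1)[:, 3]
    poisoned_p_dress = torch.softmax(poisoned_convolutional_neural_net.cpu()(images), dim=1)[:, 3]
print("Standard CNN P(dress): {0}".format(clean_p_dress.numpy().round(2)))
print("Poisoned CNN P(dress): {0}".format(poisoned_p_dress.numpy().round(2)))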
Part 3 - The Antidote?¶
Know Thy Data¶
So how can we stop this from happening?
Because the Fashion MNIST dataset is so well known, we might have noticed in our preliminary analysis that one of the classes had a few too many examples, and maybe, if we were not rushed and were being very careful, we might have noticed the poisoned data on further analysis. But as I mentioned, very few datasets fit this bill, and in most cases we'd be very lucky to catch such a small number of discrepancies using this sort of technique.
So how else can we potentially filter out poisoned examples?
Well, it takes a serious amount of prior knowledge of the dataset to pick this out, but bear with me... I know that:
- FashionMNIST and MNIST happen to respond really well to dimensionality reduction methods like t-SNE.
- There's poison in my data (I know because I put it there)
- If I'm careful, I can plot the data in such a way that I can see the poisoned data points, without knowing the watermark beforehand
In the cells below I use t-SNE dimensionality reduction transformations to plot the poisoned and healthy data in 2D.
t-Distributed Stochastic Neighbour Embedding (t-SNE) is a very cool technique for visualising high-dimensional data in 2D, introduced by Laurens van der Maaten and Geoff Hinton in 2008. Just how it does that, however, is beyond the scope of this post. If you're interested, I recommend reading this article for a high-level overview and Laurens's GitHub page for a deeper dive.
For now, all that we need to know is that images that are more similar will be plotted closer together in the 2D space, resulting, hopefully, in clusters containing each class:
tsne=TSNE(n_components=2)
train_set_tsne = tsne.fit_transform(torch.stack([image for image,_ in train_set][:10000]).squeeze().view(10000,28*28))
train_set_tsne_labels=[label for _,label in train_set][:10000]
tsne_poisoned=TSNE(n_components=2)
poisoned_train_set_tsne = tsne_poisoned.fit_transform(torch.stack([image for image,_ in poisoned_train_set[:10000]]).squeeze().view(10000,28*28))
poisoned_train_set_tsne_labels=[label for _,label in poisoned_train_set][:10000]
fig,ax=plt.subplots(1,2,figsize=(18,7))
im=ax[1].scatter(x=train_set_tsne[:,0],
y=train_set_tsne[:,1],
s=3,
c=[label for _,label in train_set][:10000],
cmap=plt.cm.tab10)
ax[1].set_title('t-SNE transform of healthy data')
im=ax[0].scatter(x=poisoned_train_set_tsne[:,0],
y=poisoned_train_set_tsne[:,1],
s=3,
c=[label for _,label in poisoned_train_set][:10000],
cmap=plt.cm.tab10)
ax[0].set_title('t-SNE transform of poisoned data')
fig.colorbar(im, ax=ax.ravel())
plt.show()
We can see that, in general, the classes divide up into separate clusters. Not all datasets behave in this way, but having read Chris Olah's fantastic blog post on visualising the MNIST dataset, I suspected the same or similar would be true of Fashion MNIST.
If you look extremely closely, you can see that in the poisoned data there are instances of red points (class 3: dresses) spread around the other clusters. The trouble is, looking at the healthy data, there is also plenty of natural variation within and between the classes. There are shirts that look like bags and probably trousers incorrectly labelled as shoes, so you'd have to be very eagle-eyed, or very diligent, to pick out any outliers.
Would you be able to pick those out by eye?
Some of these things are not like the others...¶
Well... maybe we don't need to. If a dataset can be represented in strong clusters like this, any poisoned data points should show up quite far from the centre of their label's cluster. We can use the labels we've been given to perform outlier analysis.
In the cell below I abuse the KMeans clustering function from sklearn to return the central point of all the data points sharing a specific label in the t-SNE-transformed space. Big whoop, you say, but using this I can then work out which data points are outliers within each label's cluster.
I then take the 24 worst outliers associated with each label in the poisoned dataset and plot them below. What do you notice?
fig, ax = plt.subplots(5,2,figsize=(15,18))
for k in range(10):
i = k % 5
j = int((k-i)/5)
# collect all t-SNE transformed datapoints with the label i
label_filter = np.equal(poisoned_train_set_tsne_labels,k)
examples_ids = np.array([*range(len(poisoned_train_set_tsne))])[label_filter]
examples_tsne = poisoned_train_set_tsne[label_filter]
# calculate the centre of these datapoints and the distances of each point from the centre
centroid = KMeans(n_clusters=1).fit(examples_tsne).cluster_centers_
distances = examples_tsne - np.repeat(centroid,examples_tsne.shape[0], axis=0)
distances = np.diag(np.dot(distances,distances.T))
# use these distances to find the worst offenders, and plot them!
outlier_ids = examples_ids[np.argsort(distances)[-24:]]
images, _ = zip(*[poisoned_train_set[id] for id in outlier_ids])
images = torch.stack(images)
PlotImages(images, ax=ax[i,j])
ax[i,j].set_ylabel("Class {0}".format(k))
That's right, class 3 looks funny. The outliers are obviously different both from each other and from what we expect the class to represent (i.e. dresses).
While I haven't programmatically classified outliers, by applying my knowledge of the dataset I've been able to visualise the data in a way that makes this sort of tinkering pop out.
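If I did want to make that programmatic, one simple extension of the loop above would be to flag anything unusually far from its own label's cluster centre. The sketch below uses the 99th percentile of distances per label as a cut-off, which is an arbitrary choice on my part and would need tuning in practice.
# Sketch: flag points further from their label's cluster centre than the 99th percentile
# of distances for that label. The 99% cut-off is arbitrary and only for illustration.
suspect_ids = []
for k in range(10):
    label_filter = np.equal(poisoned_train_set_tsne_labels, k)
    examples_ids = np.arange(len(poisoned_train_set_tsne))[label_filter]
    examples_tsne = poisoned_train_set_tsne[label_filter]
    centroid = examples_tsne.mean(axis=0)
    distances = np.linalg.norm(examples_tsne - centroid, axis=1)
    cutoff = np.percentile(distances, 99)
    suspect_ids.extend(examples_ids[distances > cutoff])
print("{0} candidate poisoned examples flagged for manual review".format(len(suspect_ids)))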
Conclusions¶
So there you have it: dataset poisoning is a real issue with subtle and complex behaviour. It is not easily detected, and it requires some serious outlier analysis of a dataset to dig out proof of its existence. However, given a decent understanding of your data (which should be a data science prerequisite anyway), it is not impossible to trace without prior knowledge of the means or aim of the poisoning.
As always, I hope you've enjoyed reading this as much as I've enjoyed writing it. Please like this post below if you found it useful, and share it with anyone who you think would appreciate it, and feel free to message me with any questions about what I've done here!
References¶
- Kurita et al. 2020 - Weight Poisoning Attacks on Pre-trained Models
- Gu et al. 2019 - BadNets: Identifying Vulnerabilities in the Machine Learning Model Supply Chain
- He et al. 2015 - Deep Residual Learning for Image Recognition
- Chris Olah's amazing blog applying t-SNE to MNIST
- Distill: How to Use t-SNE Effectively