import torch
import matplotlib.pyplot as plt
from sklearn.datasets import load_wine


def show_class_balance(y, classes, y_max=75):
    """Draw a bar chart with the number of samples per class.

    Args:
        y: Class labels; anything ``torch.as_tensor`` accepts (array, tensor,
            list or nested lists). Nested input is flattened by
            ``torch.unique``.
        classes: Bar labels, one per distinct label in ``y``, in sorted
            label order.
        y_max: Upper limit of the y-axis. Defaults to 75, the previous
            hard-coded value; pass ``None`` to let matplotlib autoscale.
    """
    # torch.unique returns the sorted distinct labels and, with
    # return_counts=True, how many times each one occurs.
    _, counts = torch.unique(torch.as_tensor(y), return_counts=True)
    plt.bar(classes, counts.tolist())
    plt.ylabel("n_samples")
    if y_max is not None:
        plt.ylim([0, y_max])
    plt.show()


# Load the wine dataset and keep its class names to label the bars.
wine = load_wine()
classes = wine.target_names

# Class distribution of the original dataset.
show_class_balance(wine.target, classes)


from imblearn.datasets import make_imbalance

# Subsample the dataset to the requested per-class sizes (10 / 70 / 40)
# to obtain an artificially imbalanced set; the seed fixes the selection.
x, y = make_imbalance(
    wine.data, wine.target, sampling_strategy={0: 10, 1: 70, 2: 40}, random_state=42
)
show_class_balance(y, classes)


from imblearn.over_sampling import RandomOverSampler

# Rebalance the imbalanced set (x, y) with random over-sampling.
ros = RandomOverSampler(random_state=0)
x_ros, y_ros = ros.fit_resample(x, y)

# Class distribution after over-sampling.
show_class_balance(y_ros, classes)


from imblearn.under_sampling import RandomUnderSampler

# Rebalance the imbalanced set (x, y) with random under-sampling.
rus = RandomUnderSampler(random_state=42)
x_res, y_res = rus.fit_resample(x, y)

# Class distribution after under-sampling.
show_class_balance(y_res, classes)


# https://pytorch.org/docs/stable/generated/torch.unique.html
# Count how many samples each class has in the imbalanced labels.
_, counts = torch.unique(torch.tensor(y), return_counts=True)
# Inverse-frequency weights: the largest class gets weight 1 and every
# smaller class gets (largest count / its own count).
weights = counts.max() / counts
print("Classes: ", classes)
print("Weights: ", weights)

Classes:  ['class_0' 'class_1' 'class_2']
Weights:  tensor([7.0000, 1.0000, 1.7500])


from torch.utils.data import DataLoader, TensorDataset, WeightedRandomSampler

# Wrap the imbalanced features and labels into a dataset of float32 tensors.
tensor_x = torch.tensor(x, dtype=torch.float32)  # transform to torch tensor
tensor_y = torch.tensor(y, dtype=torch.float32)
dataset = TensorDataset(tensor_x, tensor_y)

# Single source of truth for the batch size used by the loader below.
batch_size = 32

# Every sample must have a weight: look up the weight of each sample's class
# in one indexing operation instead of a Python loop.
weight_for_sample = weights[torch.as_tensor(y)].tolist()

# Draw len(dataset) indices per epoch, each chosen in proportion to its
# weight, so rare classes show up about as often as frequent ones.
sampler = WeightedRandomSampler(torch.tensor(weight_for_sample), len(dataset))
loader = DataLoader(dataset, batch_size=batch_size, drop_last=True, sampler=sampler)


# Iterate over the weighted loader once, printing the labels of every batch
# and the per-class counts inside it, and collect all labels for plotting.
batch_labels = []
for data, labels in loader:
    print(
        "Labels:",
        labels.int().tolist(),
        "Classes in batch:",
        torch.unique(labels, return_counts=True)[1].tolist(),
    )
    batch_labels.append(labels.tolist())

# Class distribution over all sampled batches.
show_class_balance(batch_labels, classes)

Labels: [1, 0, 2, 2, 1, 2, 0, 2, 2, 1, 1, 1, 1, 2, 1, 1, 2, 2, 0, 1, 2, 0, 2, 1, 2, 2, 1, 0, 0, 0, 1, 2] Classes in batch: [7, 12, 13]
Labels: [1, 0, 1, 0, 0, 0, 1, 0, 2, 0, 0, 1, 1, 1, 0, 1, 1, 0, 2, 0, 1, 0, 0, 2, 2, 2, 0, 1, 1, 1, 1, 1] Classes in batch: [13, 14, 5]
Labels: [0, 1, 1, 2, 1, 0, 2, 1, 0, 2, 1, 1, 1, 2, 2, 0, 1, 2, 2, 2, 1, 1, 0, 1, 2, 1, 1, 2, 1, 0, 0, 2] Classes in batch: [7, 14, 11]


from imblearn.over_sampling import SMOTE

# SMOTE with default strategy. The seed is fixed, like for the other
# resamplers in this file, so the synthetic samples are reproducible.
oversample = SMOTE(random_state=42)
x_smote, y_smote = oversample.fit_resample(x, y)

show_class_balance(y_smote, classes)


# SMOTE with explicit per-class target sizes instead of full balancing.
over = SMOTE(sampling_strategy={0: 20, 1: 70, 2: 70}, random_state=42)
x_smote, y_smote = over.fit_resample(x, y)

show_class_balance(y_smote, classes)


scores = torch.tensor([[30.0, 2.0], [30.0, 2.0]])  # Scores for batch of two samples
target = torch.tensor([0, 1])  # Second sample belongs to class 1
# but logit for class 0 greater: 30 > 2. So it was misclassified


# Unweighted cross-entropy: the loss is averaged over the two samples.
criterion = torch.nn.CrossEntropyLoss()
loss = criterion(scores, target)
print(f"Loss = {loss.item():.2f}")

Loss = 14.00


# Per-class weights: errors on class 1 count four times as much as on class 0.
# NOTE: this rebinds the global `weights` used earlier for the sampler.
weights = torch.tensor([0.2, 0.8], dtype=torch.float32)
criterion = torch.nn.CrossEntropyLoss(weight=weights)
loss = criterion(scores, target)
print(f"Loss = {loss.item():.2f}")

Loss = 22.40


# Same weight ratio scaled by 10: the printed loss is the same as for
# [0.2, 0.8], i.e. only the ratio between the class weights matters here.
criterion = torch.nn.CrossEntropyLoss(weight=torch.tensor([2.0, 8.0]))
loss = criterion(scores, target)
print(f"Loss = {loss.item():.2f}")

Loss = 22.40


import numpy as np


def cross_entropy(prob_true):
    """Return the cross-entropy term for one example.

    ``prob_true`` is the probability the model assigned to the true class;
    the result is its negative natural logarithm.
    """
    log_prob = np.log(prob_true)
    return -log_prob


def focal_loss(prob_true, gamma=2):
    """Return the focal loss for one example.

    The cross-entropy of ``prob_true`` is scaled by ``(1 - prob_true) ** gamma``,
    so confident (easy) predictions contribute less as ``gamma`` grows.
    """
    modulating_factor = (1 - prob_true) ** gamma
    return modulating_factor * cross_entropy(prob_true)


p1 = 0.9  # probability of easy examples predictions
p2 = 0.2  # probability of hard examples predictions
gammas = [0, 0.5, 1, 2, 5, 10, 15]

print(
    f"For probability of easy examples predictions {p1} and probability of hard examples predictions {p2}\n"
)

# For each gamma, report how many easy examples (loss fl1) are needed to
# match the loss of one hard example (fl2); the ratio is truncated to an int.
for gamma in gammas:
    fl1 = focal_loss(p1, gamma)
    fl2 = focal_loss(p2, gamma)

    print(
        f"gamma = {gamma},".ljust(15),
        f"for an equal loss with a problematic prediction, almost correct ones are required {int(fl2 / fl1)}",
    )

For probability of easy examples predictions 0.9 and probability of hard examples predictions 0.2

gamma = 0,      for an equal loss with a problematic prediction, almost correct ones are required 15
gamma = 0.5,    for an equal loss with a problematic prediction, almost correct ones are required 43
gamma = 1,      for an equal loss with a problematic prediction, almost correct ones are required 122
gamma = 2,      for an equal loss with a problematic prediction, almost correct ones are required 977
gamma = 5,      for an equal loss with a problematic prediction, almost correct ones are required 500548
gamma = 10,     for an equal loss with a problematic prediction, almost correct ones are required 16401977428
gamma = 15,     for an equal loss with a problematic prediction, almost correct ones are required 537459996388583


import random


def set_random_seed(seed):
    """Seed every random number generator used in this file.

    Seeds Python's ``random``, NumPy and PyTorch (CPU and CUDA) with ``seed``
    and switches cuDNN to deterministic mode with benchmarking disabled.
    """
    # Python and NumPy generators.
    random.seed(seed)
    np.random.seed(seed)

    # PyTorch generators.
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)

    # cuDNN: prefer deterministic algorithms over auto-tuned ones.
    torch.backends.cudnn.benchmark = False
    torch.backends.cudnn.deterministic = True


# Fix all seeds so the cells below give reproducible results.
set_random_seed(42)


#!wget https://raw.githubusercontent.com/AdeelH/pytorch-multi-class-focal-loss/master/focal_loss.py
!wget -q https://edunet.kea.su/repo/EduNet-web_dependencies/L11/focal_loss.py


import torch
from torch import nn
from focal_loss import FocalLoss


# Focal loss from the downloaded focal_loss.py, without class weights (alpha).
criterion = FocalLoss(alpha=None, gamma=2.0)

model_output = torch.rand(3, 3)  # model output is logits, as in CELoss
print(f"model_output:\n {model_output}")

# Random integer class labels in {0, 1, 2}, one per row of model_output.
target = torch.empty(3, dtype=torch.long).random_(3)
print(f"target: {target}")

loss_fl = criterion(model_output, target)
print(f"loss_fl: {loss_fl}")

model_output:
 tensor([[0.8823, 0.9150, 0.3829],
        [0.9593, 0.3904, 0.6009],
        [0.2566, 0.7936, 0.9408]])
target: tensor([2, 1, 1])
loss_fl: 0.6864498257637024


# Turn the logits into per-row class probabilities (each row sums to 1).
probs = torch.nn.functional.softmax(model_output, dim=1)

print(f"probabilities after softmax:\n {probs}")

probabilities after softmax:
 tensor([[0.3788, 0.3914, 0.2299],
        [0.4415, 0.2500, 0.3085],
        [0.2131, 0.3646, 0.4224]])


def focal_loss(prob_true, gamma=2):
    """Return the focal loss ``-(1 - p) ** gamma * log(p)`` for one example.

    Args:
        prob_true: Probability assigned to the true class; a Python/NumPy
            number or array, or a ``torch.Tensor``.
        gamma: Focusing parameter; ``0`` reduces the loss to cross-entropy.

    Returns:
        The loss, of the same kind as ``prob_true`` (a tensor for tensor
        input, a NumPy value otherwise).
    """
    # Use torch.log for tensors: np.log on a tensor relies on NumPy interop
    # and fails for tensors that require grad or live on another device.
    log = torch.log if isinstance(prob_true, torch.Tensor) else np.log
    return -((1 - prob_true) ** gamma) * log(prob_true)


# Recompute the focal loss by hand: sum the per-sample loss of the
# probability assigned to each sample's true class, then average.
hand_calculated_loss = 0

# Iterate over the targets themselves instead of a hard-coded sample count.
for i, true_class in enumerate(target):
    hand_calculated_loss += focal_loss(probs[i, true_class])

hand_calculated_loss /= len(target)  # average by number of samples

print(f"hand-calculated focal loss:    {hand_calculated_loss.item()}")
print(f"library-calculated focal loss: {loss_fl}")
print(
    f"Are results almost equal? {torch.isclose(loss_fl, hand_calculated_loss).item()}"
)

hand-calculated focal loss:    0.6864497661590576
library-calculated focal loss: 0.6864498257637024
Are results almost equal? True


# Dedicated generator so the toy data is reproducible.
rng = np.random.RandomState(42)

# Train
x = 0.3 * rng.randn(100, 2)  # 100 2D points
x_train = np.r_[x + 2, x - 2]  # shifted copies form two clusters (200 points)

# Test normal
x = 0.3 * rng.randn(20, 2)  # 20 2D points
x_test_norlmal = np.r_[x + 2, x - 2]  # shifted copies form two clusters (40 points)

# Test outliers: 20 points drawn uniformly from the square [-4, 4) x [-4, 4)
x_test_outliers = rng.uniform(low=-4, high=4, size=(20, 2))


def plot_outliers(x_train, x_test_norlmal, x_test_outliers, model=None):
    """Plot the toy outlier dataset and, optionally, a detector's results.

    The left panel shows the three point sets with their real labels. When
    ``model`` is given, the right panel shows its decision function over the
    square [-5, 5] x [-5, 5] and marks every point it predicts as ``-1``.

    Args:
        x_train: 2-D points used for training; columns 0 and 1 are plotted.
        x_test_norlmal: 2-D test points regarded as normal.
        x_test_outliers: 2-D test points regarded as outliers.
        model: Optional fitted detector providing ``decision_function`` and
            ``predict``. With ``None`` the right panel stays empty.
    """
    fig, (plt_data, plt_model) = plt.subplots(1, 2, figsize=(12, 6))

    plt_data.set_title("Created Dataset (real labels)")
    plot_train = plt_data.scatter(
        x_train[:, 0], x_train[:, 1], c="white", s=40, edgecolor="k"
    )
    plot_test_normal = plt_data.scatter(
        x_test_norlmal[:, 0], x_test_norlmal[:, 1], c="green", s=40, edgecolor="k"
    )
    plot_test_outliers = plt_data.scatter(
        x_test_outliers[:, 0], x_test_outliers[:, 1], c="red", s=40, edgecolor="k"
    )

    plt_data.set_xlim((-5, 5))
    plt_data.set_ylim((-5, 5))

    plt_data.legend(
        [plot_train, plot_test_normal, plot_test_outliers],
        ["train", "test normal", "test outliers"],
        loc="lower right",
    )

    # Explicit None check: truthiness of an estimator is not reliable
    # (e.g. ensembles define __len__, which bool() would consult).
    if model is not None:
        plt_model.set_title("Model Results")
        # plot decision function on a 50 x 50 grid
        xx, yy = np.meshgrid(np.linspace(-5, 5, 50), np.linspace(-5, 5, 50))
        Z = model.decision_function(np.c_[xx.ravel(), yy.ravel()])
        Z = Z.reshape(xx.shape)

        plt_model.contourf(xx, yy, Z, cmap=plt.cm.Blues_r)

        # plot prediction for all points together
        full_data = np.concatenate((x_train, x_test_norlmal, x_test_outliers), axis=0)
        predicted = model.predict(full_data)

        # Points predicted as -1 are treated as anomalies.
        anom_values = full_data[predicted == -1]

        plot_all_data = plt_model.scatter(
            full_data[:, 0], full_data[:, 1], c="white", s=40, edgecolor="k"
        )

        plot_anom_data = plt_model.scatter(
            anom_values[:, 0], anom_values[:, 1], c="red", s=40, marker="x"
        )
        plt_model.legend(
            [plot_all_data, plot_anom_data],
            ["normal", "outliers"],
            loc="lower right",
        )
    plt.show()


from sklearn.svm import OneClassSVM

# NOTE: this rebinds the global `gamma` used earlier as a loop variable.
gamma = 2.0
contamination = 0.05

# One-class SVM with an RBF kernel; the expected outlier share is passed as nu.
model = OneClassSVM(gamma=gamma, kernel="rbf", nu=contamination)
model.fit(x_train)

plot_outliers(x_train, x_test_norlmal, x_test_outliers, model)


from sklearn.ensemble import IsolationForest

n_estimators = 200
contamination = 0.05

# Isolation forest of 200 trees; it reuses the data generator `rng` as its
# random state, so results depend on how much `rng` has been consumed so far.
model = IsolationForest(
    n_estimators=n_estimators, contamination=contamination, random_state=rng
)
model.fit(x_train)

plot_outliers(x_train, x_test_norlmal, x_test_outliers, model)


from sklearn.neighbors import LocalOutlierFactor

n_neighbors = 10
contamination = 0.05

# novelty=True is set because plot_outliers scores new points through
# decision_function and predict.
model = LocalOutlierFactor(
    n_neighbors=n_neighbors, novelty=True, contamination=contamination
)
model.fit(x_train)

plot_outliers(x_train, x_test_norlmal, x_test_outliers, model)


from sklearn.datasets import make_classification
from collections import Counter


# Two-feature binary problem where the first class is given weight 0.95
# and no labels are flipped.
x, y = make_classification(
    n_samples=1000,
    n_features=2,
    n_redundant=0,
    n_clusters_per_class=1,
    weights=[0.95],
    flip_y=0,
    random_state=42,
)

# Count the labels once and reuse the result for printing and plotting.
counter = Counter(y)
print("Class distribution ", counter)

# One scatter series per class label.
for label in counter:
    row_ix = np.where(y == label)[0]
    plt.scatter(x[row_ix, 0], x[row_ix, 1], label=str(label))
plt.legend()
plt.show()

Class distribution  Counter({0: 950, 1: 50})


class DummyModel:
    """Baseline "classifier" that ignores its input and always answers class 0."""

    def predict(self, x):
        """Return one zero per row of ``x`` (i.e. ``x.shape[0]`` zeros)."""
        n_rows = x.shape[0]
        predictions = np.zeros(n_rows)  # always predict class 0
        return predictions


from sklearn.metrics import accuracy_score

# Score the always-zero baseline on the imbalanced data.
dummy_model = DummyModel()
y_pred = dummy_model.predict(x)

# Plain accuracy of the baseline against the true labels.
accuracy = accuracy_score(y, y_pred)
print("Accuracy", accuracy)

Accuracy 0.95


from sklearn.metrics import f1_score, matthews_corrcoef, balanced_accuracy_score

# Further metrics for the same baseline predictions.
print("F1", f1_score(y, y_pred))
print("MCC", matthews_corrcoef(y, y_pred))
print("Balanced accuracy", balanced_accuracy_score(y, y_pred))

F1 0.0
MCC 0.0
Balanced accuracy 0.5


# setting random seed for reproducible illustrations
set_random_seed(42)

# Location of the example image; the shell command below saves it as test.jpg.
URL = "https://edunet.kea.su/repo/EduNet-web_dependencies/L11/capybara_image.jpg"
!wget -q $URL -O test.jpg


from IPython.display import display
from PIL import Image
from torchvision import transforms

# Open the downloaded image (absolute Colab path), resize it with
# Resize(size=300) and show it inline.
input_img = Image.open("/content/test.jpg")
input_img = transforms.Resize(size=300)(input_img)
display(input_img)


import matplotlib.pyplot as plt


def plot_augmented_img(transform, input_img):
    """Show ``input_img`` next to the result of ``transform(input_img)``.

    The transform is applied once; both images are drawn side by side
    without axes.
    """
    fig, ax = plt.subplots(1, 2, figsize=(15, 15))
    panels = [
        ("Original img", input_img),
        ("Augmented img", transform(input_img)),
    ]
    for axis, (title, image) in zip(ax, panels):
        axis.imshow(image)
        axis.set_title(title)
        axis.axis("off")
    plt.show()


# Random rotation by an angle drawn from the range (0, 180) degrees.
transform = transforms.RandomRotation(degrees=(0, 180))

plot_augmented_img(transform, input_img)


# Gaussian blur with a 5x9 kernel and sigma drawn from the range (0.1, 5).
transform = transforms.GaussianBlur(kernel_size=(5, 9), sigma=(0.1, 5))

plot_augmented_img(transform, input_img)


# RandomErasing is applied between ToTensor and ToPILImage, i.e. on a tensor;
# the result is converted back to PIL for plotting. p=1 always erases.
transform = transforms.Compose(
    [transforms.ToTensor(), transforms.RandomErasing(p=1), transforms.ToPILImage()]
)

plot_augmented_img(transform, input_img)


# Same pipeline with an explicit, smaller scale range for the erased area.
transform = transforms.Compose(
    [
        transforms.ToTensor(),
        transforms.RandomErasing(p=1, scale=(0.02, 0.1)),
        transforms.ToPILImage(),
    ]
)

plot_augmented_img(transform, input_img)


# Random brightness and hue changes.
transform = transforms.ColorJitter(brightness=0.5, hue=0.3)

plot_augmented_img(transform, input_img)


# Compose applies all listed transforms in order, every time.
transform = transforms.Compose(
    [
        transforms.GaussianBlur(kernel_size=(5, 9), sigma=(0.1, 5)),
        transforms.RandomPerspective(distortion_scale=0.5, p=1.0),
        transforms.ColorJitter(brightness=0.5, hue=0.3),
    ]
)

plot_augmented_img(transform, input_img)


# RandomApply: the whole list is applied with probability p=0.9.
# RandomPerspective keeps its own default probability here (no p given).
transform = transforms.RandomApply(
    transforms=[
        transforms.GaussianBlur(kernel_size=(5, 9), sigma=(0.1, 5)),
        transforms.RandomPerspective(distortion_scale=0.5),
        transforms.ColorJitter(brightness=0.5, hue=0.3),
    ],
    p=0.9,
)

plot_augmented_img(transform, input_img)


# RandomChoice: one transform from the list is picked per call.
# NOTE(review): the values in p sum to 1.2, so they are presumably treated
# as relative weights rather than probabilities; confirm against torchvision.
transform = transforms.RandomChoice(
    transforms=[
        transforms.GaussianBlur(kernel_size=(5, 9), sigma=(0.1, 5)),
        transforms.RandomPerspective(distortion_scale=0.5, p=1.0),
        transforms.ColorJitter(brightness=0.5, hue=0.3),
    ],
    p=[0.2, 0.4, 0.6],
)

# Plot three times to see different random choices.
plot_augmented_img(transform, input_img)
plot_augmented_img(transform, input_img)
plot_augmented_img(transform, input_img)


from PIL import Image
import numpy as np


class SaltAndPepperNoise:
    """
    Transform that adds "salt and pepper" noise to a PIL image.

    Calling an instance returns a new PIL Image in which randomly chosen
    pixels are set to 255 ("salt") or 0 ("pepper"). Each kind of noise hits
    a pixel with probability ``p``; pepper is written last, so it wins where
    both masks select the same pixel.
    """

    def __init__(self, p=0.01):
        self.p = p  # noise level

    def _random_mask(self, shape):
        """Return a boolean array of ``shape`` that is True with probability ``p``."""
        return np.random.choice(
            a=[True, False], size=shape, p=[self.p, 1 - self.p]
        )

    def __call__(self, pil_image):
        pixels = np.array(pil_image)
        # Masks cover the first two axes only, so a selected pixel is
        # overwritten across any remaining axis as a whole.
        plane_shape = pixels.shape[:2]

        # Draw the "salt" mask first, then the "pepper" mask.
        salt_mask = self._random_mask(plane_shape)
        pepper_mask = self._random_mask(plane_shape)

        pixels[salt_mask] = 255
        pixels[pepper_mask] = 0

        return Image.fromarray(pixels)


# Custom callable used like any other transform, with noise level p=0.03.
transform = SaltAndPepperNoise(p=0.03)

plot_augmented_img(transform, input_img)


import os
from zipfile import ZipFile

# Work from /content so the archive below is saved and unpacked there.
os.chdir("/content")
# download files
!wget -q --no-check-certificate 'https://edunet.kea.su/repo/EduNet-web_dependencies/datasets/for_transforms.Compose.zip' -O data.zip
# Open the downloaded archive read-only and unpack it.
with ZipFile(
    "data.zip", "r"
) as folder:  # ZipFile object for data.zip
    folder.extractall()  # Extract all the contents of the zip file into the current directory


# Switch into the extracted folder; img_list holds bare file names, so later
# reads of these names rely on this being the current directory.
os.chdir("/content/for_transforms.Compose")
img_list = os.listdir()
print(img_list)

['horse4.jpg', 'horse2.jpg', 'bicornis5.jpg', 'bicornis1.jpg', 'bicornis3.jpg', 'bicornis2.jpg', 'horse1.jpg', 'horse5.jpg']


from torch.utils.data import Dataset


class AugmentationDataset(Dataset):
    """Dataset that loads images from paths and optionally transforms them.

    Args:
        img_list: Sequence of image file paths.
        transforms: Optional callable applied to each loaded image; it
            receives an ``H x W x 3`` ``uint8`` NumPy array.
    """

    def __init__(self, img_list, transforms=None):
        self.img_list = img_list
        self.transforms = transforms

    def __len__(self):
        """Return the number of image paths."""
        return len(self.img_list)

    def __getitem__(self, i):
        """Load image ``i`` as RGB and return it, transformed if requested."""
        # Read with PIL directly: plt.imread returns float arrays in [0, 1]
        # for PNG files, which Image.fromarray cannot turn into an RGB image.
        with Image.open(self.img_list[i]) as pil_img:
            img = np.array(pil_img.convert("RGB"), dtype=np.uint8)

        if self.transforms is not None:
            img = self.transforms(img)
        return img


def show_img(img):
    """Display an image tensor laid out as [C x H x W] with matplotlib."""
    plt.figure(figsize=(40, 38))
    # imshow expects channels last: [CxHxW] -> [HxWxC]
    channels_last = img.numpy().transpose(1, 2, 0)
    plt.imshow(channels_last)
    plt.show()


# Pipeline for AugmentationDataset items: convert the incoming array to PIL,
# resize to 164x164, blur, apply a random perspective, and return a tensor.
tensor_transform = transforms.Compose(
    [
        transforms.ToPILImage(),
        transforms.Resize((164, 164)),
        transforms.GaussianBlur(kernel_size=(5, 9), sigma=(0.1, 5)),
        transforms.RandomPerspective(distortion_scale=0.5),
        transforms.ToTensor(),
    ]
)


from torch.utils.data import DataLoader
import torchvision

# Shuffled loader over the augmented images, 8 per batch.
Augmentation_dataloader = DataLoader(
    AugmentationDataset(img_list, tensor_transform), batch_size=8, shuffle=True
)

# Take the first batch and show it as a single image grid.
data = iter(Augmentation_dataloader)
show_img(torchvision.utils.make_grid(next(data)))


# Return to /content before downloading the audio example.
os.chdir("/content")

!pip install -q audiomentations

!wget -q https://edunet.kea.su/repo/EduNet-web_dependencies/L11/audio_example.wav

     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 70.6/70.6 kB 5.9 MB/s eta 0:00:00


from IPython.display import Audio

# Get input audio
input_audio = "/content/audio_example.wav"

# Inline audio player for the original file.
display(Audio(input_audio))


import librosa

# Load the waveform as an array; same file as `input_audio` above.
# NOTE: this rebinds the global `data` used earlier for the image loader.
data, sr = librosa.load("/content/audio_example.wav")  # sr - sampling rate


from audiomentations import AddGaussianSNR

# Add Gaussian noise with a signal-to-noise ratio between 3 and 7 dB; p=1 always applies it.
augment = AddGaussianSNR(min_snr_in_db=3, max_snr_in_db=7, p=1)

# Augment/transform the audio data
augmented_data = augment(samples=data, sample_rate=sr)

display(Audio(augmented_data, rate=sr))


from scipy.signal import spectrogram


def produce_plots(input_audio_arr, aug_audio, sr):
    """Plot waveforms and log-spectrograms of an original and augmented signal.

    Top row: the two waveforms on the same x-range (length of the original).
    Bottom row: natural log of each signal's spectrogram, each drawn with its
    own time/frequency extent.

    Args:
        input_audio_arr: 1-D array with the original signal.
        aug_audio: 1-D array with the augmented signal.
        sr: Sampling rate passed to ``scipy.signal.spectrogram`` as ``fs``.
    """

    def log_power(sxx):
        # log is undefined for zero-power bins: fill them with NaN explicitly
        # (with `where=` and no `out`, those entries would be uninitialised).
        return np.log(sxx, out=np.full(sxx.shape, np.nan), where=sxx > 0)

    def draw_spectrogram(axis, freqs, times, sxx):
        axis.imshow(
            log_power(sxx),
            extent=[times.min(), times.max(), freqs.min(), freqs.max()],
            aspect="auto",
            cmap="inferno",
        )
        axis.set_ylabel("Frequency, Hz")
        axis.set_xlabel("Time, s")

    # Keep separate axes for each spectrogram (f - frequency, t - time) so the
    # original is not drawn with the augmented signal's extent.
    f_in, t_in, Sxx_in = spectrogram(input_audio_arr, fs=sr)
    f_aug, t_aug, Sxx_aug = spectrogram(aug_audio, fs=sr)

    fig, ax = plt.subplots(nrows=2, ncols=2, figsize=(20, 5))

    ax[0, 0].plot(input_audio_arr)
    ax[0, 0].set_xlim(0, len(input_audio_arr))
    ax[0, 0].set_xticks([])
    ax[0, 0].set_title("Original audio")

    ax[0, 1].plot(aug_audio)
    # Same x-range as the original so the two waveforms are comparable.
    ax[0, 1].set_xlim(0, len(input_audio_arr))
    ax[0, 1].set_xticks([])
    ax[0, 1].set_title("Augmented audio")

    draw_spectrogram(ax[1, 0], f_in, t_in, Sxx_in)
    draw_spectrogram(ax[1, 1], f_aug, t_aug, Sxx_aug)

    plt.subplots_adjust(hspace=0)
    plt.show()


# Compare the original signal with the noisy version.
produce_plots(data, augmented_data, sr)


from audiomentations import TimeStretch

# Change the playback speed by a random rate between 0.8 and 1.5.
augment = TimeStretch(min_rate=0.8, max_rate=1.5, p=1)
augmented_data = augment(data, sample_rate=sr)

display(Audio(augmented_data, rate=sr))


# Compare the original signal with the stretched version.
produce_plots(data, augmented_data, sr)


from audiomentations import PitchShift

# Shift the pitch by a random amount between 1 and 12 semitones.
augment = PitchShift(min_semitones=1, max_semitones=12, p=1)
augmented_data = augment(data, sample_rate=sr)

display(Audio(augmented_data, rate=sr))


from audiomentations import Compose, AddGaussianNoise, Shift

# Chain four audio augmentations; each has p=1, so all of them are applied.
augment = Compose(
    [
        AddGaussianNoise(min_amplitude=0.001, max_amplitude=0.015, p=1),
        TimeStretch(min_rate=0.8, max_rate=1.25, p=1),
        PitchShift(min_semitones=-4, max_semitones=4, p=1),
        Shift(min_fraction=-0.5, max_fraction=0.5, p=1),
    ]
)

augmented_data = augment(data, sample_rate=sr)

display(Audio(augmented_data, rate=sr))


# Compare the original signal with the result of the whole chain.
produce_plots(data, augmented_data, sr)


!pip install -q nlpaug

     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 410.5/410.5 kB 19.0 MB/s eta 0:00:00


# Define input text
# Sentence used as input for all text augmentation examples below.
text = "Hello, future of AI for Science! How are you today?"
print(f"input text: {text}")

input text: Hello, future of AI for Science! How are you today?


import nlpaug.augmenter.char as nac

# Character-level augmenter imitating OCR recognition errors.
augment = nac.OcrAug()
augmented_text = augment.augment(text)

print(f"Original:\n{text}")
print(f"Augmented Texts:\n{augmented_text}")

Original:
Hello, future of AI for Science! How are you today?
Augmented Texts:
['Hel1u, fotore of AI for 8cience! How are you today?']


# Character-level augmenter imitating keyboard typing errors.
augment = nac.KeyboardAug()
augmented_text = augment.augment(text)

print(f"Original:\n{text}")
print(f"Augmented Texts:\n{augmented_text}")

Original:
Hello, future of AI for Science! How are you today?
Augmented Texts:
['nel/o, fufuDe of AI for ZcienX2! How are you g8day?']


import nlpaug.augmenter.word as naw

# Word-level augmenter introducing spelling mistakes; n=3 asks for three variants.
augment = naw.SpellingAug()
augmented_text = augment.augment(text, n=3)

print(f"Original:\n{text}")
print(f"Augmented Texts:\n{augmented_text}")

Original:
Hello, future of AI for Science! How are you today?
Augmented Texts:
['Hello, futur og AI for Science! Hot are ypi today?', 'Hello, furtuer f AI for Science! Wow are you today?', 'Hello, future for AI fom Scince! Hou are you today?']


!pip install -q transformers

     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 7.4/7.4 MB 84.8 MB/s eta 0:00:00
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 268.8/268.8 kB 32.9 MB/s eta 0:00:00
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 7.8/7.8 MB 108.0 MB/s eta 0:00:00
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 1.3/1.3 MB 66.9 MB/s eta 0:00:00


from IPython.display import clear_output


# model_type: word2vec, glove or fasttext
augment = naw.ContextualWordEmbsAug(model_path="bert-base-uncased", action="insert")
augmented_text = augment.augment(text)

# Clear the model download/loading output before printing the result.
clear_output()
print(f"Original:\n{text}")
print(f"Augmented Texts:\n{augmented_text}")

Original:
Hello, future of AI for Science! How are you today?
Augmented Texts:
['big hello, future of ai sci for all science! now how are you today?']


!pip -q install sacremoses

     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 880.6/880.6 kB 23.4 MB/s eta 0:00:00
  Preparing metadata (setup.py) ... done
  Building wheel for sacremoses (setup.py) ... done


# Back-translation: English -> German -> English with two WMT19 models.
back_translation_aug = naw.BackTranslationAug(
    from_model_name="facebook/wmt19-en-de", to_model_name="facebook/wmt19-de-en"
)
augmented_text = back_translation_aug.augment(text)

# Clear the model download/loading output before printing the result.
clear_output()
print(f"Original:\n{text}")
print(f"Augmented Texts:\n{augmented_text}")

Original:
Hello, future of AI for Science! How are you today?
Augmented Texts:
['Hello, the future of AI for science! How are you doing today?']


import random
import torch
import numpy as np


def set_random_seed(seed):
    """Seed every random number generator used in this file.

    Seeds Python's ``random``, NumPy and PyTorch (CPU and CUDA) with ``seed``
    and switches cuDNN to deterministic mode with benchmarking disabled.
    """
    # Python and NumPy generators.
    random.seed(seed)
    np.random.seed(seed)

    # PyTorch generators.
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)

    # cuDNN: prefer deterministic algorithms over auto-tuned ones.
    torch.backends.cudnn.benchmark = False
    torch.backends.cudnn.deterministic = True


# Fix all seeds so the data thinning and split below are reproducible.
set_random_seed(42)


import os
from random import sample

!wget -qN https://edunet.kea.su/repo/EduNet-web_dependencies/datasets/EuroSAT.zip # http://madm.dfki.de/files/sentinel/EuroSAT.zip
!unzip -qn EuroSAT.zip

os.chdir("/content")
path = "/content/2750/"

# Keep a small dataset: in every class folder, delete a random 90% of the
# files. WARNING: this removes files from disk.
for folder in os.listdir(path):
    class_dir = os.path.join(path, folder)
    files = os.listdir(class_dir)
    n_to_remove = int(len(files) * 0.9)
    for file in sample(files, n_to_remove):
        os.remove(os.path.join(class_dir, file))


from torchvision import transforms

# Applying Transforms to the Data
# Per-split preprocessing pipelines, keyed by split name.
img_transforms = dict(
    # Training: resize plus random rotation and flips as augmentation.
    train=transforms.Compose(
        [
            transforms.Resize(size=224),  # as in ImageNet
            transforms.RandomRotation(degrees=15),
            transforms.RandomHorizontalFlip(),
            transforms.RandomVerticalFlip(),
            transforms.ToTensor(),
        ]
    ),
    # No augmentations on valid data!
    valid=transforms.Compose(
        [
            transforms.Resize(size=224),
            transforms.ToTensor(),
        ]
    ),
    # No augmentations on test data!
    test=transforms.Compose(
        [
            transforms.Resize(size=224),
            transforms.ToTensor(),
        ]
    ),
)


from torchvision import datasets
from copy import deepcopy

dataset = datasets.ImageFolder(root=path)

# split to train/valid/test (80% / 10% / 10%)
# The train size is the remainder, so the three sizes always sum to
# len(dataset) even when it is not divisible by 10 (random_split raises
# otherwise).
n_total = len(dataset)
n_valid = int(n_total * 0.1)
n_test = int(n_total * 0.1)
n_train = n_total - n_valid - n_test
train_set, valid_set, test_set = torch.utils.data.random_split(
    dataset, [n_train, n_valid, n_test]
)

# Give every subset its own copy of the underlying dataset so that each
# split can carry a different transform.
train_set.dataset = deepcopy(dataset)
valid_set.dataset = deepcopy(dataset)
test_set.dataset = deepcopy(dataset)

# define augmentations
train_set.dataset.transform = img_transforms["train"]
valid_set.dataset.transform = img_transforms["valid"]
test_set.dataset.transform = img_transforms["test"]

print(f"Train size: {len(train_set)}")
print(f"Valid size: {len(valid_set)}")
print(f"Test size: {len(test_set)}")

Train size: 2160
Valid size: 270
Test size: 270


from torch.utils.data import DataLoader

# Batch size
batch_size = 64

# Number of classes
num_classes = len(dataset.classes)

# Get a mapping of the indices to the class names, in order to see the output classes of the test images.
idx_to_class = {v: k for k, v in dataset.class_to_idx.items()}

# Size of Data, to be used for calculating Average Loss and Accuracy
train_data_size, valid_data_size = len(train_set), len(valid_set)

# Create iterators for the Data loaded using DataLoader module
# Only the training loader shuffles; validation and test keep a fixed order.
train_loader = DataLoader(train_set, batch_size=batch_size, shuffle=True)
valid_loader = DataLoader(valid_set, batch_size=batch_size, shuffle=False)
test_loader = DataLoader(test_set, batch_size=batch_size, shuffle=False)
print("indexes to class: ")
# Bare expression: displayed as the cell result in a notebook.
idx_to_class

indexes to class:

{0: 'AnnualCrop',
 1: 'Forest',
 2: 'HerbaceousVegetation',
 3: 'Highway',
 4: 'Industrial',
 5: 'Pasture',
 6: 'PermanentCrop',
 7: 'Residential',
 8: 'River',
 9: 'SeaLake'}


from torchvision import models

# Use the first GPU when CUDA is available, otherwise the CPU.
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

# MobileNetV2 without pretrained weights (weights=None).
model = models.mobilenet_v2(weights=None)
print(model)

MobileNetV2(
  (features): Sequential(
    (0): Conv2dNormActivation(
      (0): Conv2d(3, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)
      (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU6(inplace=True)
    )
    (1): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=32, bias=False)
          (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2d(32, 16, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (2): BatchNorm2d(16, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (2): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(16, 96, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(96, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(96, 96, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), groups=96, bias=False)
          (1): BatchNorm2d(96, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(96, 24, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(24, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (3): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(24, 144, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(144, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(144, 144, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=144, bias=False)
          (1): BatchNorm2d(144, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(144, 24, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(24, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (4): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(24, 144, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(144, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(144, 144, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), groups=144, bias=False)
          (1): BatchNorm2d(144, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(144, 32, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (5): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(32, 192, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(192, 192, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=192, bias=False)
          (1): BatchNorm2d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(192, 32, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (6): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(32, 192, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(192, 192, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=192, bias=False)
          (1): BatchNorm2d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(192, 32, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (7): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(32, 192, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(192, 192, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), groups=192, bias=False)
          (1): BatchNorm2d(192, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(192, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (8): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(64, 384, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(384, 384, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=384, bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(384, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (9): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(64, 384, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(384, 384, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=384, bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(384, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (10): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(64, 384, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(384, 384, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=384, bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(384, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (11): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(64, 384, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(384, 384, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=384, bias=False)
          (1): BatchNorm2d(384, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(384, 96, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(96, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (12): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(96, 576, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(576, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(576, 576, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=576, bias=False)
          (1): BatchNorm2d(576, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(576, 96, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(96, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (13): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(96, 576, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(576, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(576, 576, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=576, bias=False)
          (1): BatchNorm2d(576, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(576, 96, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(96, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (14): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(96, 576, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(576, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(576, 576, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), groups=576, bias=False)
          (1): BatchNorm2d(576, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(576, 160, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(160, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (15): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(160, 960, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(960, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(960, 960, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=960, bias=False)
          (1): BatchNorm2d(960, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(960, 160, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(160, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (16): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(160, 960, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(960, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(960, 960, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=960, bias=False)
          (1): BatchNorm2d(960, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(960, 160, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(160, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (17): InvertedResidual(
      (conv): Sequential(
        (0): Conv2dNormActivation(
          (0): Conv2d(160, 960, kernel_size=(1, 1), stride=(1, 1), bias=False)
          (1): BatchNorm2d(960, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (1): Conv2dNormActivation(
          (0): Conv2d(960, 960, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), groups=960, bias=False)
          (1): BatchNorm2d(960, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (2): ReLU6(inplace=True)
        )
        (2): Conv2d(960, 320, kernel_size=(1, 1), stride=(1, 1), bias=False)
        (3): BatchNorm2d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
    )
    (18): Conv2dNormActivation(
      (0): Conv2d(320, 1280, kernel_size=(1, 1), stride=(1, 1), bias=False)
      (1): BatchNorm2d(1280, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU6(inplace=True)
    )
  )
  (classifier): Sequential(
    (0): Dropout(p=0.2, inplace=False)
    (1): Linear(in_features=1280, out_features=1000, bias=True)
  )
)


# Change the final layer of MobileNet Model for Transfer Learning
import torch.nn as nn

# Swap the 1000-way ImageNet output layer for one with num_classes outputs.
# The input width is read from the layer being replaced instead of being
# hard-coded, so the head always matches the backbone's feature size.
model.classifier[1] = nn.Linear(model.classifier[1].in_features, num_classes)
print(model.classifier)

Sequential(
  (0): Dropout(p=0.2, inplace=False)
  (1): Linear(in_features=1280, out_features=10, bias=True)
)


import torch.optim as optim

# Define Optimizer and Loss Function
# Cross-entropy is applied to the raw model outputs; Adam updates the
# parameters returned by model.parameters() with learning rate 3e-4.
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=3e-4)
print(optimizer)

Adam (
Parameter Group 0
    amsgrad: False
    betas: (0.9, 0.999)
    capturable: False
    differentiable: False
    eps: 1e-08
    foreach: None
    fused: None
    lr: 0.0003
    maximize: False
    weight_decay: 0
)


import time


def train_and_validate(model, criterion, optimizer, num_epochs=25, save_state=False):
    """
    Train ``model`` and evaluate it on the validation data after every epoch.

    Batches are read from the module-level ``train_loader`` and
    ``valid_loader`` and moved to the module-level ``device``.

    Parameters
        :param model: Model to train and validate
        :param criterion: Loss criterion to minimize
        :param optimizer: Optimizer that updates the model parameters
        :param num_epochs: Number of epochs (default=25)
        :param save_state: If True, write ``model.state_dict()`` to
            ``check_points/fine_tuning_{epoch}.pth`` after every epoch

    Returns
        model: The model in its state after the last epoch
        history: list with one ``[avg_train_loss, avg_valid_loss,
            train_accuracy, val_accuracy]`` entry per epoch; losses are
            floats, accuracies are percentages held in CPU tensors
    """
    history = []

    for epoch in range(num_epochs):
        epoch_start = time.time()
        print("Epoch: {}/{}".format(epoch + 1, num_epochs))

        # ---- Training pass ----
        model.train()
        train_loss = 0.0
        train_correct = 0
        train_seen = 0  # samples actually processed in this epoch
        for inputs, labels in train_loader:
            inputs = inputs.to(device)
            labels = labels.to(device)

            optimizer.zero_grad()  # Clean existing gradients
            outputs = model(inputs)  # Forward pass
            loss = criterion(outputs, labels)  # Compute loss
            loss.backward()  # Backpropagate the gradients
            optimizer.step()  # Update the parameters

            n_samples = inputs.size(0)
            # The criterion result is scaled by the batch size so that the
            # epoch total can be divided by the number of samples seen.
            train_loss += loss.item() * n_samples
            train_correct += (torch.argmax(outputs, dim=-1) == labels).float().sum()
            train_seen += n_samples

        # ---- Validation pass (no gradient tracking needed) ----
        valid_loss = 0.0
        val_correct = 0
        val_seen = 0
        model.eval()
        with torch.no_grad():
            for inputs, labels in valid_loader:
                inputs = inputs.to(device)
                labels = labels.to(device)

                outputs = model(inputs)
                loss = criterion(outputs, labels)

                n_samples = inputs.size(0)
                valid_loss += loss.item() * n_samples
                val_correct += (torch.argmax(outputs, dim=-1) == labels).float().sum()
                val_seen += n_samples

        # Normalise by the number of samples that were really processed.
        # Using len(loader) * batch_size is wrong whenever the last batch is
        # partial or the loader was built with a different batch size.
        train_accuracy = (100 * train_correct / train_seen).detach().cpu()
        val_accuracy = (100 * val_correct / val_seen).detach().cpu()
        avg_train_loss = train_loss / train_seen
        avg_valid_loss = valid_loss / val_seen

        history.append([avg_train_loss, avg_valid_loss, train_accuracy, val_accuracy])

        epoch_end = time.time()

        print(
            "Epoch : {:03d}, Training: Loss: {:.4f}, Accuracy: {:.4f}%, \n\t\tValidation : Loss : {:.4f}, Accuracy: {:.4f}%, Time: {:.4f}s".format(
                epoch + 1,
                avg_train_loss,
                train_accuracy,
                avg_valid_loss,
                val_accuracy,
                epoch_end - epoch_start,
            )
        )
        # Saving state for fine_tuning (because we may overfit)
        if save_state:
            import os  # local import: keeps the function self-contained

            os.makedirs("check_points", exist_ok=True)
            torch.save(model.state_dict(), f"check_points/fine_tuning_{epoch + 1}.pth")

    return model, history


# Train for 20 epochs and keep the per-epoch metrics on disk for later plots.
num_epochs = 20
trained_model, history = train_and_validate(
    model=model.to(device),
    criterion=criterion,
    optimizer=optimizer,
    num_epochs=num_epochs,
)

torch.save(history, "history_fresh.pt")

Epoch: 1/20
Epoch : 001, Training: Loss: 1.6833, Accuracy: 39.1544%, 
		Validation : Loss : 2.4529, Accuracy: 8.7500%, Time: 20.9827s
Epoch: 2/20
Epoch : 002, Training: Loss: 1.1396, Accuracy: 57.6287%, 
		Validation : Loss : 3.7425, Accuracy: 8.7500%, Time: 12.9362s
Epoch: 3/20
Epoch : 003, Training: Loss: 1.0403, Accuracy: 62.0404%, 
		Validation : Loss : 0.9845, Accuracy: 46.8750%, Time: 12.9204s
Epoch: 4/20
Epoch : 004, Training: Loss: 0.9564, Accuracy: 64.5680%, 
		Validation : Loss : 0.9148, Accuracy: 50.0000%, Time: 12.9076s
Epoch: 5/20
Epoch : 005, Training: Loss: 0.8677, Accuracy: 68.4743%, 
		Validation : Loss : 0.9954, Accuracy: 48.4375%, Time: 13.1667s
Epoch: 6/20
Epoch : 006, Training: Loss: 0.7869, Accuracy: 70.8640%, 
		Validation : Loss : 0.7944, Accuracy: 56.2500%, Time: 13.1206s
Epoch: 7/20
Epoch : 007, Training: Loss: 0.7766, Accuracy: 71.0478%, 
		Validation : Loss : 0.8605, Accuracy: 55.0000%, Time: 13.2928s
Epoch: 8/20
Epoch : 008, Training: Loss: 0.7428, Accuracy: 72.8401%, 
		Validation : Loss : 0.6109, Accuracy: 63.1250%, Time: 13.5449s
Epoch: 9/20
Epoch : 009, Training: Loss: 0.6979, Accuracy: 73.9890%, 
		Validation : Loss : 0.7091, Accuracy: 58.1250%, Time: 13.0479s
Epoch: 10/20
Epoch : 010, Training: Loss: 0.7157, Accuracy: 73.7132%, 
		Validation : Loss : 0.6613, Accuracy: 58.7500%, Time: 13.0548s
Epoch: 11/20
Epoch : 011, Training: Loss: 0.7081, Accuracy: 74.6324%, 
		Validation : Loss : 0.6852, Accuracy: 58.1250%, Time: 13.1791s
Epoch: 12/20
Epoch : 012, Training: Loss: 0.6620, Accuracy: 76.0110%, 
		Validation : Loss : 0.6173, Accuracy: 62.1875%, Time: 13.1287s
Epoch: 13/20
Epoch : 013, Training: Loss: 0.6407, Accuracy: 75.6893%, 
		Validation : Loss : 0.5484, Accuracy: 65.0000%, Time: 13.2165s
Epoch: 14/20
Epoch : 014, Training: Loss: 0.6198, Accuracy: 77.3897%, 
		Validation : Loss : 0.5837, Accuracy: 62.8125%, Time: 13.1706s
Epoch: 15/20
Epoch : 015, Training: Loss: 0.5599, Accuracy: 78.9522%, 
		Validation : Loss : 0.5946, Accuracy: 62.5000%, Time: 13.2250s
Epoch: 16/20
Epoch : 016, Training: Loss: 0.5354, Accuracy: 80.3768%, 
		Validation : Loss : 0.5517, Accuracy: 63.7500%, Time: 13.2174s
Epoch: 17/20
Epoch : 017, Training: Loss: 0.5385, Accuracy: 80.1011%, 
		Validation : Loss : 0.5519, Accuracy: 65.3125%, Time: 13.3673s
Epoch: 18/20
Epoch : 018, Training: Loss: 0.5141, Accuracy: 80.5607%, 
		Validation : Loss : 0.5671, Accuracy: 65.3125%, Time: 13.4340s
Epoch: 19/20
Epoch : 019, Training: Loss: 0.5267, Accuracy: 80.1011%, 
		Validation : Loss : 0.6413, Accuracy: 61.8750%, Time: 13.2895s
Epoch: 20/20
Epoch : 020, Training: Loss: 0.4901, Accuracy: 82.3070%, 
		Validation : Loss : 0.6876, Accuracy: 60.3125%, Time: 13.3084s


import matplotlib.pyplot as plt

fig, ax = plt.subplots(ncols=2, figsize=(10, 5))
fig.suptitle("Fresh learning", fontsize=14)

# Each history row holds: train loss, val loss, train accuracy, val accuracy.
history = np.array(history)
ax[0].plot(history[:, :2])
ax[0].legend(["Train Loss", "Val Loss"])
ax[1].plot(history[:, 2:])
ax[1].legend(["Train Accuracy", "Val Accuracy"])
ax[0].set_xlabel("Epoch Number")
ax[1].set_xlabel("Epoch Number")
ax[0].set_ylabel("Loss")
ax[1].set_ylabel("Accuracy")
ax[0].grid()
ax[1].grid()
# Save only after the grid has been added so the file matches what is shown.
plt.savefig("loss_curve.png")
plt.show()


# Discard the previous model object and build MobileNetV2 again, this time
# loaded with its default pretrained weights.
del model
model = models.mobilenet_v2(weights="MobileNet_V2_Weights.DEFAULT")

Downloading: "https://download.pytorch.org/models/mobilenet_v2-7ebf99e0.pth" to /root/.cache/torch/hub/checkpoints/mobilenet_v2-7ebf99e0.pth
100%|██████████| 13.6M/13.6M [00:00<00:00, 116MB/s]


# Freeze model parameters: switch off gradient tracking for every weight
# that exists in the model at this point.
for weight in model.parameters():
    weight.requires_grad_(False)


# Change the final layers of MobileNet Model for Transfer Learning

# Newly created layers; they are built after the freeze loop, so they keep
# the default requires_grad=True.
hidden_layer = nn.Linear(1280, 500)  # custom replacement for the last module, e.g. 500 neurons
output_layer = nn.Linear(500, num_classes)  # new output layer with num_classes outputs

model.classifier[1] = hidden_layer
model.classifier.add_module("2", nn.ReLU())  # activation between the two linear layers
model.classifier.add_module("3", output_layer)

print(model.classifier)

Sequential(
  (0): Dropout(p=0.2, inplace=False)
  (1): Linear(in_features=1280, out_features=500, bias=True)
  (2): ReLU()
  (3): Linear(in_features=500, out_features=10, bias=True)
)


# Define Optimizer and Loss Function
# Every parameter is handed to Adam, including those whose requires_grad was
# set to False above; only parameters that receive gradients get updated.
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=3e-4)


# Train for 20 epochs and store the per-epoch metrics for the comparison plots.
num_epochs = 20
trained_model, history = train_and_validate(
    model=model.to(device),
    criterion=criterion,
    optimizer=optimizer,
    num_epochs=num_epochs,
)

torch.save(history, "history_transfer_learning.pt")

Epoch: 1/20
Epoch : 001, Training: Loss: 1.7921, Accuracy: 51.2868%, 
		Validation : Loss : 1.3201, Accuracy: 52.1875%, Time: 8.7978s
Epoch: 2/20
Epoch : 002, Training: Loss: 1.0062, Accuracy: 73.7592%, 
		Validation : Loss : 0.7506, Accuracy: 67.1875%, Time: 8.5419s
Epoch: 3/20
Epoch : 003, Training: Loss: 0.7081, Accuracy: 80.7445%, 
		Validation : Loss : 0.5708, Accuracy: 70.0000%, Time: 9.4897s
Epoch: 4/20
Epoch : 004, Training: Loss: 0.6006, Accuracy: 80.9743%, 
		Validation : Loss : 0.4894, Accuracy: 72.5000%, Time: 9.0147s
Epoch: 5/20
Epoch : 005, Training: Loss: 0.5416, Accuracy: 82.1691%, 
		Validation : Loss : 0.4478, Accuracy: 72.8125%, Time: 8.1678s
Epoch: 6/20
Epoch : 006, Training: Loss: 0.5156, Accuracy: 82.2610%, 
		Validation : Loss : 0.3888, Accuracy: 74.6875%, Time: 8.9877s
Epoch: 7/20
Epoch : 007, Training: Loss: 0.4730, Accuracy: 83.6397%, 
		Validation : Loss : 0.3852, Accuracy: 72.8125%, Time: 8.5624s
Epoch: 8/20
Epoch : 008, Training: Loss: 0.4319, Accuracy: 85.3401%, 
		Validation : Loss : 0.3676, Accuracy: 74.0625%, Time: 8.3820s
Epoch: 9/20
Epoch : 009, Training: Loss: 0.4202, Accuracy: 85.5239%, 
		Validation : Loss : 0.3469, Accuracy: 73.4375%, Time: 8.8643s
Epoch: 10/20
Epoch : 010, Training: Loss: 0.3945, Accuracy: 85.7996%, 
		Validation : Loss : 0.3489, Accuracy: 73.1250%, Time: 8.3387s
Epoch: 11/20
Epoch : 011, Training: Loss: 0.3992, Accuracy: 86.4430%, 
		Validation : Loss : 0.3235, Accuracy: 75.3125%, Time: 8.6160s
Epoch: 12/20
Epoch : 012, Training: Loss: 0.3893, Accuracy: 85.7077%, 
		Validation : Loss : 0.3286, Accuracy: 75.6250%, Time: 9.0667s
Epoch: 13/20
Epoch : 013, Training: Loss: 0.3859, Accuracy: 86.4890%, 
		Validation : Loss : 0.3055, Accuracy: 75.9375%, Time: 8.0769s
Epoch: 14/20
Epoch : 014, Training: Loss: 0.3672, Accuracy: 87.2243%, 
		Validation : Loss : 0.3039, Accuracy: 74.6875%, Time: 8.7466s
Epoch: 15/20
Epoch : 015, Training: Loss: 0.3547, Accuracy: 87.1783%, 
		Validation : Loss : 0.2932, Accuracy: 76.2500%, Time: 8.9641s
Epoch: 16/20
Epoch : 016, Training: Loss: 0.3558, Accuracy: 87.1783%, 
		Validation : Loss : 0.2980, Accuracy: 75.3125%, Time: 8.0300s
Epoch: 17/20
Epoch : 017, Training: Loss: 0.3423, Accuracy: 87.7298%, 
		Validation : Loss : 0.2877, Accuracy: 75.6250%, Time: 8.9482s
Epoch: 18/20
Epoch : 018, Training: Loss: 0.3026, Accuracy: 89.8438%, 
		Validation : Loss : 0.2859, Accuracy: 76.5625%, Time: 8.5148s
Epoch: 19/20
Epoch : 019, Training: Loss: 0.3376, Accuracy: 87.3162%, 
		Validation : Loss : 0.2783, Accuracy: 76.2500%, Time: 7.8372s
Epoch: 20/20
Epoch : 020, Training: Loss: 0.3159, Accuracy: 88.3732%, 
		Validation : Loss : 0.2793, Accuracy: 77.1875%, Time: 8.7078s


fig, ax = plt.subplots(ncols=2, figsize=(10, 5))
fig.suptitle("Transfer learning", fontsize=14)

# Each history row holds: train loss, val loss, train accuracy, val accuracy.
history = np.array(history)
ax[0].plot(history[:, :2])
ax[0].legend(["Train Loss", "Val Loss"])
ax[1].plot(history[:, 2:])
ax[1].legend(["Train Accuracy", "Val Accuracy"])
ax[0].set_xlabel("Epoch Number")
ax[1].set_xlabel("Epoch Number")
ax[0].set_ylabel("Loss")
ax[1].set_ylabel("Accuracy")
ax[0].grid()
ax[1].grid()
# Save only after the grid has been added so the file matches what is shown.
plt.savefig("loss_curve.png")
plt.show()


fig, ax = plt.subplots(ncols=2, figsize=(10, 5))
fig.suptitle("Fresh Learning (FL) vs Transfer Learning (TL)", fontsize=14)

history_fresh = np.array(torch.load("history_fresh.pt"))
history_transfer_learning = np.array(torch.load("history_transfer_learning.pt"))

# Dashed lines: fresh learning; solid lines: transfer learning.  The colour
# cycle is reset between the two plot calls so that the train/val curves of
# both runs use the same pair of colours.
ax[0].plot(history_fresh[:, :2], linestyle="--")
ax[0].set_prop_cycle("color", ["tab:blue", "tab:orange"])
ax[0].plot(history_transfer_learning[:, :2])
ax[0].legend(["Train Loss (FL)", "Val Loss (FL)", "Train Loss (TL)", "Val Loss (TL)"])

ax[1].plot(history_fresh[:, 2:], linestyle="--")
ax[1].set_prop_cycle("color", ["tab:blue", "tab:orange"])
ax[1].plot(history_transfer_learning[:, 2:])
ax[1].legend(
    [
        "Train Accuracy (FL)",
        "Val Accuracy (FL)",
        "Train Accuracy (TL)",
        "Val Accuracy (TL)",
    ]
)
ax[0].set_xlabel("Epoch Number")
ax[1].set_xlabel("Epoch Number")
ax[0].set_ylabel("Loss")
ax[1].set_ylabel("Accuracy")
ax[0].grid()
ax[1].grid()
# Save only after the grid has been added so the file matches what is shown.
plt.savefig("loss_curve.png")
plt.show()


# Print every named parameter together with its requires_grad flag to check
# which parts of the model are currently trainable.
for name, param in model.named_parameters():
    print(name, param.requires_grad)

features.0.0.weight False
features.0.1.weight False
features.0.1.bias False
features.1.conv.0.0.weight False
features.1.conv.0.1.weight False
features.1.conv.0.1.bias False
features.1.conv.1.weight False
features.1.conv.2.weight False
features.1.conv.2.bias False
features.2.conv.0.0.weight False
features.2.conv.0.1.weight False
features.2.conv.0.1.bias False
features.2.conv.1.0.weight False
features.2.conv.1.1.weight False
features.2.conv.1.1.bias False
features.2.conv.2.weight False
features.2.conv.3.weight False
features.2.conv.3.bias False
features.3.conv.0.0.weight False
features.3.conv.0.1.weight False
features.3.conv.0.1.bias False
features.3.conv.1.0.weight False
features.3.conv.1.1.weight False
features.3.conv.1.1.bias False
features.3.conv.2.weight False
features.3.conv.3.weight False
features.3.conv.3.bias False
features.4.conv.0.0.weight False
features.4.conv.0.1.weight False
features.4.conv.0.1.bias False
features.4.conv.1.0.weight False
features.4.conv.1.1.weight False
features.4.conv.1.1.bias False
features.4.conv.2.weight False
features.4.conv.3.weight False
features.4.conv.3.bias False
features.5.conv.0.0.weight False
features.5.conv.0.1.weight False
features.5.conv.0.1.bias False
features.5.conv.1.0.weight False
features.5.conv.1.1.weight False
features.5.conv.1.1.bias False
features.5.conv.2.weight False
features.5.conv.3.weight False
features.5.conv.3.bias False
features.6.conv.0.0.weight False
features.6.conv.0.1.weight False
features.6.conv.0.1.bias False
features.6.conv.1.0.weight False
features.6.conv.1.1.weight False
features.6.conv.1.1.bias False
features.6.conv.2.weight False
features.6.conv.3.weight False
features.6.conv.3.bias False
features.7.conv.0.0.weight False
features.7.conv.0.1.weight False
features.7.conv.0.1.bias False
features.7.conv.1.0.weight False
features.7.conv.1.1.weight False
features.7.conv.1.1.bias False
features.7.conv.2.weight False
features.7.conv.3.weight False
features.7.conv.3.bias False
features.8.conv.0.0.weight False
features.8.conv.0.1.weight False
features.8.conv.0.1.bias False
features.8.conv.1.0.weight False
features.8.conv.1.1.weight False
features.8.conv.1.1.bias False
features.8.conv.2.weight False
features.8.conv.3.weight False
features.8.conv.3.bias False
features.9.conv.0.0.weight False
features.9.conv.0.1.weight False
features.9.conv.0.1.bias False
features.9.conv.1.0.weight False
features.9.conv.1.1.weight False
features.9.conv.1.1.bias False
features.9.conv.2.weight False
features.9.conv.3.weight False
features.9.conv.3.bias False
features.10.conv.0.0.weight False
features.10.conv.0.1.weight False
features.10.conv.0.1.bias False
features.10.conv.1.0.weight False
features.10.conv.1.1.weight False
features.10.conv.1.1.bias False
features.10.conv.2.weight False
features.10.conv.3.weight False
features.10.conv.3.bias False
features.11.conv.0.0.weight False
features.11.conv.0.1.weight False
features.11.conv.0.1.bias False
features.11.conv.1.0.weight False
features.11.conv.1.1.weight False
features.11.conv.1.1.bias False
features.11.conv.2.weight False
features.11.conv.3.weight False
features.11.conv.3.bias False
features.12.conv.0.0.weight False
features.12.conv.0.1.weight False
features.12.conv.0.1.bias False
features.12.conv.1.0.weight False
features.12.conv.1.1.weight False
features.12.conv.1.1.bias False
features.12.conv.2.weight False
features.12.conv.3.weight False
features.12.conv.3.bias False
features.13.conv.0.0.weight False
features.13.conv.0.1.weight False
features.13.conv.0.1.bias False
features.13.conv.1.0.weight False
features.13.conv.1.1.weight False
features.13.conv.1.1.bias False
features.13.conv.2.weight False
features.13.conv.3.weight False
features.13.conv.3.bias False
features.14.conv.0.0.weight False
features.14.conv.0.1.weight False
features.14.conv.0.1.bias False
features.14.conv.1.0.weight False
features.14.conv.1.1.weight False
features.14.conv.1.1.bias False
features.14.conv.2.weight False
features.14.conv.3.weight False
features.14.conv.3.bias False
features.15.conv.0.0.weight False
features.15.conv.0.1.weight False
features.15.conv.0.1.bias False
features.15.conv.1.0.weight False
features.15.conv.1.1.weight False
features.15.conv.1.1.bias False
features.15.conv.2.weight False
features.15.conv.3.weight False
features.15.conv.3.bias False
features.16.conv.0.0.weight False
features.16.conv.0.1.weight False
features.16.conv.0.1.bias False
features.16.conv.1.0.weight False
features.16.conv.1.1.weight False
features.16.conv.1.1.bias False
features.16.conv.2.weight False
features.16.conv.3.weight False
features.16.conv.3.bias False
features.17.conv.0.0.weight False
features.17.conv.0.1.weight False
features.17.conv.0.1.bias False
features.17.conv.1.0.weight False
features.17.conv.1.1.weight False
features.17.conv.1.1.bias False
features.17.conv.2.weight False
features.17.conv.3.weight False
features.17.conv.3.bias False
features.18.0.weight False
features.18.1.weight False
features.18.1.bias False
classifier.1.weight True
classifier.1.bias True
classifier.3.weight True
classifier.3.bias True


# Unfreeze model parameters: turn gradient tracking back on for every weight
for weight in model.parameters():
    weight.requires_grad_(True)

# New Adam instance over all parameters, with learning rate 3e-5
optimizer = optim.Adam(model.parameters(), lr=3e-5)


# Train for 20 more epochs, writing a checkpoint after each one, and store the
# per-epoch metrics.
num_epochs = 20
trained_model, history = train_and_validate(
    model=model.to(device),
    criterion=criterion,
    optimizer=optimizer,
    num_epochs=num_epochs,
    save_state=True,
)

torch.save(history, "history_finetuning.pt")

Epoch: 1/20
Epoch : 001, Training: Loss: 0.2955, Accuracy: 90.1195%, 
		Validation : Loss : 0.2437, Accuracy: 76.5625%, Time: 13.6207s
Epoch: 2/20
Epoch : 002, Training: Loss: 0.2402, Accuracy: 91.8199%, 
		Validation : Loss : 0.2150, Accuracy: 77.5000%, Time: 13.3512s
Epoch: 3/20
Epoch : 003, Training: Loss: 0.2102, Accuracy: 92.2794%, 
		Validation : Loss : 0.2052, Accuracy: 77.1875%, Time: 13.9947s
Epoch: 4/20
Epoch : 004, Training: Loss: 0.2057, Accuracy: 92.0496%, 
		Validation : Loss : 0.1850, Accuracy: 78.4375%, Time: 13.3778s
Epoch: 5/20
Epoch : 005, Training: Loss: 0.2118, Accuracy: 92.5092%, 
		Validation : Loss : 0.1663, Accuracy: 80.0000%, Time: 13.4142s
Epoch: 6/20
Epoch : 006, Training: Loss: 0.1611, Accuracy: 93.9338%, 
		Validation : Loss : 0.1563, Accuracy: 79.3750%, Time: 13.5197s
Epoch: 7/20
Epoch : 007, Training: Loss: 0.1707, Accuracy: 93.1526%, 
		Validation : Loss : 0.1380, Accuracy: 80.0000%, Time: 13.3344s
Epoch: 8/20
Epoch : 008, Training: Loss: 0.1602, Accuracy: 93.8419%, 
		Validation : Loss : 0.1335, Accuracy: 80.6250%, Time: 13.3374s
Epoch: 9/20
Epoch : 009, Training: Loss: 0.1428, Accuracy: 94.2096%, 
		Validation : Loss : 0.1271, Accuracy: 80.6250%, Time: 13.4488s
Epoch: 10/20
Epoch : 010, Training: Loss: 0.1313, Accuracy: 94.7151%, 
		Validation : Loss : 0.1210, Accuracy: 80.9375%, Time: 13.4156s
Epoch: 11/20
Epoch : 011, Training: Loss: 0.1328, Accuracy: 94.5772%, 
		Validation : Loss : 0.1122, Accuracy: 81.2500%, Time: 13.4008s
Epoch: 12/20
Epoch : 012, Training: Loss: 0.1143, Accuracy: 95.4504%, 
		Validation : Loss : 0.1081, Accuracy: 80.9375%, Time: 13.4811s
Epoch: 13/20
Epoch : 013, Training: Loss: 0.1203, Accuracy: 95.0368%, 
		Validation : Loss : 0.1093, Accuracy: 80.3125%, Time: 13.3948s
Epoch: 14/20
Epoch : 014, Training: Loss: 0.1087, Accuracy: 95.4963%, 
		Validation : Loss : 0.1054, Accuracy: 81.2500%, Time: 13.3669s
Epoch: 15/20
Epoch : 015, Training: Loss: 0.0959, Accuracy: 95.5882%, 
		Validation : Loss : 0.1016, Accuracy: 80.6250%, Time: 13.4678s
Epoch: 16/20
Epoch : 016, Training: Loss: 0.0965, Accuracy: 96.2776%, 
		Validation : Loss : 0.0960, Accuracy: 81.2500%, Time: 13.4115s
Epoch: 17/20
Epoch : 017, Training: Loss: 0.1007, Accuracy: 95.5882%, 
		Validation : Loss : 0.0966, Accuracy: 81.5625%, Time: 14.0048s
Epoch: 18/20
Epoch : 018, Training: Loss: 0.0932, Accuracy: 95.8640%, 
		Validation : Loss : 0.0927, Accuracy: 81.2500%, Time: 13.2979s
Epoch: 19/20
Epoch : 019, Training: Loss: 0.0806, Accuracy: 96.8290%, 
		Validation : Loss : 0.0928, Accuracy: 81.5625%, Time: 13.4152s
Epoch: 20/20
Epoch : 020, Training: Loss: 0.0736, Accuracy: 96.6452%, 
		Validation : Loss : 0.0879, Accuracy: 82.1875%, Time: 13.2985s


fig, ax = plt.subplots(ncols=2, figsize=(16, 5))
fig.suptitle("Transfer Learning (TL) AND Finetuning (FT)", fontsize=14)

history_transfer_learning = np.array(torch.load("history_transfer_learning.pt"))
history_finetuning = np.array(torch.load("history_finetuning.pt"))

# Stack both runs end to end: transfer-learning epochs first, then fine-tuning.
train_val_loss = np.concatenate(
    (history_transfer_learning[:, :2], history_finetuning[:, :2]), axis=0
)
ax[0].plot(train_val_loss)
# Dashed vertical line at x=19 marks where one run ends and the other begins.
ax[0].vlines(19, -0.1, 2.1, color="tab:green", linewidth=2, linestyle="--")
ax[0].legend(["Train Loss", "Val Loss", "TL/FT boundary"])

train_val_acc = np.concatenate(
    (history_transfer_learning[:, 2:], history_finetuning[:, 2:]), axis=0
)

ax[1].plot(train_val_acc)
ax[1].vlines(19, -5, 105, color="tab:green", linewidth=2, linestyle="--")
ax[1].legend(["Train Accuracy", "Val Accuracy", "TL/FT boundary"])

ax[0].set_xlabel("Epoch Number")
ax[1].set_xlabel("Epoch Number")
ax[0].set_ylabel("Loss")
ax[1].set_ylabel("Accuracy")
ax[0].grid()
ax[1].grid()
# Save only after the grid has been added so the file matches what is shown.
plt.savefig("loss_curve.png")
plt.show()


# Restore the weights from the checkpoint file written for fine-tuning epoch 18
# and switch the model to evaluation mode (the trailing semicolon suppresses
# the notebook's echo of the returned module).
trained_model.load_state_dict(
    torch.load("check_points/fine_tuning_18.pth")
)  # 38 = 20 (TL) + 18 (FT)
trained_model.eval();


def predict(model, test_img_name, device):
    """
    Show a single test image and print the model's top predictions for it.

    Parameters
        :param model: Model to test; it is not moved here, so the caller must
            already have placed it on ``device``
        :param test_img_name: Test image as a tensor without batch dimension
            (despite the name, this is image data, not a file name)
        :param device: Device the image batch is moved to before inference

    Prints up to three (class name, score) pairs, fewer if the model has
    fewer than three output classes.  Class names come from the module-level
    ``idx_to_class`` mapping.
    """

    # Display a copy of the input; the model receives the original tensor.
    test_img = torch.tensor(np.asarray(test_img_name))
    test_img = transforms.ToPILImage()(test_img)
    plt.imshow(test_img)

    test_img_tensor = test_img_name.unsqueeze(0).to(device)

    with torch.no_grad():
        model.eval()
        # Model outputs is logits
        out = model(test_img_tensor)
        probs = torch.softmax(out, dim=1)
        # Never ask for more entries than there are classes.
        k = min(3, probs.size(1))
        topk, topclass = probs.topk(k, dim=1)
        scores = topk.cpu().numpy()[0]
        class_ids = topclass.cpu().numpy()[0]
        for i in range(k):
            print(
                "Predcition",
                i + 1,
                ":",
                idx_to_class[class_ids[i]],
                ", Score: ",
                round(scores[i], 2),
            )


print("Shoud be %s\n" % idx_to_class[0])
# Take the first test sample labelled 0; next() stops at the first match
# instead of loading the whole test set to build an index list.
predict(
    trained_model.to(device),
    next(sample[0] for sample in test_set if sample[1] == 0),
    device,
)

Shoud be AnnualCrop

Predcition 1 : AnnualCrop , Score:  1.0
Predcition 2 : PermanentCrop , Score:  0.0
Predcition 3 : SeaLake , Score:  0.0


print("Shoud be %s\n" % idx_to_class[6])
# Take the first test sample labelled 6; next() stops at the first match
# instead of loading the whole test set to build an index list.
predict(
    trained_model,
    next(sample[0] for sample in test_set if sample[1] == 6),
    device,
)

Shoud be PermanentCrop

Predcition 1 : PermanentCrop , Score:  0.58
Predcition 2 : AnnualCrop , Score:  0.42
Predcition 3 : SeaLake , Score:  0.0


print("Shoud be %s\n" % idx_to_class[8])
# Take the first test sample labelled 8; next() stops at the first match
# instead of loading the whole test set to build an index list.
predict(
    trained_model,
    next(sample[0] for sample in test_set if sample[1] == 8),
    device,
)

Shoud be River

Predcition 1 : River , Score:  1.0
Predcition 2 : Highway , Score:  0.0
Predcition 3 : AnnualCrop , Score:  0.0


from torchvision.models import alexnet
import torch

# Two random tensors stand in for real face images.
face1 = torch.randn((3, 224, 224))
face2 = torch.randn((3, 224, 224))

model = alexnet(weights="AlexNet_Weights.DEFAULT")
# remove classification layer: the last classifier module becomes a no-op,
# so the model returns the features that used to feed it
model.classifier[6] = torch.nn.Identity()
# Evaluation mode is required for repeatable embeddings: AlexNet's classifier
# contains Dropout layers, which are random while the model is in train mode.
model.eval()

# get embeddings (no gradients are needed for inference)
with torch.no_grad():
    embedding1 = model(face1.unsqueeze(0))
    embedding2 = model(face2.unsqueeze(0))

diff = torch.nn.functional.pairwise_distance(embedding1, embedding2)
print("L2 distance: ", diff.item())

Downloading: "https://download.pytorch.org/models/alexnet-owt-7be5be79.pth" to /root/.cache/torch/hub/checkpoints/alexnet-owt-7be5be79.pth
100%|██████████| 233M/233M [00:01<00:00, 186MB/s]

L2 distance:  30.66541862487793


from torch import nn

# Triplet margin loss on random tensors: three independent 100 x 128 draws
# play the roles of anchor, positive and negative.
triplet_loss = nn.TripletMarginLoss(margin=1.0, p=2)
embedding_shape = (100, 128)
anchor, positive, negative = (
    torch.randn(*embedding_shape, requires_grad=True) for _ in range(3)
)
loss = triplet_loss(anchor, positive, negative)
print(loss)

tensor(1.0878, grad_fn=<MeanBackward0>)


import torch.nn.functional as F

# Triplet loss with a user-supplied distance: cosine distance, i.e.
# 1 - cosine similarity, computed per pair of rows.
triplet_loss = nn.TripletMarginWithDistanceLoss(
    margin=1.0, distance_function=lambda x, y: 1.0 - F.cosine_similarity(x, y)
)
# Evaluated on the anchor / positive / negative tensors defined earlier.
loss = triplet_loss(anchor, positive, negative)
print(loss)

tensor(0.9909, grad_fn=<MeanBackward0>)


!wget -qN https://edunet.kea.su/repo/EduNet-web_dependencies/datasets/small_face_dataset.zip
!unzip -qn small_face_dataset.zip


import numpy as np
import random


def set_random_seed(seed):
    """Seed every random number generator this notebook relies on.

    Python's ``random``, NumPy and PyTorch (CPU and CUDA) are all seeded with
    ``seed``; cuDNN is switched to deterministic mode with benchmarking off.
    """
    # Plain-Python and NumPy generators.
    random.seed(seed)
    np.random.seed(seed)

    # PyTorch generators.
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)

    # cuDNN configuration flags.
    torch.backends.cudnn.benchmark = False
    torch.backends.cudnn.deterministic = True


# Fix all RNG seeds before the dataset and model are created.
set_random_seed(42)


from torch.utils.data import Dataset
from glob import glob
from PIL import Image


class SiameseNetworkDataset(Dataset):
    """Dataset of (anchor, positive, negative) image triplets.

    All ``*.pgm`` files found recursively below ``dir`` are indexed. The first
    path component below ``dir`` is used as the identity of a file. For the
    anchor at a given index, the positive is a different file of the same
    identity and the negative is a file of a different identity; both are
    drawn with the ``random`` module on every access.

    Args:
        dir: root directory of the images; works with or without a trailing
            separator.
        transform: optional callable applied to each of the three images.
        splitter: path separator used to cut the identity out of a file path.
    """

    def __init__(self, dir=None, transform=None, splitter="/"):
        self.dir = dir
        self.splitter = splitter
        self.transform = transform
        self.files = glob(f"{self.dir}/**/*.pgm", recursive=True)
        self.data = self.build_index()

    def build_index(self):
        """Return a dict mapping each identity to the list of its file paths."""
        index = {}
        for file_path in self.files:
            index.setdefault(self.path2id(file_path), []).append(file_path)
        return index

    def path2id(self, path):
        """Return the identity of ``path``: its first component below ``dir``."""
        # Drop the root only once, then drop any separator left in front.
        # Without the lstrip a root given without a trailing separator leaves
        # "/<id>/<file>" behind, whose first component is the empty string, so
        # every file would end up under the same (empty) identity.
        relative = path.replace(self.dir, "", 1).lstrip(self.splitter)
        return relative.split(self.splitter)[0]

    def __getitem__(self, index):
        """Return the (anchor, positive, negative) triplet for ``index``.

        The images are returned as opened by PIL when ``transform`` is None,
        otherwise as whatever ``transform`` returns for each of them.
        """
        anchor_path = self.files[index]
        positive_path = self.find_positive(anchor_path)
        negative_path = self.find_negative(anchor_path)

        # Loading the images
        anchor = Image.open(anchor_path)
        positive = Image.open(positive_path)
        negative = Image.open(negative_path)

        if self.transform is not None:  # Apply image transformations
            anchor = self.transform(anchor)
            positive = self.transform(positive)
            negative = self.transform(negative)

        return anchor, positive, negative

    def find_positive(self, path):
        """Pick a random file with the same identity as ``path``, excluding it.

        Raises:
            IndexError: if ``path`` is the only file of its identity.
        """
        candidates = self.data[self.path2id(path)].copy()
        candidates.remove(path)
        return random.choice(candidates)

    def find_negative(self, path):
        """Pick a random file whose identity differs from that of ``path``.

        Raises:
            IndexError: if the dataset contains a single identity only.
        """
        other_ids = list(self.data)
        other_ids.remove(self.path2id(path))
        # Two draws: first the identity, then one of its files.
        selected_id = random.choice(other_ids)
        return random.choice(self.data[selected_id])

    def __len__(self):
        """Return the number of indexed files (one triplet per anchor file)."""
        return len(self.files)


from torch.utils.data import DataLoader
import torchvision
import matplotlib.pyplot as plt
import torchvision.transforms as transforms

# Create a dataset instance for visualization: images are only resized to
# 105x105 and converted to tensors, no augmentation is applied.
siamese_dataset = SiameseNetworkDataset(
    "faces/training/",
    transform=transforms.Compose(
        [
            transforms.Resize((105, 105)),
            transforms.ToTensor(),
        ]
    ),
)

# Create a dataloader and pull a single shuffled batch of 8 triplets from it
vis_dataloader = DataLoader(siamese_dataset, batch_size=8, shuffle=True)
dataiter = iter(vis_dataloader)
example_batch = next(dataiter)  # anc, pos, neg

# Show batch contents: anchors, positives and negatives are stacked along the
# batch axis (in that order) and drawn as one image grid.
concatenated = torch.cat((example_batch[0], example_batch[1], example_batch[2]), 0)
grid = torchvision.utils.make_grid(concatenated)

plt.axis("off")
plt.imshow(grid.permute(1, 2, 0).numpy())  # channels-first -> channels-last for imshow
plt.gcf().set_size_inches(20, 60)
plt.show()


from torchvision.models import resnet18


class SiameseNet(nn.Module):
    """ResNet-18 based encoder producing unit-length embeddings.

    The same backbone (shared weights) embeds the anchor, the positive and the
    negative input of a triplet.

    Args:
        latent_dim: size of the embedding vector produced for every input.
    """

    def __init__(self, latent_dim):
        super().__init__()
        backbone = resnet18(weights=None)
        # The images are grayscale, so the stem convolution takes one input
        # channel instead of three.
        backbone.conv1 = nn.Conv2d(
            in_channels=1,
            out_channels=64,
            kernel_size=3,
            stride=2,
            padding=1,
            bias=False,
        )
        # Swap the stock classification head for a linear projection onto
        # `latent_dim` outputs.
        backbone.fc = nn.Linear(backbone.fc.in_features, latent_dim)
        self.model = backbone

    def _forward(self, x):
        """Embed one batch and scale every embedding to unit length."""
        return torch.nn.functional.normalize(self.model(x))

    def forward(self, anchor, positive, negative):
        """Return the embeddings of anchor, positive and negative as a tuple."""
        return tuple(
            self._forward(branch) for branch in (anchor, positive, negative)
        )


# Training transform: resize to 105x105, random horizontal flip as
# augmentation, then convert to a tensor.
img_trans_train = transforms.Compose(
    [
        transforms.Resize((105, 105)),
        transforms.RandomHorizontalFlip(),
        transforms.ToTensor(),
    ]
)

# Test transform: the same resize and tensor conversion, without augmentation.
img_trans_test = transforms.Compose(
    [transforms.Resize((105, 105)), transforms.ToTensor()]
)

train_dataset = SiameseNetworkDataset("faces/training/", transform=img_trans_train)
val_dataset = SiameseNetworkDataset("faces/testing/", transform=img_trans_test)

batch_size = 300
train_loader = DataLoader(
    train_dataset, num_workers=2, batch_size=batch_size, shuffle=True
)
# One triplet per batch and a fixed order for validation.
val_loader = DataLoader(val_dataset, num_workers=2, batch_size=1, shuffle=False)


def train(num_epochs, model, criterion, optimizer, train_loader):
    """Train a triplet model and record the mean loss of every epoch.

    Args:
        num_epochs: number of passes over ``train_loader``.
        model: module called as ``model(anchor, positive, negative)`` that
            returns the three corresponding outputs.
        criterion: loss called as ``criterion(out_anc, out_pos, out_neg)``.
        optimizer: optimizer that updates the parameters of ``model``.
        train_loader: sized iterable of ``(anchor, positive, negative)``
            tensor batches.

    Returns:
        ``(loss_history, last_epoch_loss)``: the list of per-epoch mean losses
        (floats) and the last of them as a 0-dim tensor, or ``None`` when
        ``num_epochs`` is 0.

    Raises:
        ZeroDivisionError: if ``len(train_loader)`` is 0.
    """
    # Send the batches to wherever the model lives instead of relying on a
    # module-level `device` variable being defined before this is called.
    first_param = next(model.parameters(), None)
    if first_param is None:
        target_device = torch.device("cpu")
    else:
        target_device = first_param.device

    loss_history = []
    last_epoch_loss = None  # remains None if the epoch loop never runs
    model.train()
    for epoch in range(num_epochs):
        train_loss = 0.0
        for anc, pos, neg in train_loader:
            # Clear gradients first so leftovers from earlier backward passes
            # on the same model can never leak into this step.
            optimizer.zero_grad()
            output_anc, output_pos, output_neg = model(
                anc.to(target_device),
                pos.to(target_device),
                neg.to(target_device),
            )
            loss = criterion(output_anc, output_pos, output_neg)
            loss.backward()
            optimizer.step()
            train_loss += loss.item()

        # Mean of the per-batch losses of this epoch.
        loss_history.append(train_loss / len(train_loader))
        last_epoch_loss = torch.tensor(loss_history[-1])
        print("Epoch {} with {:.4f} loss".format(epoch, last_epoch_loss))

    return loss_history, last_epoch_loss


import torch.optim as optim

# Use the first GPU when available, otherwise fall back to the CPU.
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
latent_dim = 32  # embedding size for the baseline run
model = SiameseNet(latent_dim).to(device)
# Triplet loss on cosine distance (1 - cosine similarity) with margin 1.0.
criterion = nn.TripletMarginWithDistanceLoss(
    margin=1.0, distance_function=lambda x, y: 1.0 - F.cosine_similarity(x, y)
)

optimizer = optim.Adam(model.parameters(), lr=0.001)
num_epochs = 9
# Keep the per-epoch losses; the second return value is not needed here.
loss_history, _ = train(num_epochs, model, criterion, optimizer, train_loader)

Epoch 0 with 0.8090 loss
Epoch 1 with 0.4584 loss
Epoch 2 with 0.4083 loss
Epoch 3 with 0.3571 loss
Epoch 4 with 0.3335 loss
Epoch 5 with 0.3602 loss
Epoch 6 with 0.3168 loss
Epoch 7 with 0.2326 loss
Epoch 8 with 0.2895 loss


# Plot the per-epoch training loss; the x axis counts epochs starting at 1.
plt.plot(range(1, len(loss_history) + 1), loss_history)
plt.ylabel("loss")
plt.xlabel("num of epochs")
plt.grid()
plt.show()


# Visualization helper
def show(img, text=None):
    """Draw a channels-first image tensor with an optional bold caption.

    Args:
        img: tensor laid out as [C x H x W].
        text: caption drawn at position (75, 120) of the plot.
    """
    # imshow wants channels last: [C x H x W] -> [H x W x C]
    pixels = np.transpose(img.numpy(), (1, 2, 0))
    plt.axis("off")
    plt.text(75, 120, text, fontweight="bold")
    plt.imshow(pixels)
    plt.show()


def plot_imgs(model, test_loader):
    """Compute anchor/positive and anchor/negative similarities per triplet.

    The model is put in evaluation mode and run under ``torch.inference_mode``.
    Every fifth triplet (indices 0, 5, 10, ...) is displayed together with
    both similarities and an OK/BAD verdict.

    Args:
        model: module called as ``model(anchor, positive, negative)``.
        test_loader: iterable of ``(anchor, positive, negative)`` batches.
            Each batch must hold a single triplet, because the similarities
            are converted to Python scalars with ``.item()``.

    Returns:
        ``(similarity_pos, similarity_neg)``: two lists of floats with one
        entry per batch.
    """
    similarity_pos, similarity_neg = [], []
    model.eval()
    with torch.inference_mode():
        for step, (anc, pos, neg) in enumerate(test_loader):
            emb_anc, emb_pos, emb_neg = model(
                anc.to(device), pos.to(device), neg.to(device)
            )
            # Cosine similarity of the anchor embedding to each partner.
            sim_pos = F.cosine_similarity(emb_anc, emb_pos).item()
            sim_neg = F.cosine_similarity(emb_anc, emb_neg).item()
            similarity_pos.append(sim_pos)
            similarity_neg.append(sim_neg)

            # Only every fifth triplet is drawn.
            if step % 5 != 0:
                continue

            # A triplet counts as OK when the positive is the more similar one.
            if sim_neg < sim_pos:
                result = "OK"
            else:
                result = "BAD"
            triplet_grid = torchvision.utils.make_grid(torch.cat((anc, pos, neg)))
            caption = f"Positive / negative similarities: {sim_pos:.3f} / {sim_neg:.3f} - {result}"
            show(triplet_grid, caption)

    return similarity_pos, similarity_neg


# Re-seed before evaluation (presumably so that the randomly drawn
# positive/negative partners are the same for every evaluated model),
# then collect the similarities of the baseline model.
set_random_seed(42)
similarity_pos, similarity_neg = plot_imgs(model, val_loader)


import seaborn as sns

# Histogram of both similarity groups; the dict keys are passed to seaborn
# together with the values of each group.
similarities = {"The same person": similarity_pos, "Another person": similarity_neg}

ax = sns.histplot(similarities, bins=20)
ax.set(xlabel="Pairwise similarity")
plt.show()


!pip install --quiet optuna

     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 390.6/390.6 kB 13.5 MB/s eta 0:00:00
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 224.5/224.5 kB 22.8 MB/s eta 0:00:00
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 78.7/78.7 kB 11.5 MB/s eta 0:00:00


import optuna
from optuna.samplers import RandomSampler


# Objective function that Optuna will minimize
def objective(trial):
    """Train a fresh model with trial-suggested hyperparameters.

    Args:
        trial: Optuna trial used to draw ``lr`` and ``latent_dim``.

    Returns:
        The mean training loss of the last epoch as a Python float.
    """
    # Search ranges for the two tuned hyperparameters
    lr = trial.suggest_float("lr", 1e-4, 1e-2)
    latent_dim = trial.suggest_int("latent_dim", 8, 64, step=8)

    # A new model (and therefore new weights) is created for every trial
    model = SiameseNet(latent_dim).to(device)  # latent_dim is chosen by Optuna
    criterion = nn.TripletMarginWithDistanceLoss(
        margin=1.0, distance_function=lambda x, y: 1.0 - F.cosine_similarity(x, y)
    )

    optimizer = optim.Adam(
        model.parameters(), lr=lr
    )  # learning rate is chosen by Optuna

    # To save time, every trial trains for 3 epochs only
    train_loader = DataLoader(
        train_dataset, num_workers=2, batch_size=batch_size, shuffle=True
    )
    _, last_epoch_loss = train(3, model, criterion, optimizer, train_loader)
    # `train` hands the loss back as a 0-dim tensor; give Optuna the plain
    # float an objective is expected to return.
    return float(last_epoch_loss)


# Create the study: minimize the objective, drawing hyperparameters with a
# random sampler constructed with seed 42.
study = optuna.create_study(
    direction="minimize", study_name="Optimizer", sampler=RandomSampler(42)
)

study.optimize(
    objective, n_trials=10
)  # The more trials, the higher the chance of finding good hyperparameters

[I 2023-07-18 20:44:47,744] A new study created in memory with name: Optimizer

Epoch 0 with 0.8298 loss
Epoch 1 with 0.5833 loss

[I 2023-07-18 20:44:53,687] Trial 0 finished with value: 0.5804647207260132 and parameters: {'lr': 0.003807947176588889, 'latent_dim': 64}. Best is trial 0 with value: 0.5804647207260132.

Epoch 2 with 0.5805 loss
Epoch 0 with 0.8369 loss
Epoch 1 with 0.6785 loss

[I 2023-07-18 20:45:00,230] Trial 1 finished with value: 0.7354487180709839 and parameters: {'lr': 0.007346740023932911, 'latent_dim': 40}. Best is trial 0 with value: 0.5804647207260132.

Epoch 2 with 0.7354 loss
Epoch 0 with 0.8462 loss
Epoch 1 with 0.4905 loss

[I 2023-07-18 20:45:06,189] Trial 2 finished with value: 0.36206525564193726 and parameters: {'lr': 0.0016445845403801217, 'latent_dim': 16}. Best is trial 2 with value: 0.36206525564193726.

Epoch 2 with 0.3621 loss
Epoch 0 with 0.7979 loss
Epoch 1 with 0.5225 loss

[I 2023-07-18 20:45:12,623] Trial 3 finished with value: 0.3257625102996826 and parameters: {'lr': 0.0006750277604651748, 'latent_dim': 56}. Best is trial 3 with value: 0.3257625102996826.

Epoch 2 with 0.3258 loss
Epoch 0 with 0.8698 loss
Epoch 1 with 0.6307 loss


# Show the hyperparameters of the best trial found by the study
study.best_params

{'lr': 0.0006750277604651748, 'latent_dim': 56}


# Plot the optimization history of the study
optuna.visualization.plot_optimization_history(study)


# Re-seed, then train a fresh model with the hyperparameters Optuna selected.
set_random_seed(42)

model = SiameseNet(study.best_params["latent_dim"]).to(
    device
)  # latent_dim chosen by Optuna
criterion = nn.TripletMarginWithDistanceLoss(
    margin=1.0, distance_function=lambda x, y: 1.0 - F.cosine_similarity(x, y)
)
optimizer = optim.Adam(
    model.parameters(), lr=study.best_params["lr"]
)  # lr chosen by Optuna

num_epochs = 9  # same number of epochs as the run without optimization
train_loader = DataLoader(
    train_dataset, num_workers=2, batch_size=batch_size, shuffle=True
)
# Per-epoch losses of the tuned run, kept under a separate name for comparison.
l_optim, _ = train(num_epochs, model, criterion, optimizer, train_loader)

Epoch 0 with 0.7609 loss
Epoch 1 with 0.5261 loss
Epoch 2 with 0.4040 loss
Epoch 3 with 0.3303 loss
Epoch 4 with 0.3403 loss
Epoch 5 with 0.3373 loss
Epoch 6 with 0.2967 loss
Epoch 7 with 0.2273 loss
Epoch 8 with 0.2934 loss


# Compare the loss curves of the baseline run and the run with tuned
# hyperparameters; the x axis counts epochs starting at 1.
plt.plot(range(1, len(loss_history) + 1), loss_history, label="no optimization")
plt.plot(range(1, len(l_optim) + 1), l_optim, label="optimal params")
plt.ylabel("loss")
plt.xlabel("num of epochs")
plt.grid()
plt.legend()
plt.show()


# Re-seed with the same value as for the baseline evaluation, then collect
# the similarities of the tuned model. This overwrites `similarity_pos` and
# `similarity_neg`.
set_random_seed(42)
similarity_pos, similarity_neg = plot_imgs(model, val_loader)


# Similarities of the tuned model, grouped the same way as `similarities`.
similarities_optim = {
    "The same person": similarity_pos,
    "Another person": similarity_neg,
}

# Side-by-side histograms: baseline on the left, tuned model on the right.
fig, axes = plt.subplots(1, 2, figsize=(15, 5))

sns.histplot(similarities, bins=20, alpha=0.5, ax=axes[0])
sns.histplot(similarities_optim, bins=20, alpha=0.5, ax=axes[1])

axes[0].set(title="No optimization")
axes[1].set(title="Optimization with Optuna")
axes[0].set(xlabel="Pairwise similarity")
axes[1].set(xlabel="Pairwise similarity")

plt.show()

Проблемы при работе с реальной задачей машинного обучения¶

Общие подходы при работе с реальными данными¶

Нехватка данных¶

Дисбаланс классов¶

Изменение баланса класса сэмплированием¶

Дублирование примеров меньшего класса (oversampling)¶

Уменьшение числа примеров большего класса (undersampling)¶

Ансамбли + undersampling¶

Балансирование представленности объектов в батчах¶

Генерация синтетических данных¶

SMOTE¶

Изменение функции потерь¶

Веса классов¶

Focal Loss¶

Обнаружение аномалий¶

Метрики качества на несбалансированных данных¶

Аугментация¶

Изображения¶

Random Rotation¶

Gaussian Blur¶

Random Erasing¶

ColorJitter¶

Совмещаем несколько аугментаций вместе¶

Совмещение нескольких аугментаций случайным образом¶

Random Apply¶

Random Choice¶

Пример создания собственной аугментации¶

Аугментация внутри Dataset¶

Нестандартные способы аугментации¶

Mixup¶

Аугментация при помощи генерации данных¶

Аугментация в реальных задачах¶

Аудио¶

Background Noise¶

Time Stretch¶

Pitch Shift¶

Совмещаем несколько аугментаций вместе¶

Текст¶

Аугментация символов¶

Аугментация слов¶

Аугментация предложений¶

Transfer learning¶

Порядок действий при transfer learning¶

Практический пример transfer learning¶

Обучение готовой архитектуры "с нуля"¶

Обучение готовой архитектуры с предобученными весами¶

Обучение классификационной "головы"¶

Дообучение всех слоев (Fine-tuning)¶

Metric learning¶

Формирование векторов-признаков (embedding)¶

Сиамская сеть (Siamese Network)¶

Triplet Loss¶

Реализация сиамской сети¶

Загрузка данных¶

Dataset for TripletLoss¶

Создание модели¶

Dataloaders¶

Обучение¶

Проверка¶

Оптимизация гиперпараметров¶

Аугментация внутри `Dataset`¶