DFC15 dataset: Example of the aitlas toolbox for multi label image classification#

This notebook shows a sample implementation of a multi label image classification using the aitlas toolbox using the DFC15 merced multi label dataset.

[ ]:
from aitlas.datasets import DFC15MultiLabelDataset
from aitlas.models import ResNet50MultiLabel
from aitlas.transforms import ResizeCenterCropFlipHVToTensor, ResizeCenterCropToTensor
from aitlas.utils import image_loader

Load the dataset#

[ ]:
dataset_config = {
    "data_dir": "./data/DFC15/images",
    "csv_file": "./data/DFC15/multilabels.txt"
}
dataset = DFC15MultiLabelDataset(dataset_config)

Show images from the dataset#

[ ]:
fig1 = dataset.show_image(1000)
fig2 = dataset.show_image(30)
fig3 = dataset.show_batch(15)

Inspect the data#

[ ]:
dataset.show_samples()
[ ]:
dataset.data_distribution_table()
[ ]:
fig = dataset.data_distribution_barchart()

Load train and test splits#

[ ]:
train_dataset_config = {
    "batch_size": 16,
    "shuffle": True,
    "num_workers": 4,
    "data_dir": "./data/DFC15/images",
    "csv_file": "./data/DFC15/train.csv"
}

train_dataset = DFC15MultiLabelDataset(train_dataset_config)
train_dataset.transform = ResizeCenterCropFlipHVToTensor()

test_dataset_config = {
    "batch_size": 4,
    "shuffle": False,
    "num_workers": 4,
    "data_dir": "./data/DFC15/images",
    "csv_file": "./data/DFC15/test.csv",
    "transforms": ["aitlas.transforms.ResizeCenterCropToTensor"]
}

test_dataset = DFC15MultiLabelDataset(test_dataset_config)
len(train_dataset), len(test_dataset)

Setup and create the model for training#

[ ]:
epochs = 10
model_directory = "./experiments/DFC15"
model_config = {
    "num_classes": 8,
    "learning_rate": 0.0001,
    "pretrained": True,
    "threshold": 0.5,
    "metrics": ["accuracy", "precision", "recall", "f1_score"]
}
model = ResNet50MultiLabel(model_config)
model.prepare()

Training and evaluation#

[ ]:
model.train_and_evaluate_model(
    train_dataset=train_dataset,
    epochs=epochs,
    model_directory=model_directory,
    val_dataset=test_dataset,
    run_id='1',
)

Predictions#

[ ]:
model_path = "./experiments/DFC15/checkpoint.pth.tar"
#labels = DFC15MultiLabelDataset.labels
labels = ["impervious", "water", "clutter", "vegetation", "building", "tree", "boat", "car"]
transform = ResizeCenterCropToTensor()
model.load_model(model_path)

image = image_loader('./data/predict/image1.tif')
fig = model.predict_image(image, labels, transform)

image = image_loader('./data/predict/image2.tif')
fig = model.predict_image(image, labels, transform)

image = image_loader('./data/predict/image3.tif')
fig = model.predict_image(image, labels, transform)

image = image_loader('./data/predict/image4.tif')
fig = model.predict_image(image, labels, transform)