Plugin example: Image Classification Package

Package available:

image-classification-package

Folder tree of the package:

image_classification_package
│   LICENSE
│   pyproject.toml
│   README.md
└───src
    └───image_classification_package
            BasicFinetunnedModels.json
            basic_finetunned_models.py
            ImageDataLoader.json
            image_classification_model.py
            image_classification_task.py
            image_dataloader.json
            image_dataloader.py
            __init__.py
LICENSE
Copyright (c) 2018 The Python Packaging Authority

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
pyproject.toml
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"

[project]
name = "image_classification_package"
version = "0.0.2"
dependencies = [
    'torchvision == 0.14.0',
    'dashai',
]

authors = [
    { name="dashai", email="dashaisoftware@gmail.com" },
]

description = "This package includes all the necessary components to classify images using a pre-trained models."
readme = "README.md"
requires-python = ">=3.8"

classifiers = [
    "Programming Language :: Python :: 3",
    "License :: OSI Approved :: MIT License",
    "Operating System :: OS Independent",
]

keywords = [
    "image classification",
    "pytorch",
    "torchvision",
    "dashai",
    "package"
]

[project.entry-points.'dashai.plugins']
image_task = 'image_classification_package.image_classification_task:ImageClassificationTask'
image_dataloader = 'image_classification_package.image_dataloader:ImageDataLoader'
image_model = 'image_classification_package.image_classification_model:ImageClassificationModel'
basic_finetunned_models = 'image_classification_package.basic_finetunned_models:BasicFinetunnedModels'

[project.urls]
Homepage = "https://github.com/DashAISoftware/DashAI"
Issues = "https://github.com/DashAISoftware/DashAI/issues"
README.md
# **Image Classification Package**

This package includes all the necessary components (Task, Models, Dataloader) to perform image classification tasks.

## **Task**

**ImageClassificationTask**

The task of this package is image classification: assigning each image to one of a set of classes. It is defined in the `image_classification_task.py` file as the class `ImageClassificationTask`, which inherits from `BaseTask`.

## **Dataloader**

**ImageDataLoader**

This module is a dataloader for images. It is defined in the `image_dataloader.py` file as the class `ImageDataLoader`, which inherits from `BaseDataLoader` and uses the `load_dataset` method from the `datasets` library to load the dataset.

## **Models**

**BasicFinetunnedModels**

This module is an image classification model that takes pre-trained models from `torchvision.models` and fine-tunes them on the given dataset. It is defined in the `basic_finetunned_models.py` file as the class `BasicFinetunnedModels`, which inherits from `ImageClassificationModel`.

The pretrained models available are:

- resnet18
- resnet34
- resnext50_32x4d
- vgg16
- maxvit_t
- densenet121
- efficientnet_b0
- googlenet
- mnasnet0_5
- mobilenet_v2
- regnet_x_16gf
src/image_classification_package
BasicFinetunnedModels.json

JSON file with the BasicFinetunnedModels model parameters:

{
    "additionalProperties": false,
    "error_msg": "BasicFinetunnedModel parameters must be one(s) of ['pretrained_model', 'epochs', 'batch size', 'weight decay', 'learning_rate', 'device'].",
    "description": "BasicFinetunnedModel use pre-trained models to classify images.",
    "properties": {
    "pretrained_model": {
        "oneOf": [
        {
            "error_msg": "The 'pretrained_model' parameter should be one of 'vgg16', 'resnet18', 'resnet34', 'resnext50_32x4d', 'maxvit_t', 'densenet121', 'efficientnet_b0', 'googlenet', 'mnasnet0_5', 'mobilenet_v2', 'regnet_x_16gf'.",
            "description": "The name of the pre-trained model to use. You can find the list of available models at https://pytorch.org/vision/stable/models.html in the Classification section. The default model is 'resnet18'.",
            "type": "string",
            "default": "resnet18",
            "enum": [
            "resnet18",
            "resnet34",
            "resnext50_32x4d",
            "vgg16",
            "maxvit_t",
            "densenet121",
            "efficientnet_b0",
            "googlenet",
            "mnasnet0_5",
            "mobilenet_v2",
            "regnet_x_16gf"
            ]
        }
        ]
    },
    "batch_size": {
        "oneOf": [
        {
            "error_msg": "A whole number greater than or equal to 1 must be entered.",
            "description": "The batch size per GPU/TPU core/CPU for training",
            "type": "integer",
            "minimum": 1,
            "default": 8
        }
        ]
    },
    "shuffle": {
        "oneOf": [
        {
            "error_msg": "Need to select 'true' if you have folders that define the splits, otherwise 'false'.",
            "description": "If you want to shuffle the splits select 'true', otherwise 'false'.",
            "type": "boolean",
            "default": true
        }
        ]
    },
    "learning_rate": {
        "oneOf": [
        {
            "error_msg": "Must be a positive number. A number between 10e-6 and 1 is recommended.",
            "description": "The initial learning rate for AdamW optimizer",
            "type": "number",
            "minimum": 0,
            "default": 1e-3
        }
        ]
    },
    "epochs": {
        "oneOf": [
        {
            "error_msg": "A whole number greater than or equal to 1 must be entered.",
            "description": "Total number of training epochs to perform.",
            "type": "integer",
            "minimum": 1,
            "default": 5
        }
        ]
    },
    "momentum": {
        "oneOf": [
        {
            "error_msg": "A number between 0 and 1 must be entered.",
            "description": "Weight decay is a regularization technique used in training neural networks to prevent overfitting. In the context of the AdamW optimizer, the 'weight_decay' parameter is the rate at which the weights of all layers are reduced during training, provided that this rate is not zero.",
            "type": "number",
            "minimum": 0,
            "default": 0
        }
        ]
    },
    "weight_decay": {
        "oneOf": [
        {
            "error_msg": "A number between 0 and 1 must be entered.",
            "description": "Weight decay is a regularization technique used in training neural networks to prevent overfitting. In the context of the AdamW optimizer, the 'weight_decay' parameter is the rate at which the weights of all layers are reduced during training, provided that this rate is not zero.",
            "type": "number",
            "minimum": 0,
            "default": 0
        }
        ]
    },
    "step_size": {
        "oneOf": [
        {
            "error_msg": "A number between 0 and 1 must be entered.",
            "description": "Weight decay is a regularization technique used in training neural networks to prevent overfitting. In the context of the AdamW optimizer, the 'weight_decay' parameter is the rate at which the weights of all layers are reduced during training, provided that this rate is not zero.",
            "type": "integer",
            "minimum": 0,
            "default": 6
        }
        ]
    },
    "gamma": {
        "oneOf": [
        {
            "error_msg": "A number between 0 and 1 must be entered.",
            "description": "Weight decay is a regularization technique used in training neural networks to prevent overfitting. In the context of the AdamW optimizer, the 'weight_decay' parameter is the rate at which the weights of all layers are reduced during training, provided that this rate is not zero.",
            "type": "number",
            "minimum": 0,
            "default": 0.1
        }
        ]
    }
    },
    "type": "object"
}
basic_finetunned_models.py

Python file of BasicFinetunnedModels class.

"""DashAI implementation of DistilBERT model for image classification."""

import json
import os
from typing import Any, Dict

import datasets
import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import DataLoader
from torchvision import models, transforms

from .image_classification_model import ImageClassificationModel

def fit(
    model: torch.nn.Module,
    train_loader: DataLoader,
    criterion: torch.nn.Module,
    optimizer: torch.optim.Optimizer,
    scheduler: torch.optim.lr_scheduler.StepLR,
    device: torch.device,
    num_epochs: int,
    dataset_len: int,
):
    for epoch in range(num_epochs):
        print("Epoch {}/{}".format(epoch, num_epochs - 1))
        print("-" * 10)

        # Train model
        model.train()

        running_loss = 0.0
        running_corrects = 0.0

        for inputs, labels in train_loader:
            inputs, labels = inputs.to(device), labels.to(device)

            optimizer.zero_grad()

            outputs = model(inputs)
            _, preds = torch.max(outputs, 1)
            loss: torch.Tensor = criterion(outputs, labels)

            loss.backward()
            optimizer.step()

            running_loss += loss.item() * inputs.size(0)
            running_corrects += torch.sum(preds == labels.data)

        # Step the LR scheduler once per epoch, after the optimizer updates
        scheduler.step()

        epoch_loss = running_loss / dataset_len
        epoch_acc = running_corrects.double() / dataset_len

        print("Train Loss: {:.4f} Acc: {:.4f}".format(epoch_loss, epoch_acc))
    return model

def predict(
    model: torch.nn.Module,
    test_dataloader: DataLoader,
    device: torch.device,
    criterion: torch.nn.Module,
    test_dataset_len: int,
):
    model.eval()
    running_loss = 0.0
    running_corrects = 0.0
    preds_without_processing = []

    for inputs, labels in test_dataloader:
        inputs = inputs.to(device)
        labels = labels.to(device)

        with torch.set_grad_enabled(False):
            outputs: torch.Tensor = model(inputs)
            preds_without_processing += outputs.tolist()
            _, preds = torch.max(outputs, 1)
            loss = criterion(outputs, labels)

        running_loss += loss.item() * inputs.size(0)
        running_corrects += torch.sum(preds == labels.data)

    epoch_loss = running_loss / test_dataset_len
    epoch_acc = running_corrects.double() / test_dataset_len

    print("Val Loss: {:.4f} Acc: {:.4f}".format(epoch_loss, epoch_acc))
    return preds_without_processing

class BasicFinetunnedModels(ImageClassificationModel):
    class ImagePytorchDataset(torch.utils.data.Dataset):
        def __init__(self, dataset: datasets.Dataset):
            self.dataset = dataset
            self.transform = transforms.Compose(
                [
                    transforms.Resize(256),
                    transforms.CenterCrop(224),
                    transforms.ToTensor(),
                    transforms.Normalize(
                        mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]
                    ),
                ]
            )

            column_names = list(self.dataset.features.keys())
            self.image_col_name = column_names[0]
            self.label_col_name = column_names[1]

        def __len__(self):
            return len(self.dataset)

        def __getitem__(self, idx):
            image = self.dataset[idx][self.image_col_name]
            image = self.transform(image)
            label = self.dataset[idx][self.label_col_name]
            return image, label

    def __init__(
        self,
        pretrained_model: str,
        batch_size: int = 8,
        shuffle: bool = True,
        learning_rate: float = 0.001,
        epochs: int = 5,
        momentum: float = 0.9,
        weight_decay: float = 1e-4,
        step_size: int = 6,
        gamma: float = 0.1,
    ) -> None:
        self.model_name = pretrained_model
        self.learning_rate = learning_rate
        self.momentum = momentum
        self.weight_decay = weight_decay
        self.step_size = step_size
        self.gamma = gamma
        self.batch_size = batch_size
        self.shuffle = shuffle
        self.epochs = epochs

        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

        self.model = models.get_model(self.model_name, weights="DEFAULT")

        print(self.model._modules.keys())
        self.last_key = list(self.model._modules.keys())[-1]

        self.criterion: nn.CrossEntropyLoss = nn.CrossEntropyLoss()

    def determine_num_classes(self, dataset: datasets.Dataset):
        label_col_name = list(dataset.features.keys())[-1]
        label_values = dataset[label_col_name]
        return len(list(set(label_values)))

    def fit(self, dataset: datasets.Dataset):
        # 1. Determine the num of classes
        num_classes = self.determine_num_classes(dataset)

        # 2. Change the last layer of the model to have the correct number of classes
        try:
            in_features = self.model._modules[self.last_key][-1].in_features
            self.model._modules[self.last_key][-1] = nn.Linear(
                in_features, num_classes, bias=True
            )
        except TypeError:
            in_features = self.model._modules[self.last_key].in_features
            self.model._modules[self.last_key] = nn.Linear(
                in_features, num_classes, bias=True
            )
        self.model = self.model.to(self.device)

        # 3. Create the optimizer and scheduler
        optimizer: optim.SGD = optim.SGD(
            self.model.parameters(),
            lr=self.learning_rate,
            momentum=self.momentum,
            weight_decay=self.weight_decay,
        )
        scheduler: optim.lr_scheduler.StepLR = optim.lr_scheduler.StepLR(
            optimizer, step_size=self.step_size, gamma=self.gamma
        )

        # 4. Create the dataloader
        img_dataset = self.ImagePytorchDataset(dataset)
        self.train_dataloader = DataLoader(
            img_dataset, batch_size=self.batch_size, shuffle=self.shuffle
        )

        # 5. Train the model
        self.model = fit(
            self.model,
            self.train_dataloader,
            self.criterion,
            optimizer,
            scheduler,
            self.device,
            self.epochs,
            len(dataset),
        )

    def predict(self, dataset: datasets.Dataset):
        """
        Realiza predicciones sobre un conjunto de datos.

        Args:
            dataset: Dataset con las imágenes a predecir.

        Returns:
            Lista con las predicciones de la clase para cada imagen.
        """

        img_dataset = self.ImagePytorchDataset(dataset)
        dataloader = DataLoader(img_dataset, batch_size=self.batch_size, shuffle=False)
        preds = predict(
            self.model, dataloader, self.device, self.criterion, len(dataset)
        )
        return preds

    def save(self, filename: str):
        torch.save(self.model.state_dict(), filename)

    def load(self, filename: str):
        self.model.load_state_dict(torch.load(filename))

    @classmethod
    def get_schema(cls) -> Dict[str, Any]:
        # path is the directory that contains this file
        path = os.path.dirname(os.path.realpath(__file__))
        with open(os.path.join(path, f"{cls.__name__}.json")) as f:
            return json.load(f)
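As a rough usage sketch (paths are placeholders; it assumes an "imagefolder"-style dataset whose first column is the image and whose second column is the label, which is the layout `ImagePytorchDataset` expects):

from datasets import load_dataset
from image_classification_package.basic_finetunned_models import BasicFinetunnedModels

# Hypothetical local folder with one sub-folder per class.
dataset = load_dataset("imagefolder", data_dir="path/to/train")["train"]

model = BasicFinetunnedModels(pretrained_model="resnet18", epochs=1, batch_size=8)
model.fit(dataset)                     # replaces the last layer and fine-tunes the model
predictions = model.predict(dataset)   # raw per-class scores for each image
model.save("resnet18_finetunned.pt")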
ImageDataLoader.json

JSON file of the ImageDataLoader:

{
    "class": "ImageDataLoader",
    "name": "Image Data",
    "help": "Use Image files to upload the data.",
    "description": "You can upload your images in a .zip file. The images labels should be the name of the folder where the images are located.\nThe zip should contain a folder named 'train' and inside it, the folders with the images.",
    "images": [],
    "type": "object"
}
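For reference, a zip that matches this description could be laid out as follows (class and file names are purely illustrative):

dataset.zip
└───train
    └───cats
    │       cat_001.jpg
    │       cat_002.jpg
    └───dogs
            dog_001.jpg
            dog_002.jpg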
image_classification_model.py
from DashAI.back.models.base_model import BaseModel

class ImageClassificationModel(BaseModel):
    """Class for models associated to ImageClassificationTask."""

    COMPATIBLE_COMPONENTS = ["ImageClassificationTask"]
image_classification_task.py
from datasets import ClassLabel, DatasetDict, Image

from DashAI.back.tasks.base_task import BaseTask

class ImageClassificationTask(BaseTask):
    """Base class for image classification tasks.

    Here you can change the methods provided by class Task.
    """

    schema: dict = {
        "inputs_types": [Image],
        "outputs_types": [ClassLabel],
        "inputs_cardinality": 1,
        "outputs_cardinality": 1,
    }

    def prepare_for_task(self, datasetdict: DatasetDict):
        """Change the column types to suit the tabular classification task.

        A copy of the dataset is created.

        Parameters
        ----------
        datasetdict : DatasetDict
            Dataset to be changed

        Returns
        -------
        DatasetDict
            Dataset with the new types
        """
        outputs_columns = datasetdict["train"].outputs_columns
        types = {outputs_columns[0]: "Categorical"}
        for split in datasetdict:
            datasetdict[split] = datasetdict[split].change_columns_type(types)
        return datasetdict
image_dataloader.json
{
    "additionalProperties": true,
    "error_msg": "You must specify the data configuration parameters.",
    "description": "Upload a .csv file with your dataset or a .zip file with CSV files to be uploaded.",
    "display": "modal",
    "properties": {
    "name": {
        "oneOf": [
        {
            "error_msg": "",
            "description": "Custom name to register your dataset. If no name is specified, the name of the uploaded file will be used.",
            "type": ["text", "null"],
            "default": ""
        }
        ]
    }
    },
    "splits": {
    "display": "div",
    "properties": {
        "train_size": {
        "oneOf": [
            {
            "error_msg": "The size of the training set must be between 0 and 1.",
            "description": "The training set contains the data to be used for training a model. Must be defined between 0 and 100% of the data.",
            "type": "number",
            "default": 0.7,
            "minimum": 0,
            "maximum": 1
            }
        ]
        },
        "test_size": {
        "oneOf": [
            {
            "error_msg": "The test set size must be between 0 and 1.",
            "description": "The test set contains the data that will be used to evaluate a model. Must be defined between 0 and 100% of the data.",
            "type": "number",
            "default": 0.2,
            "minimum": 0,
            "maximum": 1
            }
        ]
        },
        "val_size": {
        "oneOf": [
            {
            "error_msg": "The validation set size must be between 0 and 1.",
            "description": "The validation set contains the data to be used to validate a model. Must be defined between 0 and 100% of the data.",
            "type": "number",
            "default": 0.1,
            "minimum": 0,
            "maximum": 1
            }
        ]
        }
    },
    "more_options": {
        "display": "modal",
        "properties": {
        "shuffle": {
            "oneOf": [
            {
                "error_msg": "Must be true or false, choose if you want to shuffle the data when separating the sets.",
                "description": "Determines whether the data will be shuffle when defining the sets or not. It must be true for shuffle the data, otherwise false.",
                "type": "boolean",
                "default": true
            }
            ]
        },
        "seed": {
            "oneOf": [
            {
                "error_msg": "Must be an integer greater than or equal to 0.",
                "description": "A seed defines a value with which the same mixture of data will always be obtained. It must be an integer greater than or equal to 0.",
                "type": "integer",
                "default": 0,
                "minimum": 0
            }
            ]
        },
        "stratify": {
            "oneOf": [
            {
                "error_msg": "Must be true or false, choose if you want to separate the data into sets with the same proportion of samples per class as the original set or not.",
                "description": "Defines whether the data will be proportionally separated according to the distribution of classes in each set.",
                "type": "boolean",
                "default": false
            }
            ]
        }
        },
        "type": "object"
    },
    "type": "object"
    },
    "type": "object"
}
image_dataloader.py
"""DashAI Image Dataloader."""

import json
import logging
import os
from typing import Any, Dict, Union

from beartype import beartype
from datasets import DatasetDict, load_dataset
from starlette.datastructures import UploadFile

from DashAI.back.dataloaders.classes.dataloader import BaseDataLoader

logger = logging.getLogger(__name__)

class ImageDataLoader(BaseDataLoader):
    """Data loader for data from image files."""

    COMPATIBLE_COMPONENTS = ["ImageClassificationTask"]

    @beartype
    def load_data(
        self,
        filepath_or_buffer: Union[UploadFile, str],
        temp_path: str,
        params: Dict[str, Any],
    ) -> DatasetDict:
        """Load an image dataset.

        Parameters
        ----------
        filepath_or_buffer : Union[UploadFile, str], optional
            A URL where the dataset is located or a FastAPI/Uvicorn uploaded file
            object.
        temp_path : str
            The temporary path where the files will be extracted and then uploaded.
        params : Dict[str, Any]
            Dict with the dataloader parameters. This dataloader does not use
            any additional parameters.

        Returns
        -------
        DatasetDict
            A HuggingFace's Dataset with the loaded data.
        """
        if isinstance(filepath_or_buffer, str):
            dataset = load_dataset("imagefolder", data_files=filepath_or_buffer)
        elif isinstance(filepath_or_buffer, UploadFile):
            if filepath_or_buffer.content_type == "application/zip":
                extracted_files_path = self.extract_files(temp_path, filepath_or_buffer)
                dataset = load_dataset(
                    "imagefolder",
                    data_dir=extracted_files_path,
                )
            else:
                raise Exception(
                    "The image dataloader requires the input file to be a zip file. "
                    f"The following content type was delivered: "
                    f"{filepath_or_buffer.content_type}"
                )

        return dataset

    @classmethod
    def get_schema(cls) -> Dict[str, Any]:
        """Load the JSON schema asocciated to the dataloader."""
        try:
            # path is the directory that contains this file
            path = os.path.dirname(os.path.realpath(__file__))
            with open(
                os.path.join(path, "ImageDataLoader.json"),
            ) as f:
                schema = json.load(f)
            return schema

        except FileNotFoundError:
            logger.exception(
                f"Could not load the schema for {cls.__name__} : File DashAI/back"
                f"/dataloaders/description_schemas/{cls.__name__}.json not found.",
            )
            return {}

    @staticmethod
    def get_squema(type, name):
        try:
            # path is the directory that contains this file
            path = os.path.dirname(os.path.realpath(__file__))
            with open(
                os.path.join(path, "image_dataloader.json"),
            ) as f:
                return json.load(f)

        except FileNotFoundError:
            logger.exception(
                f"Could not load the schema for {name} ({type}): "
                "file image_dataloader.json not found."
            )
            return {}
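A minimal, hypothetical call to the string branch of `load_data` (the path is a placeholder; inside DashAI the `UploadFile` branch is used when a zip is uploaded through the API):

from image_classification_package.image_dataloader import ImageDataLoader

loader = ImageDataLoader()
# The string branch forwards the path to datasets.load_dataset("imagefolder", ...).
dataset = loader.load_data(
    filepath_or_buffer="path/to/dataset.zip",
    temp_path="tmp",
    params={},
)
print(dataset)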