Source code for fusilli.fusionmodels.unimodal.image

"""
Unimodal model using only the image data.
"""

import torch.nn as nn
from fusilli.fusionmodels.base_model import ParentFusionModel
from torch.autograd import Variable
import torch
from fusilli.utils import check_model_validity


[docs] class ImgUnimodal(ParentFusionModel, nn.Module): """ A uni-modal model using only the image data. Attributes ---------- img_layers : nn.ModuleDict Dictionary containing the layers of the image data. fused_dim : int Number of features of the fused layers. This is the flattened output size of the image layers. fused_layers : nn.Sequential Sequential layer containing the fused layers. final_prediction : nn.Sequential Sequential layer containing the final prediction layers. """ #: str: Name of the method. method_name = "Image unimodal" #: str: Type of modality. modality_type = "img" #: str: Type of fusion. fusion_type = "unimodal"
[docs] def __init__(self, prediction_task, data_dims, multiclass_dimensions): """ Parameters ---------- prediction_task : str Type of prediction to be performed. data_dims : list List containing the dimensions of the data. multiclass_dimensions : int Number of classes in the multiclass classification task. """ ParentFusionModel.__init__( self, prediction_task, data_dims, multiclass_dimensions ) self.prediction_task = prediction_task self.set_img_layers() self.get_fused_dim() self.set_fused_layers(self.fused_dim) self.calc_fused_layers()
[docs] def get_fused_dim(self): """ Get the number of features of the fused layers. Returns ------- None """ dummy_conv_output = Variable(torch.rand((1,) + tuple(self.img_dim))) for layer in self.img_layers.values(): dummy_conv_output = layer(dummy_conv_output) flattened_img_output_size = dummy_conv_output.data.view(1, -1).size(1) self.fused_dim = flattened_img_output_size
[docs] def calc_fused_layers(self): """ Calculates the fused layers. Returns ------- None """ # check img layers check_model_validity.check_dtype(self.img_layers, nn.ModuleDict, "img_layers") check_model_validity.check_img_dim(self.img_layers, self.img_dim, "img_layers") # check fused layers self.get_fused_dim() self.fused_layers, out_dim = check_model_validity.check_fused_layers( self.fused_layers, self.fused_dim ) self.set_final_pred_layers(out_dim)
[docs] def forward(self, x): """ Forward pass of the model. Parameters ---------- x : torch.Tensor Tensor containing the image data. Returns ------- out_pred : torch.Tensor Tensor containing the predicted values. """ check_model_validity.check_model_input(x) x_img = x for layer in self.img_layers.values(): x_img = layer(x_img) x_img = x_img.view(x_img.size(0), -1) out_fuse = self.fused_layers(x_img) out_pred = self.final_prediction(out_fuse) return out_pred