Classification Inference Using PyTorch

The classification sample in CVCUDA uses the ResNet50 deep learning model from the torchvision library. Since the model does not come with a softmax layer at the end, we add one. The following code snippet shows how the model is set up for the inference use case with PyTorch.

class ClassificationPyTorch:  # noqa: E302
    def __init__(
        self,
        output_dir,
        batch_size,
        image_size,
        device_id,
        cvcuda_perf,
    ):
        self.logger = logging.getLogger(__name__)
        self.output_dir = output_dir
        self.device_id = device_id
        self.cvcuda_perf = cvcuda_perf
        # The underlying PyTorch model that we use for inference is the ResNet50 model
        # from torchvision.
        torch_model = torchvision_models.resnet50
        weights = torchvision_models.ResNet50_Weights.DEFAULT
        self.labels = weights.meta["categories"]
        # Save the list of labels so that the C++ sample can read it.
        with open(os.path.join(output_dir, "labels.txt"), "w") as f:
            for line in self.labels:
                f.write("%s\n" % line)

        # Inference uses PyTorch to run a classification model on the pre-processed
        # input and outputs the classification scores.
        class Resnet50_Softmax(torch.nn.Module):
            def __init__(self, resnet50):
                super(Resnet50_Softmax, self).__init__()
                self.resnet50 = resnet50

            def forward(self, x):
                infer_output = self.resnet50(x)
                return torch.nn.functional.softmax(infer_output, dim=1)

        resnet_base = torch_model(weights=weights)
        resnet_base.eval()
        self.model = Resnet50_Softmax(resnet_base).cuda(self.device_id)
        self.model.eval()

        self.logger.info("Using PyTorch as the inference engine.")

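Only the output directory, batch and image sizes, CUDA device index, and the sample's performance-logging helper are needed to construct the class. Below is a minimal usage sketch, not taken from the sample itself: the no-op perf helper, the output path, and the argument values are assumptions standing in for what the sample's pipeline normally supplies.

import os


# Hypothetical stand-in for the sample's cvcuda_perf helper; it only provides the
# push_range/pop_range interface that ClassificationPyTorch actually calls.
class NoOpPerf:
    def push_range(self, name):
        pass

    def pop_range(self):
        pass


output_dir = "/tmp/classification_out"  # assumed path; labels.txt is written here
os.makedirs(output_dir, exist_ok=True)

inference = ClassificationPyTorch(
    output_dir=output_dir,
    batch_size=4,            # illustrative batch size
    image_size=(224, 224),   # ResNet50's usual input resolution
    device_id=0,
    cvcuda_perf=NoOpPerf(),
)
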
To run inference, the __call__ method is used. It moves the input to the correct CUDA device, converting a CVCUDA tensor to a Torch tensor if needed, and performs the forward inference pass without computing gradients.

def __call__(self, tensor):
    self.cvcuda_perf.push_range("inference.torch")

    with torch.no_grad():

        if isinstance(tensor, torch.Tensor):
            if not tensor.is_cuda:
                tensor = tensor.to("cuda:%d" % self.device_id)
        else:
            # Convert CVCUDA tensor to Torch tensor.
            tensor = torch.as_tensor(
                tensor.cuda(), device="cuda:%d" % self.device_id
            )

        classification_scores = self.model(tensor)

    self.cvcuda_perf.pop_range()
    return classification_scores
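
Because softmax is applied inside the wrapper module, the returned tensor holds per-class probabilities with shape (batch_size, num_classes), each row summing to 1. The snippet below is a small sketch, not part of the sample, of one way to map those scores back to the label names stored in self.labels; input_tensor is assumed to be an already pre-processed NCHW float tensor on the GPU.

scores = inference(input_tensor)  # (batch_size, 1000) probabilities over ImageNet classes
top_probs, top_ids = torch.topk(scores, k=5, dim=1)

for probs, ids in zip(top_probs, top_ids):
    for p, i in zip(probs.tolist(), ids.tolist()):
        print("%s: %.3f" % (inference.labels[i], p))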