release-08-01-10/doxygen/cnn__pid__ecl__module_8py_source.html

#!/usr/bin/env python3

# -*- coding: utf-8 -*-


""" This script includes the core of 'CNN_PID_ECL' module


"""


# @cond


import math

import numpy as np

import torch

import torch.nn.functional as F

from torch.utils.data import DataLoader


import basf2 as b2


from .cnn_pid_conv_net import ConvNet

from .cnn_pid_cluster_image import ClusterImage


class CNN_PID_ECL(b2.Module):

    """ Extracts CNN value for an image


    A model based on convolutional neural network was trained

    on pions and muons' pixel images together with 3 more information

    which were added after convolutional layer. This module uses

    a pretrained model which is used as inference on pions and muons

    in the particle list.


    This module works under the following conditions:

    1. The extrapolated tracks are inside ECL Barrel based

    on ThetaId of central pixel.

    2. Transverse momentum (pt) of extrapolated tracks are

    in [0.2, 1.0] range.


    The goal is better muon and pion separation in the ECL barrel for

    low pt tracks.

    """


    from ROOT import Belle2

    import pdg


    def __init__(

        self,

        path,

        image_length=7,

        threshold=0.001,

        thetaId_range=(13, 58),

        pt_range=(0.2, 1.0)

    ):

        super().__init__()


        self.image_length = image_length

        self.threshold = threshold

        self.thetaId_range = thetaId_range

        self.pt_range = pt_range

        self.path = path


        self.device = torch.device('cpu')


    def initialize(self):

        """ Initialize necessary arrays and/or objects """


        self.eclCalDigits = self.Belle2.PyStoreArray('ECLCalDigits')

        self.mapping = self.Belle2.PyStoreObj('ECLCellIdMapping')

        self.eclCnnMuon = self.Belle2.PyStoreArray(self.Belle2.ECLCNNPid.Class())

        self.eclCnnMuon.registerInDataStore()

        self.tracks = self.Belle2.PyStoreArray('Tracks')

        self.tracks.registerRelationTo(self.eclCnnMuon)


    def beginRun(self):

        """ Read CNN payloads which include weights and biases """


        self.charge = 'plus'

        self.model_plus = self.read_model()


        self.charge = 'minus'

        self.model_minus = self.read_model()


    def event(self):

        """ Event processing


        This function goes through the particleList and find eclcaldigit of

        an extrapolated track. Then it extracts the energy for a 7x7 pixel image

        around the entering position of the track. In addition it extracts

        ThetaId and PhiId of central pixel in a 7x7 image together with Pt of

        the track. Then, it calculates the CNN values for an extrapolated being

        muon- or pion-like.

        """


        variable_muon = 'cnn_pid_ecl_muon'


        for track in self.tracks:


            fit_result = track.getTrackFitResultWithClosestMass(self.Belle2.Const.pion)

            if not fit_result:

                continue


            charge = fit_result.getChargeSign()

            if charge == 0:

                continue


            extHit_dict = self.getExtCell(track)


            if (track and extHit_dict):

                maxCellId = extHit_dict['cellid']

                self.pt = extHit_dict['pt']

                self.pt = np.array([self.pt])


                if charge == -1.0:

                    model = self.model_minus

                elif charge == 1.0:

                    model = self.model_plus


                self.extThetaId = self.mapping.getCellIdToThetaId(maxCellId)

                self.extThetaId = np.array([self.extThetaId])

                self.extPhiId = self.mapping.getCellIdToPhiId(maxCellId)

                self.extPhiId = np.array([self.extPhiId])


                if maxCellId < 0:

                    b2.B2WARNING('maxCellId is less 0.')

                else:

                    # Since CNN can only predict PID of the tracks inside the barrel,

                    # there are two hard-coded numbers in the __init__ (13 and 58),

                    # representing the thetaID limit.

                    if (self.extThetaId > self.thetaId_range[0] and

                        self.extThetaId < self.thetaId_range[1] and

                        self.pt >= self.pt_range[0] and

                            self.pt <= self.pt_range[1]):


                        energy_list = []

                        neighbours = self.mapping.getCellIdToNeighbour7(maxCellId)


                        for posid in range(self.image_length ** 2):

                            if posid < neighbours.size():

                                neighbourid = neighbours[posid]


                                storearraypos = self.mapping.getCellIdToStoreArray(neighbourid)

                                energy = 0.0

                                if storearraypos >= 0:

                                    energy = self.eclCalDigits[storearraypos].getEnergy()

                                energy_list.append(energy)


                        self.energy_array = np.array(energy_list)


                        prob_CNN_dict = self.extract_cnn_value(model)

                        prob_CNN_muon = prob_CNN_dict['cnn_muon']


                        eclCnnMuon = self.eclCnnMuon.appendNew()

                        eclCnnMuon.setEclCnnMuon(prob_CNN_muon)

                        track.addRelationTo(eclCnnMuon)


                        b2.B2DEBUG(22, f'{variable_muon}: {prob_CNN_muon}')

                    else:

                        b2.B2DEBUG(22, 'Track is either outside ECL Barrel or Pt is outside [0.2, 1.0] GeV/c. No CNN value.')


    def getExtCell(self, track):

        """ Extract cellId and pt of an extrapolated track


        The output is dictionary which has cellId and pt.

        """


        myDetID = self.Belle2.Const.EDetector.ECL

        hypothesis = self.Belle2.Const.pion

        pdgCode = abs(hypothesis.getPDGCode())


        extHits = track.getRelationsTo('ExtHits')


        for extHit in extHits:

            if abs(extHit.getPdgCode()) != pdgCode:

                continue

            if extHit.getDetectorID() != myDetID:

                continue

            if extHit.getStatus() != self.Belle2.ExtHitStatus.EXT_EXIT:

                continue

            if extHit.isBackwardPropagated():

                continue

            copyid = extHit.getCopyID()

            if copyid == -1:

                continue

            cellid = copyid + 1


            px = extHit.getMomentum().X()

            py = extHit.getMomentum().Y()

            pt = math.sqrt(px**2 + py**2)


            extHit_dict = {

                'cellid': cellid,

                'pt': pt,

            }


            return(extHit_dict)


    def extract_cnn_value(self, model):

        """ Extract CNN values for an extrapolated track


        The output of this function is dictionary

        which includes two probabilities:


        cnn_pion: Probability of an extrapolated track being pion

        cnn_muon: Probability of an extrapolated track being muon


        NOTE: cnn_pion and cnn_muon are floats.

        """


        test_loader = self.prepare_images()

        model.eval()


        with torch.no_grad():

            for energy, theta, phi, pt in test_loader:


                energy = energy.to(self.device)

                theta = theta.to(self.device)

                phi = phi.to(self.device)

                pt = pt.to(self.device)


                output = model(energy, theta, phi, pt)

                output = F.softmax(output, dim=1)


        prob_CNN_pion = output[0][0].item()

        prob_CNN_muon = output[0][1].item()


        prob_dict = {

            'cnn_pion': prob_CNN_pion,

            'cnn_muon': prob_CNN_muon,

        }


        return(prob_dict)


    def prepare_images(self):

        """ Prepare images


        A dictionary is passed to a function (ClusterImage)

        in order to prepare proper format for CNN inputs.

        """


        params_image = {

            'image_length': self.image_length,

            'energy_image': self.energy_array,

            'thetaId': self.extThetaId,

            'phiId': self.extPhiId,

            'pt': self.pt,

            'threshold': self.threshold

        }


        dataset = ClusterImage(params_image)

        infer_loader = DataLoader(dataset, shuffle=False)


        return(infer_loader)


    def model_cnn_name(self):

        """ Create CNN model name


        The outputs of this function are:

        1. CNN model's name

        2. Models parameters which is important for

        initializing ConvNet.


        Models parameters should be exactly the same as the CNN model

        which was trained.

        """


        model_name = f'ECLCNNPID_charge_{self.charge}'


        params_model = {

            'input_shape': (1, self.image_length, self.image_length),

            'initial_filters': 64,

            'num_emb_theta': 44,

            'dim_emb_theta': 22,

            'num_emb_phi': 144,

            'dim_emb_phi': 18,

            'num_ext_input': 1,

            'num_fc1': 128,

            'dropout_rate': 0.1,

            'num_classes': 2,

            'energy': True

        }


        return(model_name, params_model)


    def read_model(self):

        """ Load the CNN model


        This function receives model's name and

        CNN parameters, then reads .pt file which

        includes weights and biases for CNN.

        """


        model_name, params_model = self.model_cnn_name()

        model = ConvNet(params_model)

        model = model.to(self.device)


        payload = f'{model_name}.pt'

        accessor = self.Belle2.DBAccessorBase(

            self.Belle2.DBStoreEntry.c_RawFile, payload, True)

        checkpoint = accessor.getFilename()


        model.load_state_dict(torch.load(checkpoint))


        return(model)


# @endcond