Source code for mowl.models.boxel.examples.model_ppi

from mowl.models.boxel.model import BoxEL
from mowl.evaluation import PPIEvaluator
import torch as th
import numpy as np



[docs]
class BoxELPPI(BoxEL):
    """
    Example of BoxEL for protein-protein interaction prediction.

    Customizes negative sampling to use only protein IDs from the evaluation
    classes instead of all ontology classes.
    """

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.set_evaluator(PPIEvaluator)
        self.eval_gci_name = "gci2"
        self._protein_ids = None

    @property
    def protein_ids(self):
        if self._protein_ids is None:
            self._protein_ids = [
                self.class_index_dict[p]
                for p in self.dataset.evaluation_classes[0].as_str
            ]
        return self._protein_ids


[docs]
    def get_negative_sampling_config(self):
        return {
            "gci2": {"corrupt_column": 2}
        }



[docs]
    def generate_negatives(self, gci_name, gci_dataset):
        if gci_name != "gci2":
            return None

        data = gci_dataset[:]
        idxs_for_negs = np.random.choice(
            self.protein_ids, size=len(gci_dataset), replace=True
        )
        rand_index = th.tensor(idxs_for_negs, dtype=th.long, device=self.device)
        neg_data = th.cat([data[:, :2], rand_index.unsqueeze(1)], dim=1)
        return neg_data



[docs]
    def evaluate_ppi(self):
        self.init_module()
        print("Load the best model", self.model_filepath)
        self.load_best_model()
        with th.no_grad():
            metrics = self.evaluate()
            print(metrics)