Source code for GraphSL.GNN.IVGD.main

import torch.nn.functional as F
import numpy as np
import torch
import torch.nn as nn
from GraphSL.GNN.IVGD.correction import correction
from GraphSL.GNN.IVGD.diffusion_model import I_GCN
from sklearn.metrics import roc_auc_score, f1_score, accuracy_score, precision_score, recall_score
from GraphSL.utils import Metric
import torch.optim as optim
import warnings
warnings.filterwarnings("ignore")



[docs]
class IVGD_model(torch.nn.Module):
    """
     Invertible Validity-aware Graph Diffusion (IVGD) Model.
    """

    def __init__(self, alpha, tau, rho):
        """
        Initializes the IVGD_model.

        Args:

        - alpha (float): Value of alpha parameter.

        - tau (float): Value of tau parameter.

        - rho (float): Value of rho parameter.
        """
        super(IVGD_model, self).__init__()
        self.device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
        self.alpha1 = alpha
        self.alpha2 = alpha
        self.alpha3 = alpha

        self.tau1 = tau
        self.tau2 = tau
        self.tau3 = tau

        self.net1 = correction()
        self.net2 = correction()
        self.net3 = correction()

        self.rho1 = rho
        self.rho2 = rho
        self.rho3 = rho


[docs]
    def forward(self, x, label, lamda):
        """
        Perform the forward pass of IVGD_model.

        Args:

        - x (torch.Tensor): Input tensor.

        - label (torch.Tensor): Label tensor.

        - lamda (float): Value of lambda parameter.

        Returns:

        - x (torch.Tensor): Output tensor after forward pass.
        """
        self.net1.to(self.device)
        self.net2.to(self.device)
        self.net3.to(self.device)
        sum = torch.sum(label)
        label = torch.cat((1 - label, label), dim=1)
        x = torch.cat((1 - x, x), dim=1)
        prob = x[:, 1].unsqueeze(-1)
        x = (self.tau1 * self.net1(prob) - label * torch.softmax(x, dim=1) / label.shape[0] - lamda
             - self.rho1 * (torch.sum(x) - sum) + self.alpha1 * x) / (
            self.tau1 + self.alpha1)
        prob = x[:, 1].unsqueeze(-1)
        lamda = lamda + self.rho1 * (torch.sum(prob) - sum)
        x = (self.tau2 * self.net2(prob) - label * torch.softmax(x, dim=1) / label.shape[0] - lamda
             - self.rho2 * (torch.sum(x) - sum) + self.alpha2 * x) / (
            self.tau2 + self.alpha2)
        prob = x[:, 1].unsqueeze(-1)
        lamda = lamda + self.rho2 * (torch.sum(prob) - sum)
        x = (self.tau3 * self.net3(prob) - label * torch.softmax(x, dim=1) / label.shape[0] - lamda
             - self.rho3 * (torch.sum(x) - sum) + self.alpha3 * x) / (
            self.tau3 + self.alpha3)
        return x





[docs]
class IVGD:
    """
    Implement the Invertible Validity-aware Graph Diffusion (IVGD) model.

    Wang, Junxiang, Junji Jiang, and Liang Zhao. "An invertible graph diffusion neural network for source localization." Proceedings of the ACM Web Conference 2022. 2022.
    """

    def __init__(self):
        """
        Initializes the IVGD model.
        """

        self.device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')


[docs]
    def train_diffusion(self, adj, train_dataset, lr = 1e-4, weight_decay = 1e-4, num_epoch = 50, print_epoch = 10, random_seed=0):
        """
        Train the diffusion model.

        Args:

        - adj (scipy.sparse.csr_matrix): Adjacency matrix of the graph.

        - train_dataset (torch.utils.data.dataset.Subset): the training dataset (number of simulations * number of graph nodes * 2 (the first column is seed vector and the second column is diffusion vector)).

        - lr (float): Learning rate.

        - weight_decay (float): Weight decay.

        - epoch_num (int): Number of epochs.

        - print_epoch (int): Number of epochs every time to print loss.

        - random_seed (int): Random seed.
        
        Returns:

        - diffusion_model (torch.nn.Module): Trained diffusion model.

        Example:

        import os

        curr_dir = os.getcwd()

        from GraphSL.utils import load_dataset, diffusion_generation, split_dataset

        from GraphSL.GNN.IVGD.main import IVGD

        data_name = 'karate'

        graph = load_dataset(data_name, data_dir=curr_dir)

        dataset = diffusion_generation(graph=graph, infect_prob=0.3, diff_type='IC', sim_num=100, seed_ratio=0.1)

        adj, train_dataset, test_dataset =split_dataset(dataset)

        ivgd = IVGD()

        diffusion_model = ivgd.train_diffusion(adj, train_dataset)

        """
        torch.manual_seed(random_seed)
        
        print("train IVGD diffusion model:")

        diffusion_model = I_GCN()

        optimizer = optim.Adam(diffusion_model.parameters(), lr=lr, weight_decay=weight_decay)
        loss_function = nn.MSELoss()

        diffusion_model.train()

        for epoch in range(num_epoch):
            train_loss = 0

            for influ_mat in train_dataset:
                seed_vector = influ_mat[:, 0].unsqueeze(-1).to(self.device)
                diff_vector = influ_mat[:, 1].unsqueeze(-1).to(self.device)

                optimizer.zero_grad()

                output = diffusion_model(adj,seed_vector)+seed_vector
                loss = loss_function(output, diff_vector)

                loss.backward()
                optimizer.step()

            train_loss += loss.item()

            train_loss = train_loss / len(train_dataset)

            if epoch % print_epoch ==0:

                print(f'Epoch [{epoch}/{num_epoch}], Loss: {train_loss:.3f}')

        
        return diffusion_model



[docs]
    def train(
            self,
            adj,
            train_dataset,
            diffusion_model,
            num_thres=10,
            lr=1e-4,
            weight_decay=1e-4,
            num_epoch=200,
            print_epoch=10,
            random_seed=0):
        """
        Train the IVGD model.

        Args:

        - adj (scipy.sparse.csr_matrix): The adjacency matrix of the graph.

        - train_dataset (torch.utils.data.dataset.Subset): the training dataset (number of simulations * number of graph nodes * 2 (the first column is seed vector and the second column is diffusion vector)).

        - diffusion_model (torch.nn.Module): Trained diffusion model.

        - num_thres (int): Number of threshold values to try.

        - lr (float): Learning rate.

        - weight_decay (float): Weight decay.

        - num_epoch (int): Number of epochs for training.

        - print_epoch (int): Number of epochs every time to print loss.

        - random_epoch (int): Random seed.

        Returns:

        - ivgd (torch.nn.Module): Trained IVGD model.

        - opt_thres (float): Optimal threshold value.

        - train_auc (float): Training AUC.

        - opt_f1 (float): Optimal F1 score.

        - pred (numpy.ndarray): Predicted seed vector of the training set, every column is the prediction of every simulation. It is used to adjust thres_list.

        Example:

        import os

        curr_dir = os.getcwd()

        from GraphSL.utils import load_dataset, diffusion_generation, split_dataset

        from GraphSL.GNN.IVGD.main import IVGD

        data_name = 'karate'

        graph = load_dataset(data_name, data_dir=curr_dir)

        dataset = diffusion_generation(graph=graph, infect_prob=0.3, diff_type='IC', sim_num=100, seed_ratio=0.1)

        adj, train_dataset, test_dataset =split_dataset(dataset)

        ivgd = IVGD()

        diffusion_model = ivgd.train_diffusion(adj, train_dataset)

        ivgd_model, thres, auc, f1, pred =ivgd.train(adj, train_dataset, diffusion_model)

        print("IVGD:")

        print(f"train auc: {auc:.3f}, train f1: {f1:.3f}")

        """
        num_node = adj.shape[0]
        num_seed = torch.sum(train_dataset[0][:,0]).item()
        weight =torch.tensor([1,(num_node-num_seed)/num_seed]).to(self.device)
        criterion = nn.CrossEntropyLoss(weight=weight)
        # train_num = len(train_dataset)
        alpha = 0.01
        tau = 0.01
        rho = 1e-3
        lamda = 1e-3
        torch.manual_seed(random_seed)
        ivgd = IVGD_model(alpha=alpha, tau=tau, rho=rho).to(self.device)
        optimizer = optim.Adam(
            ivgd.parameters(),
            lr=lr,
            weight_decay=weight_decay)
        ivgd.train()
        train_num = len(train_dataset)

        seed_preds_list=list()

        print("train IVGD:")

        for influ_mat in train_dataset:
            seed_vec = influ_mat[:, 0].unsqueeze(-1).to(self.device)
            influ_vec = influ_mat[:, -1].unsqueeze(-1).to(self.device)
            # Get predictions
            seed_preds = diffusion_model.backward(adj,influ_vec).detach()
            seed_preds_list.append(seed_preds)
        

        for epoch in range(num_epoch):
            overall_loss = 0
            for i, influ_mat in enumerate(train_dataset):
                optimizer.zero_grad()
                
                # Ensure that influ_mat is on the correct device
                influ_mat = influ_mat.to(self.device)
                
                # Extract and prepare seed_vec
                seed_vec = influ_mat[:, 0].to(self.device)
                seed_vec_unsqueeze = seed_vec.unsqueeze(-1).float()
                
                # Ensure seed_preds_list[i] is detached if it's from a previous computation
                seed_preds_unsqueeze = seed_preds_list[i].detach().to(self.device)
                seed_correction = ivgd(seed_preds_unsqueeze, seed_preds_unsqueeze, lamda)
                
                # Prepare one-hot encoding
                seed_vec_onehot = torch.cat((1-seed_vec_unsqueeze, seed_vec_unsqueeze), dim=1)
                
                # Calculate loss
                loss = criterion(seed_correction, seed_vec_onehot)
                
                # Backward pass
                loss.backward()
                
                # Accumulate loss
                overall_loss += loss.item()
                
                # Update parameters
                optimizer.step()
            
            # Calculate and print average loss for the epoch
            if epoch % print_epoch ==0:
                average_loss = overall_loss / train_num
                print(f"Epoch [{epoch}/{num_epoch}], loss = {average_loss:.3f}")



        ivgd.eval()
        train_auc = 0
        for i, influ_mat in enumerate(train_dataset):
            seed_vec = influ_mat[:, 0]
            seed_preds_unsqueeze = seed_preds_list[i].to(self.device)
            seed_vec = seed_vec.unsqueeze(-1).float()
            seed_correction = ivgd(seed_preds_unsqueeze, seed_preds_unsqueeze, lamda)
            seed_correction = F.softmax(seed_correction, dim=1)
            seed_correction = seed_correction[:, 1].unsqueeze(-1)
            seed_correction = self.normalize(seed_correction)
            seed_correction = seed_correction.cpu().squeeze(-1).detach().numpy()
            seed_vec = seed_vec.detach().numpy()
            train_auc += roc_auc_score(seed_vec, seed_correction)
        train_auc = train_auc / train_num

        pred = np.zeros((num_node, train_num))
        seed_all = np.zeros((num_node, train_num))
        for i, influ_mat in enumerate(train_dataset):
            seed_all[:, i] = influ_mat[:, 0]
            seed_preds_unsqueeze = seed_preds_list[i].to(self.device)
            seed_correction = ivgd(seed_preds_unsqueeze, seed_preds_unsqueeze, lamda)
            seed_correction = F.softmax(seed_correction, dim=1)
            seed_correction = seed_correction[:, 1].unsqueeze(-1)
            seed_correction = self.normalize(seed_correction)
            seed_correction = seed_correction.squeeze(
                -1).cpu().detach().numpy()
            pred[:, i] = seed_correction

        opt_f1 = -1
        opt_thres = -1
        pred_min = pred.min()
        pred_max = pred.max()
        thres_list = np.linspace(pred_min, pred_max, num=num_thres+2)[1:-1].tolist()
        # Find optimal threshold and F1 score
        for thres in thres_list:
            train_f1 = 0
            for i in range(train_num):
                train_f1 += f1_score(seed_all[:, i], pred[:, i] >= thres)
            train_f1 = train_f1 / train_num
            print(f"thres = {thres:.3f}, train_f1 = {train_f1:.3f}")
            if train_f1 > opt_f1:
                opt_f1 = train_f1
                opt_thres = thres

        return ivgd, opt_thres, train_auc, opt_f1, pred



[docs]
    def test(self, adj, test_dataset, diffusion_model, IVGD_model, thres):
        """
        Test the IVGD model on the given test dataset.

        Args:

        - adj (scipy.sparse.csr_matrix): The adjacency matrix of the graph.

        - test_dataset (torch.utils.data.dataset.Subset): the test dataset (number of simulations * number of graph nodes * 2 (the first column is seed vector and the second column is diffusion vector)).

        - diffusion_model (torch.nn.Module): Trained diffusion model.

        - IVGD_model (torch.nn.Module): Trained IVGD model.

        - thres (float): Threshold value.

        Returns:

        - metric (Metric): Object containing test metrics.

        Example:

        import os

        curr_dir = os.getcwd()

        from GraphSL.utils import load_dataset, diffusion_generation, split_dataset

        from GraphSL.GNN.IVGD.main import IVGD

        data_name = 'karate'

        graph = load_dataset(data_name, data_dir=curr_dir)

        dataset = diffusion_generation(graph=graph, infect_prob=0.3, diff_type='IC', sim_num=100, seed_ratio=0.1)

        adj, train_dataset, test_dataset =split_dataset(dataset)

        ivgd = IVGD()

        diffusion_model = ivgd.train_diffusion(adj, train_dataset)

        ivgd_model, thres, auc, f1, pred =ivgd.train(adj, train_dataset, diffusion_model)

        print("IVGD:")

        print(f"train auc: {auc:.3f}, train f1: {f1:.3f}")

        metric = ivgd.test(adj, test_dataset, diffusion_model, ivgd_model, thres)

        print(f"test acc: {metric.acc:.3f}, test pr: {metric.pr:.3f}, test re: {metric.re:.3f}, test f1: {metric.f1:.3f}, test auc: {metric.auc:.3f}")
        """
        IVGD_model = IVGD_model.to(self.device)

        test_num = len(test_dataset)
        test_acc = 0
        test_pr = 0
        test_re = 0
        test_f1 = 0
        test_auc = 0

        lamda = 1e-3

        seed_preds_list=list()

        for influ_mat in test_dataset:

            influ_vec = influ_mat[:, -1].unsqueeze(-1).to(self.device)

            # Get predictions
            seed_preds = diffusion_model.backward(adj,influ_vec)
            seed_preds_list.append(seed_preds)

        # Loop through each test dataset
        for i, influ_mat in enumerate(test_dataset):
            seed_vec = influ_mat[:, 0]
            # Get seed predictions from the diffusion model
            seed_preds_unsqueeze = seed_preds_list[i].to(self.device)
            seed_vec = seed_vec.float().detach().cpu().numpy()

            # Obtain seed correction predictions from the IVGD model
            seed_correction = IVGD_model(seed_preds_unsqueeze, seed_preds_unsqueeze, lamda)
            seed_correction = F.softmax(seed_correction, dim=1)
            seed_correction = seed_correction[:, 1].unsqueeze(-1)
            seed_correction = self.normalize(seed_correction)
            seed_correction = seed_correction.squeeze(
                -1).cpu().detach().numpy()

            # Compute metrics
            test_acc += accuracy_score(seed_vec, seed_correction >= thres)
            test_pr += precision_score(seed_vec,
                                       seed_correction >= thres,
                                       zero_division=1)
            test_re += recall_score(seed_vec,
                                    seed_correction >= thres,
                                    zero_division=1)
            test_f1 += f1_score(seed_vec, seed_correction >=
                                thres, zero_division=1)
            test_auc += roc_auc_score(seed_vec, seed_correction)

        # Compute average metrics
        test_acc = test_acc / test_num
        test_pr = test_pr / test_num
        test_re = test_re / test_num
        test_f1 = test_f1 / test_num
        test_auc = test_auc / test_num

        # Create Metric object containing test metrics
        metric = Metric(test_acc, test_pr, test_re, test_f1, test_auc)
        return metric



[docs]
    def normalize(self, x):
        """
        The input tensor x is normalized to between 0 and 1.

        Args:

        - x (torch.Tensor): Input tensor to be normalized.

        Returns:

        - x (torch.Tensor): Normalized tensor.
        """
        # Compute minimum and maximum values along each dimension
        min_vals, _ = torch.min(x, dim=0)
        max_vals, _ = torch.max(x, dim=0)

        # Compute the range and handle cases where the range is too small
        rang = max_vals - min_vals
        rang[torch.lt(rang, 1e-6)] = 1e-6

        # Perform normalization
        x = (x - min_vals) / rang
        return x