Source code for rllm.transforms.graph_transforms.gdc

from typing import Any, Dict, Optional

import numpy as np
import scipy.sparse as sp
import torch
from torch import Tensor

from rllm.transforms.graph_transforms import EdgeTransform
from rllm.transforms.graph_transforms.functional import add_remaining_self_loops
from rllm.utils.sparse import sparse_mx_to_torch_sparse_tensor



[docs]
class GDC(EdgeTransform):
    r"""Processes the graph via Graph Diffusion Convolution (GDC) from the
    `"Diffusion Improves Graph Learning" <https://arxiv.org/abs/1911.05485>`_
    paper (functional name: :obj:`gdc`).

    Args:
        self_loop_weight (float, optional): Weight of the added self-loop.
            Set to :obj:`None` to add no self-loops. (default: :obj:`1`)

        normalize_in (str, optional): Normalization scheme of transition
            matrix on input graph. Possible values:
            :obj:`"sym"`, :obj:`"col"`, and :obj:`"row"`.
            (default: :obj:`"sym"`)

        normalize_out (str, optional): Normalization scheme of transition
            matrix on output graph. Possible values:
            :obj:`"sym"`, :obj:`"col"`, :obj:`"row"`, and :obj:`None`.
            (default: :obj:`"col"`)

        diffusion (dict, optional): Dictionary containing the parameters
            for diffusion. Its :obj:`"method"` entry selects the diffusion
            (:obj:`"ppr"` or :obj:`"heat"`); the remaining entries are
            forwarded to :meth:`diffusion_matrix` as keyword arguments.
            Each diffusion method requires different additional parameters.
            (default: :obj:`dict(method='ppr', alpha=0.15)`)

        sparsification (dict, optional): Dictionary containing the
            parameters for sparsification. Its :obj:`"method"` entry selects
            the sparsification (:obj:`"threshold"` or :obj:`"topk"`); the
            remaining entries are forwarded to :meth:`sparsify_matrix` as
            keyword arguments.
            Each sparsification method requires different additional
            parameters.
            (default: :obj:`dict(method='threshold', avg_degree=64)`)

    """

    def __init__(
        self,
        self_loop_weight: Optional[float] = 1.0,
        normalize_in: str = "sym",
        normalize_out: Optional[str] = "col",
        diffusion: Optional[Dict[str, Any]] = None,
        sparsification: Optional[Dict[str, Any]] = None,
    ) -> None:
        super().__init__()
        self.self_loop_weight = self_loop_weight
        self.normalize_in = normalize_in
        self.normalize_out = normalize_out
        # The defaults are built per instance (and user dicts are copied) so
        # that no configuration dict is ever shared between transforms.
        self.diffusion = (
            dict(method="ppr", alpha=0.15) if diffusion is None else dict(diffusion)
        )
        self.sparsification = (
            dict(method="threshold", avg_degree=64)
            if sparsification is None
            else dict(sparsification)
        )

    @torch.no_grad()
    def forward(self, adj: Tensor) -> Tensor:
        r"""Apply GDC to the adjacency matrix and return the new adjacency.

        Args:
            adj (Tensor): The adjacency matrix of the input graph.

        Returns:
            Tensor: The result of :meth:`get_transition_matrix` applied to
            the sparsified diffusion matrix with :obj:`normalize_out`.
        """
        # A falsy weight (``None`` or ``0``) skips the self-loop step.
        if self.self_loop_weight:
            adj = add_remaining_self_loops(adj, fill_value=self.self_loop_weight)

        # 1. Transition matrix of the input graph.
        trans_matrix = self.get_transition_matrix(adj, self.normalize_in)

        # 2. Sum over T^k, i.e. the generalized graph diffusion.
        diff_matrix = self.diffusion_matrix(trans_matrix, **self.diffusion)

        # 3. Sparsify the diffusion matrix.
        sparsified = self.sparsify_matrix(diff_matrix, **self.sparsification)

        # "threshold" hands back a dense tensor while "topk" already builds a
        # sparse COO tensor; only convert when it is still dense.
        if not sparsified.is_sparse:
            sparsified = sparsified.to_sparse_coo()

        # 4. Transition matrix of the sparsified diffusion graph.
        return self.get_transition_matrix(sparsified, self.normalize_out)


[docs]
    def get_transition_matrix(
        self,
        adj: Tensor,
        normalize: Optional[str],
    ) -> Tensor:
        r"""Get the transition matrix of the given sparse matrix.

        Args:
            adj (Tensor): The adjacency matrix. It must be a sparse COO
                tensor, because it is coalesced and its indices/values are
                read directly.
            normalize (str): The normalization scheme is adopted:

                1. :obj:`"sym"`: Symmetric normalization,
                   :math:`D^{-1/2} A D^{-1/2}` with row-sum degrees.
                2. :obj:`"col"`: Column-wise normalization,
                   :math:`A D^{-1}` with column-sum degrees, so every
                   non-empty column sums to one.
                3. :obj:`"row"`: Row-wise normalization,
                   :math:`D^{-1} A` with row-sum degrees, so every
                   non-empty row sums to one.
                4. :obj:`None`: No normalization.

        Returns:
            Tensor: The (normalized) matrix, converted from a SciPy COO
            matrix by :obj:`sparse_mx_to_torch_sparse_tensor`.

        Raises:
            ValueError: If :obj:`normalize` is not one of the values above.
        """
        adj = adj.coalesce()
        indices = adj.indices().detach().cpu().numpy()
        values = adj.values().detach().cpu().numpy()
        # Integer weights cannot be raised to a negative power by NumPy and
        # could not hold the normalized result anyway.
        if not np.issubdtype(values.dtype, np.floating):
            values = values.astype(np.float64)
        adj_sp = sp.csr_matrix(
            (values, (indices[0], indices[1])), shape=tuple(adj.shape)
        )

        def inverse_degree(axis: int, power: float):
            # axis=1 sums each row, axis=0 sums each column.
            deg = np.asarray(adj_sp.sum(axis=axis)).flatten()
            inv = np.zeros_like(deg)
            # Zero-degree nodes get a zero scale factor instead of relying on
            # an exact floating-point comparison with a sentinel value.
            has_weight = deg != 0
            inv[has_weight] = np.power(deg[has_weight], power)
            return sp.diags(inv)

        if normalize == "sym":
            deg_inv_sqrt = inverse_degree(axis=1, power=-0.5)
            normalized = deg_inv_sqrt @ adj_sp @ deg_inv_sqrt
        elif normalize == "col":
            # Right-multiplication rescales columns, so use column sums.
            normalized = adj_sp @ inverse_degree(axis=0, power=-1)
        elif normalize == "row":
            # Left-multiplication rescales rows, so use row sums.
            normalized = inverse_degree(axis=1, power=-1) @ adj_sp
        elif normalize is None:
            # Still hand a SciPy matrix (not the torch tensor) to the
            # converter below.
            normalized = adj_sp
        else:
            raise ValueError(
                f"Unsupported normalization '{normalize}'. "
                "Expected one of: 'sym', 'col', 'row', None."
            )
        return sparse_mx_to_torch_sparse_tensor(sp.coo_matrix(normalized))



[docs]
    def diffusion_matrix(  # noqa: D417
        self,
        adj: Tensor,
        method: str,
        **kwargs,
    ) -> Tensor:
        r"""Get the diffusion of the given sparse graph.

        Args:
            adj (Tensor): The adjacency matrix.
            num_nodes (int): Number of nodes.
            method (str): Diffusion method:

                1. :obj:`"ppr"`: Use personalized PageRank as diffusion.
                   Additionally expects the parameter:

                   - **alpha** (*float*) - Return probability in PPR.
                     default:obj:`[0.05, 0.2]`.

                2. :obj:`"heat"`: Use heat kernel diffusion.
                   Additionally expects the parameter:

                   - **t** (*float*) - Time of diffusion.
                     default:obj:`[2, 10]`.

        """
        if method == "ppr":
            # α (I_n + (α - 1) A)^-1
            diff_matrix = (kwargs["alpha"] - 1) * adj
            diff_matrix = add_remaining_self_loops(diff_matrix).to_dense()
            diff_matrix = kwargs["alpha"] * torch.inverse(diff_matrix)

        elif method == "heat":
            # exp(t (A - I_n))
            diff_matrix = add_remaining_self_loops(adj, fill_value=-1)
            diff_matrix = kwargs["t"] * diff_matrix
            diff_matrix = diff_matrix.exp()

        else:
            raise ValueError(f"Exact GDC diffusion '{method}' unknown")

        return diff_matrix



[docs]
    def sparsify_matrix(  # noqa: D417
        self,
        mx: Tensor,
        method: str,
        **kwargs,
    ) -> Tensor:
        r"""Sparsifies the given sparse graph.

        Args:
            adj (Tensor): The adjacency matrix.
            num_nodes (int): Number of nodes.
            method (str): Method of sparsification:

                1. :obj:`"threshold"`: Remove all edges with weights smaller
                   than :obj:`eps`.
                   Additionally expects two parameters:

                   - **eps** (*float*) - Threshold to bound edges at.

                   - **avg_degree** (*int*) - If `eps` is not given,
                     it can optionally be calculated by calculating the
                     value of `avg_degree`.

                2. :obj:`"topk"`: Keep top-k edges on the given dim.
                   Additionally expects two parameters:

                   - **k** (*int*) - The number of edges to keep.

                   - **dim** (*int*) - The dim along which to take the top.

        """
        if method == "threshold":
            if "eps" not in kwargs.keys():
                kwargs["eps"] = self.__calculate_eps__(
                    mx,
                    kwargs["avg_degree"],
                )
            mx[mx < kwargs["eps"]] = 0
        elif method == "topk":
            k, dim = min(mx.size(0), kwargs["k"]), kwargs["dim"]
            if dim not in [0, 1]:
                raise ValueError(f"Expected dim to be 0 or 1, but got {dim}.")
            sort_idx = torch.argsort(mx, dim=dim, descending=True)
            if dim == 0:
                top_idx = sort_idx[:k]
                edge_weight = torch.gather(mx, dim=dim, index=top_idx).flatten()
                row_idx = torch.arange(mx.size(0), device=mx.device).repeat(k)
                mx = torch.sparse_coo_tensor(
                    torch.stack([row_idx, top_idx.flatten()]), edge_weight, mx.size()
                )
            else:
                top_idx = sort_idx[:, :k]
                edge_weight = torch.gather(mx, dim=dim, index=top_idx).flatten()
                col_idx = torch.arange(mx.size(0), device=mx.device).repeat(k)
                mx = torch.sparse_coo_tensor(
                    torch.stack([top_idx, col_idx.flatten()]), edge_weight, mx.size()
                )
        else:
            raise ValueError(f"GDC sparsification '{method}' unknown")

        return mx


    def __calculate_eps__(
        self,
        adj: Tensor,
        avg_degree: int,
    ) -> float:
        r"""Get threshold necessary to achieve a given average degree.

        Args:
            adj (Tensor): The adjacency matrix.
            avg_degree (int): Target average degree.

        """
        edge_weights = adj.flatten()
        sorted_edges = torch.sort(edge_weights.flatten(), descending=True).values
        if avg_degree * adj.size(0) > len(sorted_edges):
            return -np.inf

        left = sorted_edges[avg_degree * adj.size(0) - 1]
        right = sorted_edges[avg_degree * adj.size(0)]
        return float(left + right) / 2.0