Source code for roksana.attack_methods.pagerank

"""
PageRankAttack Module
----------------------
This module implements the PageRankAttack class for adversarial attacks on graphs by selectively removing edges
connected to nodes based on their PageRank scores.

Classes:
    - PageRankAttack: A class to perform PageRank-based edge removal attacks on a graph dataset.
"""

from .base_attack import BaseAttack
import torch
from torch_geometric.utils import remove_self_loops, to_undirected, to_networkx
from networkx import pagerank
from typing import Any, List, Tuple



[docs]
class PageRankAttack(BaseAttack):
    """
    PageRankAttack Class
    ---------------------
    Implements an adversarial attack that removes edges connected to nodes based on their PageRank scores.

    Attributes:
        data (Any): The graph dataset.
        params (dict): Additional parameters for the attack.
    """


[docs]
    def __init__(self, data: Any, **kwargs):
        """
        Initialize the PageRankAttack method.

        Args:
            data (Any): The graph dataset.
            **kwargs: Additional parameters for the attack.
        """
        self.data = data
        self.params = kwargs
        self.device = kwargs.get('device', torch.device('cuda' if torch.cuda.is_available() else 'cpu'))




[docs]
    def attack(self, data: Any, selected_nodes: torch.Tensor) -> Tuple[Any, List[Tuple[int, int]]]:
        """
        Perform the PageRank-based attack on the graph dataset.

        Args:
            data (Any): The graph dataset.
            selected_nodes (torch.Tensor): Nodes to target for edge removal. Must be a 1D tensor.

        Returns:
            Tuple[Any, List[Tuple[int, int]]]:
                - updated_data (Any): The modified graph dataset with updated edges.
                - removed_edges (List[Tuple[int, int]]): A list of removed edges.
        """

        # Move data to the appropriate device
        original_data = data.to(self.device)
        edge_index = original_data.edge_index.clone().to(self.device)
        edges = edge_index.t().tolist()

        # Convert to a NetworkX graph for PageRank computation
        G = to_networkx(original_data.to('cpu'), to_undirected=True)  # NetworkX operates on CPU
        pagerank_scores = pagerank(G)

        # Ensure selected_nodes is a 1D tensor
        if isinstance(selected_nodes, torch.Tensor) and selected_nodes.ndimension() == 0:
            selected_nodes = selected_nodes.unsqueeze(0)

        selected_nodes = selected_nodes.to(self.device)

        removed_edges = []  # List to store removed edges

        # Track the number of edges removed to ensure only len(selected_nodes) edges are removed
        removed_edges_count = 0

        # Loop over each node in selected_nodes to remove one edge connected to the highest PageRank node
        for node in selected_nodes.tolist():
            if removed_edges_count >= len(selected_nodes):
                break  # Stop once len(selected_nodes) edges are removed

            # Find edges associated with the current node
            node_edges = [(i, (src, dst)) for i, (src, dst) in enumerate(edges) if src == node or dst == node]

            if node_edges:
                # Find the edge connected to the highest PageRank node
                edge_to_remove = max(
                    node_edges,
                    key=lambda x: pagerank_scores[x[1][1]] if x[1][0] == node else pagerank_scores[x[1][0]]
                )
                edges.pop(edge_to_remove[0])  # Remove the edge from the edge list
                removed_edges.append(edge_to_remove[1])  # Track the removed edge
                removed_edges_count += 1

        # Create a new edge_index tensor from the modified edges
        new_edge_index = torch.tensor(edges, dtype=torch.long, device=self.device).t().contiguous()

        # Remove any self-loops
        new_edge_index, _ = remove_self_loops(new_edge_index)

        # Assign the modified edge_index to the dataset
        updated_data = data.clone().to(self.device)
        updated_data.edge_index = new_edge_index

        return updated_data, removed_edges