|
| 1 | +from abc import ABC, abstractmethod |
| 2 | +from dataclasses import dataclass |
| 3 | +from typing import Any, List |
| 4 | + |
| 5 | +from graphgen.bases.base_storage import BaseGraphStorage |
| 6 | +from graphgen.bases.datatypes import Community |
| 7 | + |
| 8 | + |
@dataclass
class BasePartitioner(ABC):
    """
    Abstract base class for graph partitioners.

    Subclasses implement :meth:`partition`. The static helpers convert
    communities into (nodes, edges) batches and build adjacency structures
    from such node/edge lists.
    """

    @abstractmethod
    async def partition(
        self,
        g: BaseGraphStorage,
        **kwargs: Any,
    ) -> List[Community]:
        """
        Graph -> Communities
        :param g: Graph storage instance
        :param kwargs: Additional parameters for partitioning
        :return: List of communities
        """

    @staticmethod
    async def community2batch(
        communities: List[Community], g: BaseGraphStorage
    ) -> list[
        tuple[
            list[tuple[str, dict]], list[tuple[Any, Any, dict] | tuple[Any, Any, Any]]
        ]
    ]:
        """
        Convert communities to batches of nodes and edges.

        Each community's ``nodes`` and ``edges`` are looked up in ``g``.
        Nodes and edges whose lookup returns a falsy value are left out of
        the batch.

        :param communities: Communities to convert; each must expose
            ``nodes`` (iterable of node ids) and ``edges`` (iterable of
            ``(u, v)`` pairs)
        :param g: Graph storage instance
        :return: List of batches, each batch is a tuple of (nodes, edges)
        """
        batches = []
        for comm in communities:
            nodes_data = []
            for node in comm.nodes:
                node_data = await g.get_node(node)
                if node_data:
                    nodes_data.append((node, node_data))

            edges_data = []
            for u, v in comm.edges:
                # The edge may be stored in either orientation: try (u, v)
                # first, then (v, u), and keep the orientation that was found.
                for src, dst in ((u, v), (v, u)):
                    edge_data = await g.get_edge(src, dst)
                    if edge_data:
                        edges_data.append((src, dst, edge_data))
                        break

            batches.append((nodes_data, edges_data))
        return batches

    @staticmethod
    def _build_adjacency_list(
        nodes: List[tuple[str, dict]], edges: List[tuple[str, str, dict]]
    ) -> tuple[dict[str, List[str]], set[tuple[str, str]]]:
        """
        Build adjacency list and edge set from nodes and edges.

        Every edge is recorded in both directions. An edge endpoint that is
        not listed in ``nodes`` gets its own adjacency entry instead of
        raising ``KeyError``.

        :param nodes: ``(node_id, data)`` tuples; only the id is used
        :param edges: ``(source, target, data)`` tuples; only the two ids
            are used
        :return: adjacency list, edge set
        """
        adj: dict[str, List[str]] = {n[0]: [] for n in nodes}
        edge_set: set[tuple[str, str]] = set()
        for e in edges:
            src, dst = e[0], e[1]
            # setdefault tolerates endpoints absent from ``nodes`` (e.g. a
            # node that was filtered out while its edge was kept).
            adj.setdefault(src, []).append(dst)
            adj.setdefault(dst, []).append(src)
            edge_set.add((src, dst))
            edge_set.add((dst, src))
        return adj, edge_set
0 commit comments