Adding some graph stats
This commit is contained in:
parent
68c103db4d
commit
9295e91181
|
@ -0,0 +1,90 @@
|
|||
#!/usr/bin/env python
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
import logging
|
||||
import os
|
||||
import threading
|
||||
from inspect import getmembers, isfunction, signature
|
||||
|
||||
# import custom_graphgym # noqa, register custom modules
|
||||
import networkx as nx
|
||||
import pandas as pd
|
||||
from docstring_parser import parse
|
||||
from torch_geometric.data import Data
|
||||
# from torch_geometric.explain import Explanation
|
||||
from torch_geometric.utils import to_networkx
|
||||
|
||||
# Names of return types (spelled the way a docstring might write them).
# NOTE(review): presumably intended to select functions that return a scalar
# or dict statistic; in this file the list is only referenced from
# commented-out code in GraphStat.available_map_networkx -- confirm before
# relying on it.
GRAPH_STAT_TYPE = ["int", "float", "bool", "boolean", "dict", "dictionary"]
|
||||
|
||||
|
||||
class GraphStat(object):
    """Best-effort collector of graph statistics.

    Two "backends" are registered in ``self.maps``:

    * ``"networkx"``: functions discovered in ``nx.algorithms``; they are
      called on an undirected networkx conversion of the input.
    * ``"torch_geometric"``: a fixed list of attribute names read from a copy
      of the input object.

    Calling the instance runs every registered function with the prepared
    input as its only argument. A function that raises is skipped, so the
    result only contains the statistics that could be computed.
    """

    def __init__(self):
        # Must be a list from the start: ``to_series`` appends to it and may
        # be called before ``__call__`` has reset it.
        self.stat = []
        self.maps = {
            "networkx": self.available_map_networkx(),
            "torch_geometric": self.available_map_torch_geometric(),
        }

    def available_map_networkx(self):
        """Return ``{name: function}`` for the functions in ``nx.algorithms``.

        Functions whose name contains ``"all_"`` are excluded. No filtering on
        the documented return type is applied; functions that cannot be
        called with a single graph argument are skipped later by
        ``__call__``.
        """
        return {
            name: func
            for name, func in getmembers(nx.algorithms, isfunction)
            if "all_" not in name
        }

    def available_map_torch_geometric(self):
        """Return ``{name: getter}`` for a fixed set of attribute names.

        Each getter takes one object and returns ``getattr(obj, name)``. The
        attribute may be a plain value or a method; ``__call__`` invokes it
        when it is callable.
        """
        names = [
            "num_nodes",
            "num_edges",
            "has_self_loops",
            "has_isolated_nodes",
            "y",
        ]
        # ``name=name`` binds the current name at definition time; without it
        # every lambda would read the last name of the loop.
        # ``getattr`` is used instead of calling ``__getattr__`` directly,
        # because ``__getattr__`` is only a fallback hook and is absent on
        # objects that do not define it.
        return {
            name: (lambda x, name=name: getattr(x, name)) for name in names
        }

    def to_series(self, name, val):
        """Append a one-element ``pd.Series`` ``{name: val}`` to ``self.stat``."""
        self.stat.append(pd.Series(data={name: val}))

    def __call__(self, data):
        """Compute every registered statistic for ``data``.

        Args:
            data: Graph object. It must provide ``__copy__`` and, when the
                ``"networkx"`` backend is registered, be accepted by
                ``to_networkx``.

        Returns:
            list: One single-element ``pd.Series`` per statistic that was
            computed without raising, in registration order. The same list
            is stored in ``self.stat`` and is replaced on every call.
        """
        self.stat = []
        for backend, funcs in self.maps.items():
            if backend == "networkx":
                target = to_networkx(data).to_undirected()
            else:
                # "torch_geometric" and any other backend work on a copy of
                # the input object.
                target = data.__copy__()

            for name, func in funcs.items():
                try:
                    value = func(target)
                    # torch_geometric getters may hand back a bound method
                    # (e.g. ``has_self_loops``); call it to get the value.
                    if callable(value) and backend == "torch_geometric":
                        value = value()
                    self.to_series(name, value)
                except Exception as exc:
                    # Deliberate best effort: many discovered functions need
                    # extra arguments or reject this kind of graph.
                    # ``Exception`` (not a bare ``except``) lets
                    # KeyboardInterrupt / SystemExit propagate.
                    logging.getLogger(__name__).debug(
                        "Skipping %s.%s: %s", backend, name, exc
                    )
                    continue
        return self.stat
|
||||
|
||||
|
||||
# Demo: compute the statistics of the KarateClub graph and print the ones
# whose Series dtype is neither 'int' nor 'float'.
# NOTE(review): this runs at module top level, i.e. also whenever the module
# is imported -- confirm that is intended.
from torch_geometric.datasets import KarateClub

d = KarateClub()
a = d[0]  # first graph of the dataset
st = GraphStat()
stat = st(a)

for item in stat:
    # Int/float statistics are skipped; everything else is shown.
    if not (item.dtypes == 'int' or item.dtypes == 'float'):
        print(item)
|
Loading…
Reference in New Issue