Source code for easygraph.datasets.dynamic.email_eu
import json
import os
from easygraph.convert import dict_to_hypergraph
from easygraph.datasets.dynamic.load_dataset import request_json_from_url
from easygraph.datasets.graph_dataset_base import EasyGraphDataset
from easygraph.datasets.utils import _get_eg_url
from easygraph.datasets.utils import tensor
[docs]class Email_Eu(EasyGraphDataset):
_urls = {
"email-eu": "easygraph-data-email-eu/-/raw/main/email-eu.json?inline=false",
}
def __init__(
self,
raw_dir=None,
force_reload=False,
verbose=True,
transform=None,
save_dir="./",
):
name = "email-eu"
self.url = _get_eg_url(self._urls[name])
super(Email_Eu, self).__init__(
name=name,
url=self.url,
raw_dir=raw_dir,
force_reload=force_reload,
verbose=verbose,
transform=transform,
save_dir=save_dir,
)
@property
def url(self):
return self._url
@property
def save_name(self):
return self.name
def __getitem__(self, idx):
assert idx == 0, "This dataset has only one graph"
if self._transform is None:
return self._g
else:
return self._transform(self._g)
[docs] def load(self):
graph_path = os.path.join(self.save_path, self.save_name + ".json")
with open(graph_path, "r") as f:
self.load_data = json.load(f)
[docs] def has_cache(self):
graph_path = os.path.join(self.save_path, self.save_name + ".json")
if os.path.exists(graph_path):
return True
return False
[docs] def download(self):
if self.has_cache():
self.load()
else:
root = self.raw_dir
data = request_json_from_url(self.url)
with open(os.path.join(root, self.save_name + ".json"), "w") as f:
json.dump(data, f)
self.load_data = data
[docs] def process(self):
"""Loads input data from data directory and transfer to target graph for better analysis
"""
self._g, edge_feature_list = dict_to_hypergraph(self.load_data, is_dynamic=True)
self._g.ndata["hyperedge_feature"] = tensor(
range(1, len(edge_feature_list) + 1)
)
@url.setter
def url(self, value):
self._url = value