Commit be6f0e70 by zlj

fix some bugs in merge stage

parents d8158bb9 c2ce9bbc
[submodule "third_party/ldg_partition"]
path = third_party/ldg_partition
url = https://gitee.com/onlynagesha/graph-partition-v4
[submodule "third_party/METIS"]
path = third_party/METIS
url = https://github.com/KarypisLab/METIS
branch = v5.1.1-DistDGL-v0.5
# Project identity and minimum toolchain.
cmake_minimum_required(VERSION 3.15)
project(starrygl VERSION 0.1)
# Build-time feature switches for optional backends / partitioners.
option(WITH_PYTHON "Link to Python when building" ON)
option(WITH_CUDA "Link to CUDA when building" ON)
option(WITH_METIS "Link to METIS when building" ON)
option(WITH_MTMETIS "Link to multi-threaded METIS when building" OFF)
option(WITH_LDG "Link to (multi-threaded optionally) LDG when building" ON)
# Language standards: C++17 for host code, CUDA C++14 for device code.
set(CMAKE_CXX_STANDARD 17)
set(CMAKE_CXX_STANDARD_REQUIRED ON)
# Emit compile_commands.json for clangd / tooling.
set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
set(CMAKE_CUDA_STANDARD 14)
set(CMAKE_CUDA_STANDARD_REQUIRED ON)
# OpenMP is linked into every target defined below (directory-scoped on purpose).
find_package(OpenMP REQUIRED)
link_libraries(OpenMP::OpenMP_CXX)
# LibTorch: include dirs and compile flags applied globally.
find_package(Torch REQUIRED)
include_directories(${TORCH_INCLUDE_DIRS})
add_compile_options(${TORCH_CXX_FLAGS})
if(WITH_PYTHON)
# Expose WITH_PYTHON to the C++ sources and pull in the Python headers.
add_definitions(-DWITH_PYTHON)
find_package(Python3 COMPONENTS Interpreter Development REQUIRED)
include_directories(${Python3_INCLUDE_DIRS})
endif()
if(WITH_CUDA)
# UVM (unified virtual memory) ops are only built with CUDA enabled.
add_definitions(-DWITH_CUDA)
add_definitions(-DWITH_UVM)
# NOTE(review): find_package(CUDA) is deprecated in modern CMake; the
# toolkit path and cudart library are wired manually here.
find_package(CUDA REQUIRED)
include_directories(${CUDA_INCLUDE_DIRS})
set(CUDA_LIBRARIES "${CUDA_TOOLKIT_ROOT_DIR}/lib64/libcudart.so")
file(GLOB_RECURSE UVM_SRCS "csrc/uvm/*.cpp")
add_library(uvm_ops SHARED ${UVM_SRCS})
target_link_libraries(uvm_ops PRIVATE ${TORCH_LIBRARIES})
endif()
if(WITH_METIS)
    # Build METIS (plus its bundled GKlib) directly from the vendored sources
    # in third_party/METIS and fold them into the metis_partition library.
    # (The previous approach of linking prebuilt static libs was left here as
    # a large commented-out block; dead code removed.)
    add_definitions(-DWITH_METIS)
    set(METIS_DIR "${CMAKE_SOURCE_DIR}/third_party/METIS")
    set(METIS_GKLIB_DIR "${METIS_DIR}/GKlib")
    file(GLOB METIS_SRCS "${METIS_DIR}/libmetis/*.c")
    file(GLOB METIS_GKLIB_SRCS "${METIS_GKLIB_DIR}/*.c")
    if (MSVC)
        # GKlib needs extra shims on Windows.
        file(GLOB METIS_GKLIB_WIN32_SRCS "${METIS_GKLIB_DIR}/win32/*.c")
        set(METIS_GKLIB_SRCS ${METIS_GKLIB_SRCS} ${METIS_GKLIB_WIN32_SRCS})
    endif()
    add_library(metis_partition SHARED
        "csrc/partition/metis.cpp"
        ${METIS_SRCS} ${METIS_GKLIB_SRCS}
    )
    target_include_directories(metis_partition PRIVATE "${METIS_DIR}/include")
    target_include_directories(metis_partition PRIVATE "${METIS_GKLIB_DIR}")
    if (MSVC)
        target_include_directories(metis_partition PRIVATE "${METIS_GKLIB_DIR}/win32")
    endif()
    # 64-bit vertex ids, 32-bit edge weights — must match the Python bindings.
    target_compile_definitions(metis_partition PRIVATE -DIDXTYPEWIDTH=64)
    target_compile_definitions(metis_partition PRIVATE -DREALTYPEWIDTH=32)
    target_compile_options(metis_partition PRIVATE -O3)
    target_link_libraries(metis_partition PRIVATE ${TORCH_LIBRARIES})
    if (UNIX)
        # METIS uses libm (pow, log, ...) on POSIX systems.
        target_link_libraries(metis_partition PRIVATE m)
    endif()
endif()
if(WITH_MTMETIS)
# Multi-threaded METIS: links against prebuilt static libs in third_party/mt-metis.
add_definitions(-DWITH_MTMETIS)
set(MTMETIS_DIR "${CMAKE_SOURCE_DIR}/third_party/mt-metis")
set(MTMETIS_INCLUDE_DIRS "${MTMETIS_DIR}/include")
file(GLOB_RECURSE MTMETIS_LIBRARIES "${MTMETIS_DIR}/lib/lib*.a")
include_directories(${MTMETIS_INCLUDE_DIRS})
add_library(mtmetis_partition SHARED "csrc/partition/mtmetis.cpp")
target_link_libraries(mtmetis_partition PRIVATE ${TORCH_LIBRARIES})
target_link_libraries(mtmetis_partition PRIVATE ${MTMETIS_LIBRARIES})
# 64-bit everything; must match how the mt-metis static libs were built.
target_compile_definitions(mtmetis_partition PRIVATE -DMTMETIS_64BIT_VERTICES)
target_compile_definitions(mtmetis_partition PRIVATE -DMTMETIS_64BIT_EDGES)
target_compile_definitions(mtmetis_partition PRIVATE -DMTMETIS_64BIT_WEIGHTS)
target_compile_definitions(mtmetis_partition PRIVATE -DMTMETIS_64BIT_PARTITIONS)
endif()
if (WITH_LDG)
# Imports neighbor-clustering based (e.g. LDG algorithm) graph partitioning implementation
add_definitions(-DWITH_LDG)
set(LDG_DIR "csrc/partition/neighbor_clustering")
add_library(ldg_partition SHARED "csrc/partition/ldg.cpp")
target_link_libraries(ldg_partition PRIVATE ${TORCH_LIBRARIES})
# The LDG implementation lives in its own subdirectory and exports the
# ldg-vertex-partition target consumed below.
add_subdirectory(${LDG_DIR})
target_include_directories(ldg_partition PRIVATE ${LDG_DIR})
target_link_libraries(ldg_partition PRIVATE ldg-vertex-partition)
endif ()
# Main extension module: libstarrygl.so, exporting the pybind11 bindings.
include_directories("csrc/include")
add_library(${PROJECT_NAME} SHARED csrc/export.cpp)
target_link_libraries(${PROJECT_NAME} PRIVATE ${TORCH_LIBRARIES})
# TORCH_EXTENSION_NAME must match the shared-object name for import to work.
target_compile_definitions(${PROJECT_NAME} PRIVATE -DTORCH_EXTENSION_NAME=lib${PROJECT_NAME})
if(WITH_PYTHON)
find_library(TORCH_PYTHON_LIBRARY torch_python PATHS "${TORCH_INSTALL_PREFIX}/lib")
target_link_libraries(${PROJECT_NAME} PRIVATE ${TORCH_PYTHON_LIBRARY})
endif()
if (WITH_CUDA)
target_link_libraries(${PROJECT_NAME} PRIVATE uvm_ops)
endif()
if (WITH_METIS)
message(STATUS "Current project '${PROJECT_NAME}' uses METIS graph partitioning algorithm.")
target_link_libraries(${PROJECT_NAME} PRIVATE metis_partition)
endif()
if (WITH_MTMETIS)
message(STATUS "Current project '${PROJECT_NAME}' uses multi-threaded METIS graph partitioning algorithm.")
target_link_libraries(${PROJECT_NAME} PRIVATE mtmetis_partition)
endif()
if (WITH_LDG)
message(STATUS "Current project '${PROJECT_NAME}' uses LDG graph partitioning algorithm.")
target_link_libraries(${PROJECT_NAME} PRIVATE ldg_partition)
endif()
# add libsampler.so — the parallel neighbor-sampler extension module.
# (Renamed the internal variable SAMLPER_NAME -> SAMPLER_NAME: misspelling;
# the produced library name "${PROJECT_NAME}_sampler" is unchanged.
# Also removed the commented-out boost include lines: dead code.)
set(SAMPLER_NAME "${PROJECT_NAME}_sampler")
file(GLOB_RECURSE SAMPLER_SRCS "csrc/sampler/*.cpp")
add_library(${SAMPLER_NAME} SHARED ${SAMPLER_SRCS})
target_include_directories(${SAMPLER_NAME} PRIVATE "csrc/sampler/include")
target_compile_options(${SAMPLER_NAME} PRIVATE -O3)
target_link_libraries(${SAMPLER_NAME} PRIVATE ${TORCH_LIBRARIES})
# TORCH_EXTENSION_NAME must match the shared-object name for import to work.
target_compile_definitions(${SAMPLER_NAME} PRIVATE -DTORCH_EXTENSION_NAME=lib${SAMPLER_NAME})
if(WITH_PYTHON)
    find_library(TORCH_PYTHON_LIBRARY torch_python PATHS "${TORCH_INSTALL_PREFIX}/lib")
    target_link_libraries(${SAMPLER_NAME} PRIVATE ${TORCH_PYTHON_LIBRARY})
endif()
#include "extension.h"
#include "uvm.h"
#include "partition.h"

// Python bindings for the starrygl native extension.
// Each optional feature is compiled in only when the corresponding
// WITH_* macro is defined by the build system (see CMakeLists.txt).
PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
#ifdef WITH_CUDA
    m.def("uvm_storage_new", &uvm_storage_new, "return storage of unified virtual memory");
    m.def("uvm_storage_to_cuda", &uvm_storage_to_cuda, "share uvm storage with another cuda device");
    m.def("uvm_storage_to_cpu", &uvm_storage_to_cpu, "share uvm storage with cpu");
    m.def("uvm_storage_advise", &uvm_storage_advise, "apply cudaMemAdvise() to uvm storage");
    m.def("uvm_storage_prefetch", &uvm_storage_prefetch, "apply cudaMemPrefetchAsync() to uvm storage");

    // Expose the CUDA memory-advise enum so Python callers can pass hints.
    py::enum_<cudaMemoryAdvise>(m, "cudaMemoryAdvise")
        .value("cudaMemAdviseSetAccessedBy", cudaMemoryAdvise::cudaMemAdviseSetAccessedBy)
        .value("cudaMemAdviseUnsetAccessedBy", cudaMemoryAdvise::cudaMemAdviseUnsetAccessedBy)
        .value("cudaMemAdviseSetPreferredLocation", cudaMemoryAdvise::cudaMemAdviseSetPreferredLocation)
        .value("cudaMemAdviseUnsetPreferredLocation", cudaMemoryAdvise::cudaMemAdviseUnsetPreferredLocation)
        .value("cudaMemAdviseSetReadMostly", cudaMemoryAdvise::cudaMemAdviseSetReadMostly)
        .value("cudaMemAdviseUnsetReadMostly", cudaMemoryAdvise::cudaMemAdviseUnsetReadMostly);
#endif
#ifdef WITH_METIS
    m.def("metis_partition", &metis_partition, "metis graph partition");
    m.def("metis_cache_friendly_reordering", &metis_cache_friendly_reordering, "metis cache-friendly reordering");
#endif
#ifdef WITH_MTMETIS
    m.def("mt_metis_partition", &mt_metis_partition, "multi-threaded metis graph partition");
#endif
// BUG FIX: was `#ifdef WITH_LGD` (typo). The build system defines WITH_LDG
// (see CMakeLists.txt), so the ldg_partition binding was never compiled in.
#ifdef WITH_LDG
    // Note: the switch WITH_MULTITHREADING=ON shall be triggered during compilation
    // to enable multi-threading functionality.
    m.def("ldg_partition", &ldg_partition, "(multi-threaded optionally) LDG graph partition");
#endif
}
Advanced Concepts
=================
.. toctree::
sampling_parallel/index
partition_parallel/index
timeline_parallel/index
Package References
==================
.. toctree::
distributed
neighbor_sampler
memory
data_loader
graph_core
cache
# Sphinx configuration for the StarryGL documentation build.
import os
import sys
# Make the repository root importable so `import starrygl` below succeeds
# when Sphinx runs from docs/<subdir>.
sys.path.insert(0, os.path.abspath("../.."))
import starrygl
# -- Project information ------------------------------------------------------
project = 'StarryGL'
copyright = '2023, StarryGL Team'
author = 'StarryGL Team'
# Version/release are taken straight from the installed package.
version = starrygl.__version__
release = starrygl.__version__
# Sphinx extensions: API docs from docstrings, summaries, build timing,
# and source-code links.
extensions = [
    "sphinx.ext.autodoc",
    "sphinx.ext.autosummary",
    "sphinx.ext.duration",
    "sphinx.ext.viewcode",
]
templates_path = ['_templates']
exclude_patterns = []
# -- Options for HTML output -------------------------------------------------
# https://www.sphinx-doc.org/en/master/usage/configuration.html#options-for-html-output
html_theme = 'sphinx_rtd_theme'
html_static_path = ['_static']
#!/bin/bash
# Configure + build the native extensions, then install the resulting
# lib*.so files into starrygl/lib and patch their rpath so each library
# resolves its siblings relative to its own location at import time.
# NOTE(review): the CMAKE_PREFIX_PATH / Python3_ROOT_DIR / CUDA_TOOLKIT
# paths below are machine-specific; adjust for your environment.
mkdir -p build && cd build
# One chained command: any failing step short-circuits the rest.
cmake .. \
-DCMAKE_EXPORT_COMPILE_COMMANDS=ON \
-DCMAKE_PREFIX_PATH="/home/zlj/.miniconda3/envs/sgl/lib/python3.10/site-packages" \
-DPython3_ROOT_DIR="/home/zlj/.miniconda3/envs/sgl" \
-DCUDA_TOOLKIT_ROOT_DIR="/home/zlj/.local/cuda-11.8" \
&& make -j32 \
&& rm -rf ../starrygl/lib \
&& mkdir ../starrygl/lib \
&& cp lib*.so ../starrygl/lib/ \
&& patchelf --set-rpath '$ORIGIN:$ORIGIN/lib' --force-rpath ../starrygl/lib/*.so
--extra-index-url https://download.pytorch.org/whl/cu118
torch==2.1.1+cu118
torchvision==0.16.1+cu118
torchaudio==2.1.1+cu118
--extra-index-url https://data.pyg.org/whl/torch-2.1.0+cu118.html
torch_geometric==2.4.0
pyg_lib==0.3.1+pt21cu118
torch_scatter==2.1.2+pt21cu118
torch_sparse==0.6.18+pt21cu118
torch_cluster==1.6.3+pt21cu118
torch_spline_conv==1.2.2+pt21cu118
ogb
tqdm
networkx
from typing import List, Tuple
import torch
import torch.distributed as dist
from starrygl.distributed.utils import DistributedTensor
from starrygl.module.memorys import MailBox
from starrygl.sample.cache.fetch_cache import FetchFeatureCache
from starrygl.sample.graph_core import DataSet
from starrygl.sample.graph_core import DistributedGraphStore
from starrygl.sample.sample_core.base import BaseSampler, NegativeSampling
import dgl
from starrygl.sample.stream_manager import PipelineManager, getPipelineManger
"""
Input arguments are unchanged; the outputs become:
sample_from_nodes
    node: list[tensor, tensor, tensor...]
    eid: list[tensor, tensor, tensor...]
    src_index: list[tensor, tensor, tensor...]
sample_from_edges:
    node
    eid: list[tensor, tensor, tensor...]
    src_index: list[tensor, tensor, tensor...]
    delta_ts: list[tensor, tensor, tensor...]
    metadata
"""
def prepare_input(node_feat, edge_feat, mem_embedding, mfgs, dist_nid, dist_eid):
    """Attach fetched features/memory to DGL blocks and globalize their ids.

    Mutates each block in-place:
      - replaces the local 'ID' fields with distributed ids via
        dist_nid / dist_eid lookups,
      - attaches edge features ('f') on every block,
      - attaches node features ('h') and memory-module state only on the
        first (input) block of each layer group.

    Args:
        node_feat: node feature tensor indexed by local src ids, or None.
        edge_feat: edge feature tensor indexed by local edge ids, or None.
        mem_embedding: tuple (node_memory, node_memory_ts, mailbox,
            mailbox_ts) or None.
        mfgs: nested list of DGL blocks (layers x blocks per layer).
        dist_nid: mapping from local node index -> distributed node id.
        dist_eid: mapping from local edge index -> distributed edge id.

    Returns:
        The same (mutated) mfgs list.
    """
    for mfg in mfgs:
        for i, b in enumerate(mfg):
            # Local indices currently stored on the block.
            e_idx = b.edata['ID']
            idx = b.srcdata['ID']
            # Rewrite to distributed ids.
            b.edata['ID'] = dist_eid[e_idx]
            b.srcdata['ID'] = dist_nid[idx]
            if edge_feat is not None:
                b.edata['f'] = edge_feat[e_idx]
            if i == 0:
                # Input layer only: raw features and memory state.
                if node_feat is not None:
                    b.srcdata['h'] = node_feat[idx]
                if mem_embedding is not None:
                    node_memory, node_memory_ts, mailbox, mailbox_ts = mem_embedding
                    b.srcdata['mem'] = node_memory[idx]
                    b.srcdata['mem_ts'] = node_memory_ts[idx]
                    # Mailbox entries are flattened per node.
                    b.srcdata['mem_input'] = mailbox[idx].reshape(b.srcdata['ID'].shape[0], -1)
                    b.srcdata['mail_ts'] = mailbox_ts[idx]
                    #print(idx.shape[0],b.srcdata['mem_ts'].shape)
    return mfgs
def to_block(graph: DistributedGraphStore, data, sample_out, mailbox:MailBox = None, device = torch.device('cuda'), group = None):
    """Convert raw sampler output into DGL message-flow blocks with features.

    Pipeline:
      1. collect sampled edge ids per layer and map them to distributed ids,
      2. determine the root (seed) nodes either from `data` or from the
         sampler's metadata,
      3. fetch node/edge features and (optionally) memory state, either via
         all-to-all exchange, local lookup, or the feature cache,
      4. build one DGL block per sampled layer and attach ids/features.

    Args:
        graph: distributed graph store providing id mappers and features.
        data: the batch (DataSet) being sampled; supplies roots when the
            sampler returned no metadata.
        sample_out: sampler result; either a list of per-layer results or a
            (results, metadata) pair.
        mailbox: optional memory module (APAN mailbox / TGN memory).
        device: device the blocks are built on.
        group: optional process group for the all-to-all exchanges.

    Returns:
        (data, mfgs, metadata) where mfgs is a reversed, per-layer nested
        list of DGL blocks.
    """
    # Sampler may return (per-layer results, metadata) or just the results.
    if len(sample_out) > 1:
        sample_out, metadata = sample_out
    else:
        metadata = None
    eid = [ret.eid() for ret in sample_out]
    eid_len = [e.shape[0] for e in eid]
    eid_mapper: torch.Tensor = graph.eids_mapper
    nid_mapper: torch.Tensor = graph.nids_mapper
    eid_tensor = torch.cat(eid, dim=0).to(eid_mapper.device)
    # Distributed edge ids, deduplicated; eid_inv maps back to positions.
    dist_eid = eid_mapper[eid_tensor].to(device)
    dist_eid, eid_inv = dist_eid.unique(return_inverse=True)
    # NOTE(review): eid_tensor*2 suggests the sampled graph stores each edge
    # twice (both directions) — confirm against the sample_graph layout.
    src_node = graph.sample_graph['edge_index'][0, eid_tensor*2].to(graph.nids_mapper.device)
    src_ts = None
    if metadata is None:
        # Roots come straight from the batch.
        root_node = data.nodes.to(graph.nids_mapper.device)
        # NOTE(review): here root_len is a one-element *list*, while the
        # metadata branch below assigns a plain int; build_block() uses it
        # in torch.arange, which would reject a list — verify this branch.
        root_len = [root_node.shape[0]]
        if hasattr(data, 'ts'):
            src_ts = torch.cat([data.ts,
                                graph.sample_graph['ts'][eid_tensor*2].to(device)])
    elif 'seed' in metadata:
        # Roots come from the sampler's metadata (e.g. link prediction seeds).
        root_node = metadata.pop('seed').to(graph.nids_mapper.device)
        root_len = root_node.shape[0]
        if 'seed_ts' in metadata:
            src_ts = torch.cat([metadata.pop('seed_ts').to(device),
                                graph.sample_graph['ts'][eid_tensor*2].to(device)])
        # Move any remaining metadata tensors onto the target device.
        for k in metadata:
            metadata[k] = metadata[k].to(device)
    nid_tensor = torch.cat([root_node, src_node], dim=0)
    dist_nid = nid_mapper[nid_tensor].to(device)
    dist_nid, nid_inv = dist_nid.unique(return_inverse=True)
    fetchCache = FetchFeatureCache.getFetchCache()
    if fetchCache is None:
        # No cache: fetch features directly (all-to-all when distributed).
        if isinstance(graph.edge_attr, DistributedTensor):
            ind_dict = graph.edge_attr.all_to_all_ind2ptr(dist_eid, group=group)
            edge_feat = graph.edge_attr.all_to_all_get(group=group, **ind_dict)
        else:
            edge_feat = graph._get_edge_attr(dist_eid)
            ind_dict = None
        if isinstance(graph.x, DistributedTensor):
            ind_dict = graph.x.all_to_all_ind2ptr(dist_nid, group=group)
            node_feat = graph.x.all_to_all_get(group=group, **ind_dict)
        else:
            node_feat = graph._get_node_attr(dist_nid)
        if mailbox is not None:
            if torch.distributed.get_world_size() > 1:
                # Reuses ind_dict from the node-feature exchange when
                # available; otherwise builds one for the memory gather.
                if node_feat is None:
                    ind_dict = mailbox.node_memory.all_to_all_ind2ptr(dist_nid, group=group)
                mem = mailbox.gather_memory(**ind_dict)
            else:
                mem = mailbox.get_memory(dist_nid)
        else:
            mem = None
    else:
        # Cache path: reconstruct the raw (pre-unique) id ordering expected
        # by the cache, then fetch everything through it.
        raw_nid = torch.empty_like(dist_nid)
        raw_eid = torch.empty_like(dist_eid)
        nid_tensor = nid_tensor.to(device)
        eid_tensor = eid_tensor.to(device)
        raw_nid[nid_inv] = nid_tensor
        raw_eid[eid_inv] = eid_tensor
        node_feat, edge_feat, mem = fetchCache.fetch_feature(raw_nid,
                                                             dist_nid, raw_eid,
                                                             dist_eid)

    def build_block():
        # Builds one DGL block per sampled layer. `col` holds the previous
        # layer's destination nodes; each layer appends its sampled sources.
        mfgs = list()
        col = torch.arange(0, root_len, device=device)
        col_len = 0
        row_len = root_len
        for r in range(len(eid_len)):
            elen = eid_len[r]
            row = torch.arange(row_len, row_len+elen, device=device)
            b = dgl.create_block((row, col[sample_out[r].src_index().to(device)]),
                                 num_src_nodes=row_len + elen,
                                 num_dst_nodes=row_len,
                                 device=device)
            # Slice the inverse-unique index maps for this layer's span.
            idx = nid_inv[0:row_len + elen]
            e_idx = eid_inv[col_len:col_len+elen]
            b.srcdata['ID'] = idx
            if sample_out[r].delta_ts().shape[0] > 0:
                b.edata['dt'] = sample_out[r].delta_ts().to(device)
            if src_ts is not None:
                b.srcdata['ts'] = src_ts[0:row_len + eid_len[r]]
            b.edata['ID'] = e_idx
            col = row
            col_len += eid_len[r]
            row_len += eid_len[r]
            mfgs.append(b)
        # Group blocks into per-layer lists, outermost layer first.
        mfgs = list(map(list, zip(*[iter(mfgs)])))
        mfgs.reverse()
        return data, mfgs, metadata

    data, mfgs, metadata = build_block()
    mfgs = prepare_input(node_feat, edge_feat, mem, mfgs, dist_nid, dist_eid)
    #return build_block(node_feat,edge_feat,mem)#data,mfgs,metadata
    return (data, mfgs, metadata)
def graph_sample(graph, sampler:BaseSampler,
                 sample_fn, data,
                 neg_sampling = None,
                 mailbox = None,
                 device = torch.device('cuda'),
                 async_op = False):
    """Sample a mini-batch and convert it into DGL blocks with features.

    Args:
        graph: distributed graph store.
        sampler: the neighbor sampler.
        sample_fn: one of the sample_from_* functions in this module.
        data: the DataSet batch to sample for.
        neg_sampling: optional negative sampler forwarded to sample_fn.
        mailbox: optional memory module forwarded to to_block.
        device: device on which blocks are built.
        async_op: when True, submit the to_block conversion to the pipeline
            manager and return a future instead of the finished batch.

    Returns:
        (data, mfgs, metadata) when synchronous, otherwise a future that
        resolves to that tuple.
    """
    out = sample_fn(sampler, data, neg_sampling)
    if not async_op:  # idiomatic: was `async_op == False`
        return to_block(graph, data, out, mailbox, device)
    # Asynchronous path: hand the conversion to the pipeline manager.
    manager = getPipelineManger()  # renamed from misspelled `manger`
    future = manager.submit('lookup', to_block, {'graph': graph, 'data': data,
                                                 'sample_out': out,
                                                 'mailbox': mailbox,
                                                 'device': device})
    return future
def sample_from_nodes(sampler:BaseSampler, data:DataSet, **kwargs):
    """Run static (non-temporal) neighbor sampling for the nodes in `data`."""
    flat_nodes = data.nodes.reshape(-1)
    return sampler.sample_from_nodes(nodes=flat_nodes)
def sample_from_edges(sampler:BaseSampler,
                      data:DataSet,
                      neg_sampling:NegativeSampling = None):
    """Run static (non-temporal) neighbor sampling for the edges in `data`.

    Args:
        sampler: the neighbor sampler.
        data: batch whose `edges` tensor provides the seed edges.
        neg_sampling: optional negative-sampling strategy.
    """
    # NOTE(review): the original assigned `edge_label = data.labels` here and
    # never used it; removed as dead code.
    out = sampler.sample_from_edges(edges=data.edges,
                                    neg_sampling=neg_sampling)
    return out
def sample_from_temporal_nodes(sampler:BaseSampler, data:DataSet,
                               **kwargs):
    """Run temporal neighbor sampling for the nodes in `data` at their timestamps."""
    flat_nodes = data.nodes.reshape(-1)
    flat_ts = data.ts.reshape(-1)
    return sampler.sample_from_nodes(nodes=flat_nodes, ts=flat_ts)
def sample_from_temporal_edges(sampler:BaseSampler, data:DataSet,
                               neg_sampling: NegativeSampling = None):
    """Run temporal neighbor sampling for the edges in `data` at their timestamps.

    Args:
        sampler: the neighbor sampler.
        data: batch providing `edges` and their timestamps `ts`.
        neg_sampling: optional negative-sampling strategy.
    """
    # NOTE(review): the original assigned `edge_label = data.labels` here and
    # never used it; removed as dead code.
    # The sampler expects CPU tensors for edges and timestamps.
    out = sampler.sample_from_edges(edges=data.edges.to('cpu'),
                                    ets=data.ts.to('cpu'),
                                    neg_sampling=neg_sampling
                                    )
    return out
class SAMPLE_TYPE:
    """Enum-like namespace mapping sample-type names to sampling functions.

    BUG FIX: the first three assignments previously ended with a trailing
    comma, turning each attribute into a 1-tuple ``(function,)``; passing
    such an attribute as ``sampler_fn`` made ``sample_fn(...)`` raise
    ``TypeError: 'tuple' object is not callable``. (Only the last entry —
    the one used in the documented examples — lacked the comma.)
    """
    SAMPLE_FROM_NODES = sample_from_nodes
    SAMPLE_FROM_EDGES = sample_from_edges
    SAMPLE_FROM_TEMPORAL_NODES = sample_from_temporal_nodes
    SAMPLE_FROM_TEMPORAL_EDGES = sample_from_temporal_edges
\ No newline at end of file
from collections import deque
from enum import Enum
import queue
import torch
import sys
from os.path import abspath, join, dirname
import numpy as np
from starrygl.sample.batch_data import graph_sample
from starrygl.sample.sample_core.PreNegSampling import PreNegativeSampling
sys.path.insert(0, join(abspath(dirname(__file__))))
from typing import Deque, Optional
import torch.distributed as dist
from torch_geometric.data import Data
import os.path as osp
import math
class DistributedDataLoader:
    '''
    We will perform feature fetch in the data loader.
    You can simply define a data loader for use, while starrygl assists in
    fetching node or edge features:

    Args:
        graph: distributed graph store
        data: the graph data
        sampler: a parallel sampler like `NeighborSampler` above
        sampler_fn: sample type
        neg_sampler: negative sampler
        batch_size: batch size
        mailbox: APAN's mailbox and TGN's memory implemented by starrygl

    Examples:

    .. code-block:: python

        import torch
        from starrygl.sample.data_loader import DistributedDataLoader
        from starrygl.sample.part_utils.partition_tgnn import partition_load
        from starrygl.sample.graph_core import DataSet, DistributedGraphStore, TemporalNeighborSampleGraph
        from starrygl.sample.memory.shared_mailbox import SharedMailBox
        from starrygl.sample.sample_core.neighbor_sampler import NeighborSampler
        from starrygl.sample.sample_core.base import NegativeSampling
        from starrygl.sample.batch_data import SAMPLE_TYPE

        pdata = partition_load("PATH/{}".format(dataname), algo="metis_for_tgnn")
        graph = DistributedGraphStore(pdata = pdata, uvm_edge = False, uvm_node = False)
        sample_graph = TemporalNeighborSampleGraph(sample_graph = pdata.sample_graph, mode = 'full')
        mailbox = SharedMailBox(pdata.ids.shape[0], memory_param, dim_edge_feat=pdata.edge_attr.shape[1] if pdata.edge_attr is not None else 0)
        sampler = NeighborSampler(num_nodes=graph.num_nodes, num_layers=1, fanout=[10], graph_data=sample_graph, workers=15, policy='recent', graph_name="wiki_train")
        neg_sampler = NegativeSampling('triplet')
        train_data = torch.masked_select(graph.edge_index, pdata.train_mask.to(graph.edge_index.device)).reshape(2, -1)
        trainloader = DistributedDataLoader(graph, train_data, sampler=sampler, sampler_fn=SAMPLE_TYPE.SAMPLE_FROM_TEMPORAL_EDGES, neg_sampler=neg_sampler, batch_size=1000, shuffle=False, drop_last=True, chunk_size=None, train=True, mailbox=mailbox)

    In the data loader, we will call the `graph_sample`, sourced from
    `starrygl.sample.batch_data`. And the `to_block` function in the
    `graph_sample` will implement feature fetching. If cache is not used,
    we will directly fetch node or edge features from the graph data,
    otherwise we will call `fetch_data` for feature fetching.
    '''
    def __init__(
            self,
            graph,
            dataset = None,
            sampler = None,
            sampler_fn = None,
            neg_sampler = None,
            batch_size: Optional[int] = None,
            drop_last = False,
            device: torch.device = torch.device('cuda'),
            shuffle: bool = True,
            chunk_size = None,
            train = False,
            queue_size = 10,
            mailbox = None,
            is_pipeline = False,
            **kwargs
    ):
        assert sampler is not None
        self.chunk_size = chunk_size
        self.batch_size = batch_size
        self.queue_size = queue_size
        self.num_pending = 0
        self.current_pos = 0
        self.recv_idxs = 0
        self.drop_last = drop_last
        # Bounded queue of in-flight futures for the pipelined mode.
        self.result_queue = deque(maxlen=self.queue_size)
        self.shuffle = shuffle
        self.is_closed = False
        self.sampler = sampler
        self.sampler_fn = sampler_fn
        self.neg_sampler = neg_sampler
        self.graph = graph
        self.dataset = dataset
        self.mailbox = mailbox
        self.device = device
        self.is_pipeline = is_pipeline
        # Training ranks agree on the MIN number of batches (default op);
        # evaluation uses MAX so no rank stops early.
        if train is True:
            self._get_expected_idx(self.dataset.len)
        else:
            self._get_expected_idx(self.dataset.len, op=dist.ReduceOp.MAX)
        torch.distributed.barrier()

    def __iter__(self):
        '''Reset iteration state; in chunked mode pick and broadcast a random
        starting offset so every rank begins at the same position.'''
        if self.chunk_size is None:
            if self.shuffle:
                self.input_dataset = self.dataset.shuffle()
            else:
                self.input_dataset = self.dataset
            self.recv_idxs = 0
            self.current_pos = 0
            self.num_pending = 0
            self.submitted = 0
        else:
            self.input_dataset = self.dataset
            self.recv_idxs = 0
            self.num_pending = 0
            self.submitted = 0
            # BUG FIX: was `if dist.get_rank == 0:` — comparing the bound
            # function object to 0 is always False, so the random offset was
            # never generated on any rank. Call the function.
            if dist.get_rank() == 0:
                self.current_pos = int(
                    math.floor(
                        np.random.uniform(0, self.batch_size / self.chunk_size)
                    ) * self.chunk_size
                )
            else:
                self.current_pos = 0
            current_pos = torch.tensor([self.current_pos], dtype=torch.long, device=self.device)
            dist.broadcast(current_pos, src=0)
            self.current_pos = int(current_pos.item())
            self._get_expected_idx(self.dataset.len - self.current_pos)
            if self.neg_sampler is not None \
                    and isinstance(self.neg_sampler, PreNegativeSampling):
                self.neg_sampler.set_next_pos(self.current_pos)
        return self

    def _get_expected_idx(self, data_size, op = dist.ReduceOp.MIN):
        '''Compute the number of batches this epoch and reduce it across
        ranks with `op` so every rank iterates the same number of times.'''
        world_size = dist.get_world_size()
        self.expected_idx = data_size // self.batch_size if self.drop_last is True else int(math.ceil(data_size / self.batch_size))
        if world_size > 1:
            num_epochs = torch.tensor([self.expected_idx], dtype=torch.long, device=self.device)
            # (debug print removed)
            dist.all_reduce(num_epochs, op=op)
            self.expected_idx = int(num_epochs.item())

    def _next_data(self):
        '''Slice the next batch out of the (possibly shuffled) dataset.
        Returns an empty batch past the end, None when drop_last trims the
        tail, and wraps current_pos to 0 on a partial final batch.'''
        if self.current_pos >= self.dataset.len:
            return self.input_dataset._get_empty()
        if self.current_pos + self.batch_size > self.input_dataset.len:
            if self.drop_last:
                return None
            else:
                next_data = self.input_dataset.get_next(
                    slice(self.current_pos, None, None)
                )
                self.current_pos = 0
        else:
            next_data = self.input_dataset.get_next(
                slice(self.current_pos, self.current_pos + self.batch_size, None)
            )
            self.current_pos += self.batch_size
        return next_data

    def __next__(self):
        '''Produce the next sampled batch. In pipelined mode, consume the
        oldest in-flight future and immediately prefetch the next batch
        asynchronously.'''
        if self.is_pipeline is False:
            # Synchronous path: sample and convert on the spot.
            if self.recv_idxs < self.expected_idx:
                data = self._next_data()
                batch_data = graph_sample(self.graph,
                                          self.sampler,
                                          self.sampler_fn,
                                          data, self.neg_sampler,
                                          self.mailbox,
                                          self.device)
                self.recv_idxs += 1
                assert batch_data is not None
                torch.cuda.synchronize()
                return batch_data
            else:
                raise StopIteration
        else:
            if self.recv_idxs == 0:
                # First batch of the epoch is produced synchronously.
                data = self._next_data()
                batch_data = graph_sample(self.graph,
                                          self.sampler,
                                          self.sampler_fn,
                                          data, self.neg_sampler,
                                          self.mailbox,
                                          self.device)
                self.recv_idxs += 1
            else:
                if self.recv_idxs < self.expected_idx:
                    assert len(self.result_queue) > 0
                    result = self.result_queue[0]
                    self.result_queue.popleft()
                    batch_data = result.result()
                    self.recv_idxs += 1
                else:
                    raise StopIteration
            # Prefetch the following batch asynchronously, if any remain.
            if self.recv_idxs + 1 <= self.expected_idx:
                data = self._next_data()
                next_batch = graph_sample(self.graph,
                                          self.sampler,
                                          self.sampler_fn,
                                          data, self.neg_sampler,
                                          self.mailbox,
                                          self.device,
                                          async_op=True)
                self.result_queue.append(next_batch)
            return batch_data
import starrygl
from starrygl.distributed.context import DistributedContext
from starrygl.distributed.utils import DistIndex, DistributedTensor
from starrygl.sample.graph_core.utils import build_mapper
import os.path as osp
import torch
import torch.distributed as dist
from torch_geometric.data import Data
class DistributedGraphStore:
    '''
    Distributed storage for graph topology and node/edge features.

    Args:
        pdata: Graph data object containing ids, eids, edge_index, edge_ts,
            sample_graph, x, and edge_attr.
        device: Device to which tensors are moved (default is 'cuda').
        uvm_node: If True, enables Unified Virtual Memory (UVM) for node data.
        uvm_edge: If True, enables Unified Virtual Memory (UVM) for edge data.
    '''
    def __init__(self, pdata, device = torch.device('cuda'),
                 uvm_node = False,
                 uvm_edge = False):
        self.device = device
        self.ids = pdata.ids.to(device)
        self.eids = pdata.eids
        self.edge_index = pdata.edge_index.to(device)
        if hasattr(pdata, 'edge_ts'):
            self.edge_ts = pdata.edge_ts.to(device).to(torch.float)
        else:
            self.edge_ts = None
        self.sample_graph = pdata.sample_graph
        # Global-id -> distributed-index mappers are kept on CPU; lookups
        # move indices across devices as needed.
        self.nids_mapper = build_mapper(nids=pdata.ids.to(device)).dist.to('cpu')
        self.eids_mapper = build_mapper(nids=pdata.eids.to(device)).dist.to('cpu')
        torch.cuda.empty_cache()
        self.num_nodes = self.nids_mapper.data.shape[0]
        self.num_edges = self.eids_mapper.data.shape[0]
        world_size = dist.get_world_size()
        self.uvm_node = uvm_node
        self.uvm_edge = uvm_edge
        if hasattr(pdata, 'x') and pdata.x is not None:
            pdata.x = pdata.x.to(torch.float)
            if uvm_node == False:
                x = pdata.x.to(self.device)
            else:
                if self.device.type == 'cuda':
                    # BUG FIX: `ctx` was previously defined only in the
                    # edge_attr branch below, so this uvm_node path raised
                    # NameError before reaching uvm_empty().
                    ctx = DistributedContext.get_default_context()
                    x = starrygl.utils.uvm.uvm_empty(*pdata.x.size(),
                                                     dtype=pdata.x.dtype,
                                                     device=ctx.device)
                    starrygl.utils.uvm.uvm_share(x, device=ctx.device)
                    starrygl.utils.uvm.uvm_advise(x, starrygl.utils.uvm.cudaMemoryAdvise.cudaMemAdviseSetAccessedBy)
                    starrygl.utils.uvm.uvm_prefetch(x)
                # NOTE(review): with uvm_node=True on a non-CUDA device, `x`
                # stays unbound and the world_size == 1 assignment below
                # raises; also the UVM buffer is allocated but never filled
                # from pdata.x and is ignored when world_size > 1 — confirm
                # the intended UVM semantics upstream.
            if world_size > 1:
                self.x = DistributedTensor(pdata.x.to(self.device).to(torch.float))
            else:
                self.x = x
        else:
            self.x = None
        if hasattr(pdata, 'edge_attr') and pdata.edge_attr is not None:
            ctx = DistributedContext.get_default_context()
            pdata.edge_attr = pdata.edge_attr.to(torch.float)
            if uvm_edge == False:
                edge_attr = pdata.edge_attr.to(self.device)
            else:
                if self.device.type == 'cuda':
                    edge_attr = starrygl.utils.uvm.uvm_empty(*pdata.edge_attr.size(),
                                                             dtype=pdata.edge_attr.dtype,
                                                             device=ctx.device)
                    starrygl.utils.uvm.uvm_share(edge_attr, device=ctx.device)
                    starrygl.utils.uvm.uvm_advise(edge_attr, starrygl.utils.uvm.cudaMemoryAdvise.cudaMemAdviseSetAccessedBy)
                    starrygl.utils.uvm.uvm_prefetch(edge_attr)
            if world_size > 1:
                self.edge_attr = DistributedTensor(edge_attr)
            else:
                self.edge_attr = edge_attr
        else:
            self.edge_attr = None

    def _get_node_attr(self, ids, asyncOp = False):
        '''
        Retrieves node attributes for the specified node IDs.

        Args:
            ids: Node IDs for which to retrieve attributes.
            asyncOp: If True, performs asynchronous operation for distributed data.
        '''
        if self.x is None:
            return None
        elif dist.get_world_size() == 1:
            return self.x[ids]
        else:
            # Synchronous all-to-all exchange unless async RPC refs exist.
            if self.x.rrefs is None or asyncOp is False:
                ids = self.x.all_to_all_ind2ptr(ids)
                return self.x.all_to_all_get(**ids)
            return self.x.index_select(ids)

    def _get_edge_attr(self, ids, asyncOp = False):
        '''
        Retrieves edge attributes for the specified edge IDs.

        Args:
            ids: Edge IDs for which to retrieve attributes.
            asyncOp: If True, performs asynchronous operation for distributed data.
        '''
        if self.edge_attr is None:
            return None
        elif dist.get_world_size() == 1:
            return self.edge_attr[ids]
        else:
            # Synchronous all-to-all exchange unless async RPC refs exist.
            if self.edge_attr.rrefs is None or asyncOp is False:
                ids = self.edge_attr.all_to_all_ind2ptr(ids)
                return self.edge_attr.all_to_all_get(**ids)
            return self.edge_attr.index_select(ids)

    def _get_dist_index(self, ind, mapper):
        '''
        Retrieves the distributed index for the specified local index using
        the provided mapper.

        Args:
            ind: Local index for which to retrieve the distributed index.
            mapper: Mapper providing the distributed index.
        '''
        return mapper[ind.to(mapper.device)]
class DataSet:
    '''
    Container for one partition of training/evaluation samples.

    Args:
        nodes: Tensor representing nodes. If not None, it is moved to the specified device.
        edges: Tensor representing edges (shape (2, E)). If not None, it is moved to the specified device.
        labels: Optional parameter for labels (kept on its original device).
        ts: Tensor representing timestamps. If not None, it is moved to the specified device.
        device: Device to which tensors are moved (default is 'cuda').
        **kwargs: extra per-sample tensors; each must have leading dimension
            equal to the dataset length.
    '''
    def __init__(self, nodes = None,
                 edges = None,
                 labels = None,
                 ts = None,
                 device = torch.device('cuda'), **kwargs):
        if nodes is not None:
            self.nodes = nodes.to(device)
        if edges is not None:
            self.edges = edges.to(device)
        if ts is not None:
            self.ts = ts.to(device)
        if labels is not None:
            self.labels = labels
        # Length is node count for node-based sets, edge count otherwise.
        self.len = self.nodes.shape[0] if nodes is not None else self.edges.shape[1]
        for k, v in kwargs.items():
            assert isinstance(v, torch.Tensor) and v.shape[0] == self.len
            setattr(self, k, v.to(device))

    def _device(self):
        # Internal helper: the device the primary tensor lives on.
        return self.nodes.device if hasattr(self, 'nodes') else self.edges.device

    def _get_empty(self):
        '''
        Creates an empty dataset with the same device and data types as the
        current instance.

        BUG FIXES vs. original:
          - `torch.empty([])` produced a 0-dim tensor whose `.shape[0]`
            raised IndexError inside __init__; now a length-0 tensor.
          - `torch.empty([[],[]], ...)` is not a valid size argument; the
            empty edge tensor is now shape (2, 0).
          - `self.edge.device` was a typo for `self.edges.device`.
          - The derived dataset now stays on this dataset's device instead
            of being force-moved to the default ('cuda').
        '''
        device = self._device()
        nodes = torch.empty([0], dtype=self.nodes.dtype, device=device) if hasattr(self, 'nodes') else None
        edges = torch.empty([2, 0], dtype=self.edges.dtype, device=device) if hasattr(self, 'edges') else None
        d = DataSet(nodes, edges, device=device)
        for k, v in self.__dict__.items():
            if k == 'edges' or k == 'nodes' or k == 'len':
                continue
            else:
                setattr(d, k, torch.empty([0]))
        return d

    def get_next(self, indx):
        '''
        Retrieves the next dataset based on the provided index.

        Args:
            indx: Index (e.g. a slice) specifying the samples to retrieve.
        '''
        device = self._device()
        nodes = self.nodes[indx] if hasattr(self, 'nodes') else None
        edges = self.edges[:, indx] if hasattr(self, 'edges') else None
        d = DataSet(nodes, edges, device=device)
        for k, v in self.__dict__.items():
            if k == 'edges' or k == 'nodes' or k == 'len':
                continue
            else:
                setattr(d, k, v[indx])
        return d

    def shuffle(self):
        '''
        Shuffles the dataset and returns a new dataset with the same attributes.
        '''
        device = self._device()
        indx = torch.randperm(self.len)
        nodes = self.nodes[indx] if hasattr(self, 'nodes') else None
        edges = self.edges[:, indx] if hasattr(self, 'edges') else None
        d = DataSet(nodes, edges, device=device)
        for k, v in self.__dict__.items():
            if k == 'edges' or k == 'nodes' or k == 'len':
                continue
            else:
                setattr(d, k, v[indx])
        return d
class TemporalGraphData(DistributedGraphStore):
    """Temporal extension of DistributedGraphStore (caching hooks unimplemented)."""
    def __init__(self, pdata, device):
        # BUG FIX: the original called
        # `super(DistributedGraphStore, self).__init__(pdata, device)`,
        # which skips DistributedGraphStore in the MRO and resolves to
        # object.__init__ — raising TypeError on the extra arguments and
        # never initializing the store. Start the MRO at this class instead.
        super(TemporalGraphData, self).__init__(pdata, device)

    def _set_temporal_batch_cache(self, size, pin_size):
        # Placeholder: batch-cache configuration not implemented yet.
        pass

    def _load_feature_to_cuda(self, ids):
        # Placeholder: feature upload not implemented yet.
        pass
class TemporalNeighborSampleGraph(DistributedGraphStore):
    '''
    Args:
        sample_graph: A dictionary containing graph structure information, including 'edge_index', 'ts' (edge timestamp), and 'eids' (edge identifiers).
        mode: Specifies the dataset mode ('train', 'val', 'test', or 'full').
        eids_mapper: Optional parameter for edge identifiers mapping.
    '''
    def __init__(self, sample_graph=None, mode='full', eids_mapper=None):
        self.edge_index = sample_graph['edge_index']
        # NOTE: num_edges reflects the full (unmasked) graph — preserved
        # from the original behavior since it is set before masking.
        self.num_edges = self.edge_index.shape[1]
        self.edge_ts = sample_graph['ts'] if 'ts' in sample_graph else None
        self.eid = sample_graph['eids']
        if mode != 'full':
            # BUG FIX: the original if-chain left `mask` undefined for an
            # unknown mode (NameError) and indexed edge_ts even when the
            # graph has no timestamps (TypeError on None).
            if mode == 'train':
                mask = sample_graph['train_mask']
            elif mode == 'val':
                mask = sample_graph['val_mask']
            elif mode == 'test':
                mask = sample_graph['test_mask']
            else:
                raise ValueError(
                    "mode must be one of 'train', 'val', 'test', 'full', got {!r}".format(mode))
            self.edge_index = self.edge_index[:, mask]
            if self.edge_ts is not None:
                self.edge_ts = self.edge_ts[mask]
            self.eid = self.eid[mask]
......@@ -110,6 +110,19 @@ if(WITH_MTMETIS)
target_compile_definitions(mtmetis_partition PRIVATE -DMTMETIS_64BIT_PARTITIONS)
endif()
if (WITH_LDG)
# Imports neighbor-clustering based (e.g. LDG algorithm) graph partitioning implementation
add_definitions(-DWITH_LDG)
set(LDG_DIR "csrc/partition/neighbor_clustering")
add_library(ldg_partition SHARED "csrc/partition/ldg.cpp")
target_link_libraries(ldg_partition PRIVATE ${TORCH_LIBRARIES})
add_subdirectory(${LDG_DIR})
target_include_directories(ldg_partition PRIVATE ${LDG_DIR})
target_link_libraries(ldg_partition PRIVATE ldg-vertex-partition)
endif ()
include_directories("csrc/include")
add_library(${PROJECT_NAME} SHARED csrc/export.cpp)
......
......@@ -5,7 +5,6 @@
PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
#ifdef WITH_CUDA
#ifdef WITH_CUDA
m.def("uvm_storage_new", &uvm_storage_new, "return storage of unified virtual memory");
m.def("uvm_storage_to_cuda", &uvm_storage_to_cuda, "share uvm storage with another cuda device");
m.def("uvm_storage_to_cpu", &uvm_storage_to_cpu, "share uvm storage with cpu");
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment