Commit e0711e14 by zlj

Add time counters

Replace the ad-hoc time.time() and torch.cuda.Event timing in
GeneralModel.forward with the time_count (tt) GPU-event helpers, and
accumulate per-phase times: memory update and embedding in the model,
sample/mfg build and feature fetch in DistributedDataLoader.

parent ae8b45b0
@@ -114,14 +114,13 @@ class GeneralModel(torch.nn.Module):
     def forward(self, mfgs, metadata = None,neg_samples=1, mode = 'triplet',async_param = None):
-        t0 = time.time()
+        t0 = tt.start_gpu()
         if self.memory_param['type'] == 'node':
             self.memory_updater(mfgs[0],async_param)
+        t_mem = tt.elapsed_event(t0)
+        tt.time_memory_updater += t_mem
         out = list()
-        start = torch.cuda.Event(enable_timing=True)
-        end = torch.cuda.Event(enable_timing=True)
-        start.record()
+        t1 = tt.start_gpu()
         for l in range(self.gnn_param['layer']):
             for h in range(self.sample_param['history']):
                 rst = self.layers['l' + str(l) + 'h' + str(h)](mfgs[l][h])
@@ -145,7 +144,10 @@ class GeneralModel(torch.nn.Module):
         #print('time {}\n'.format(elapsed_time_ms))
         #print('pos src {} \n pos dst {} \n neg dst{} \n'.format(h_pos_src, h_pos_dst,h_neg_dst))
         #print('pre predict {}'.format(mfgs[0][0].srcdata['ID']))
-        return self.edge_predictor(h_pos_src, h_pos_dst, None , h_neg_dst, neg_samples=neg_samples, mode = mode)
+        pred = self.edge_predictor(h_pos_src, h_pos_dst, None , h_neg_dst, neg_samples=neg_samples, mode = mode)
+        t_embedding = tt.elapsed_event(t1)
+        tt.time_embedding+=t_embedding
+        return pred
 class NodeClassificationModel(torch.nn.Module):
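Note: the tt helper itself is not part of this commit. For reference, a minimal sketch of what starrygl.sample.count_static.time_count plausibly looks like, assuming it wraps the torch.cuda.Event pattern that the hunk above deletes; only the method and accumulator names are taken from the diff, the bodies are an assumption.

import torch

class time_count:
    # Per-phase GPU time accumulators referenced in the diff (milliseconds).
    time_memory_updater = 0.0
    time_embedding = 0.0
    time_sample_and_build = 0.0
    time_memory_fetch = 0.0

    @staticmethod
    def start_gpu():
        # Hypothetical: record a start event and hand back a (start, end) pair.
        start = torch.cuda.Event(enable_timing=True)
        end = torch.cuda.Event(enable_timing=True)
        start.record()
        return start, end

    @staticmethod
    def elapsed_event(pair):
        # Hypothetical: record the end event, wait for it, return elapsed ms.
        start, end = pair
        end.record()
        end.synchronize()
        return start.elapsed_time(end)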
@@ -23,7 +23,7 @@ import torch.distributed as dist
 from torch_geometric.data import Data
 import os.path as osp
 import math
+from starrygl.sample.count_static import time_count as tt
 import data_loader as data_loader
 import concurrent.futures
 executor = concurrent.futures.ThreadPoolExecutor(max_workers=1)
@@ -294,6 +294,7 @@ class DistributedDataLoader:
         #with torch.cuda.stream(stream):
         if self.is_pipeline is False:
             if self.recv_idxs < self.expected_idx:
+                t0 = tt.start_gpu()
                 data = self._next_data()
                 batch_data,dist_nid,dist_eid = graph_sample(
                     self.graph,
@@ -305,9 +306,14 @@ class DistributedDataLoader:
                     eid_mapper = self.graph.eids_mapper)
                 root,mfgs,metadata = batch_data
+                t_sample = tt.elapsed_event(t0)
+                tt.time_sample_and_build+=t_sample
+                t1 = tt.start_gpu()
                 edge_feat = get_edge_feature_by_dist(self.graph,dist_eid,is_local,out_device=self.device)
                 node_feat,mem = get_node_feature_by_dist(self.graph,self.mailbox,dist_nid, is_local,out_device=self.device)
                 prepare_input(node_feat,edge_feat,mem,mfgs,dist_nid,dist_eid)
+                t_fetch = tt.elapsed_event(t1)
+                tt.time_memory_fetch += t_fetch
                 #if(self.mailbox is not None and self.mailbox.historical_cache is not None):
                 #    id = batch_data[1][0][0].srcdata['ID']
                 #    mask = DistIndex(id).is_shared
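With all four accumulators populated per batch, the totals could be reported after an epoch along these lines; report_timers is a hypothetical helper, only the tt attribute names come from the diff.

from starrygl.sample.count_static import time_count as tt

def report_timers():
    # Dump the GPU-time accumulators this commit maintains (milliseconds).
    print(f'memory update : {tt.time_memory_updater:10.1f} ms')
    print(f'embedding     : {tt.time_embedding:10.1f} ms')
    print(f'sample+build  : {tt.time_sample_and_build:10.1f} ms')
    print(f'feature fetch : {tt.time_memory_fetch:10.1f} ms')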