hpcgroup · bhatele · Nov 14, 2023 · Sep 11, 2022 · Sep 12, 2022 · Sep 12, 2022
diff --git a/pipit/graph.py b/pipit/graph.py
@@ -9,13 +9,17 @@ class Node:
     referenced by any calling_context_id directly under it
     """
 
-    def __init__(self, name_id, name, parent) -> None:
+    def __init__(self, name_id, name, parent, level=None) -> None:
         self.calling_context_ids = []
         self.name_id = name_id
         self.name = name
         self.children = []
         self.parent = parent
-        self.level = self.__calculate_level()
+
+        if level is None:
+            self.level = self.__calculate_level()
+        else:
+            self.level = level
 
     def add_child(self, child_node):
         self.children.append(child_node)

diff --git a/pipit/readers/hpctoolkit_reader.py b/pipit/readers/hpctoolkit_reader.py
@@ -307,4 +307,4 @@ def read(self):
             by="Time", axis=0, ascending=True, inplace=True, ignore_index=True
         )
         self.trace_df = trace_df
-        return pipit.trace.Trace(None, trace_df)
+        return pipit.trace.Trace(None, trace_df, graph)
diff --git a/pipit/readers/otf2_reader.py b/pipit/readers/otf2_reader.py
@@ -3,6 +3,7 @@
 #
 # SPDX-License-Identifier: MIT
 
+
 import math
 import otf2
 import pandas as pd
@@ -375,4 +376,8 @@ def read(self):
             # close the trace and open it later per process
             trace.close()
         self.events = self.read_events()  # events
-        return pipit.trace.Trace(self.definitions, self.events)
+
+        trace = pipit.trace.Trace(self.definitions, self.events, None)
+        trace.create_cct()  # create cct
+
+        return trace
diff --git a/pipit/trace.py b/pipit/trace.py
@@ -3,16 +3,23 @@
 #
 # SPDX-License-Identifier: MIT
 
+import numpy as np
+
+
+from pipit.graph import Graph, Node
+
 
 class Trace:
-    """A trace dataset is read into an object of this type, which includes one
-    or more dataframes.
+    """
+    A trace dataset is read into an object of this type, which
+    includes one or more dataframes and a calling context tree.
     """
 
-    def __init__(self, definitions, events):
+    def __init__(self, definitions, events, cct):
         """Create a new Trace object."""
         self.definitions = definitions
         self.events = events
+        self.cct = cct
 
     @staticmethod
     def from_otf2(dirname):
@@ -29,3 +36,216 @@ def from_hpctoolkit(dirname):
         from .readers.hpctoolkit_reader import HPCToolkitReader
 
         return HPCToolkitReader(dirname).read()
+
+    def create_cct(self):
+        """
+        Generic function to iterate through the trace events and create a CCT.
+        Uses pipit's graph data structure for this. Populates the trace's CCT
+        field and creates a new column in the trace's Events DataFrame that stores
+        a reference to each row's corresponding node in the CCT.
+
+        Thoughts/Concerns:
+        Currently, the DataFrame index of the entry row is being stored
+        in the node's calling context ids. This doesn't really have much of a
+        purpose right now. What should we be storing as calling context ids
+        for OTF2? Perhaps there should also be a way to map entry rows to
+        corresponding exit rows.
+        """
+
+        # only create the cct if it doesn't exist already
+        if self.cct is None:
+            graph = Graph()
+            callpath_to_node = dict()  # used to determine the existence of a node
+            graph_nodes = [
+                None for i in range(len(self.events))
+            ]  # list of nodes in the DataFrame
+            node_id = 0  # each node has a unique id
+
+            """
+            Iterate through each Location ID which is analagous to a thread
+            and iterate over its events using a stack to add to the cct
+            """
+            for location_id in set(self.events["Location ID"]):
+                """
+                Filter the DataFrame by Location ID and
+                events that are only of type Enter/Leave.
+                """
+                location_df = self.events.loc[
+                    (self.events["Name"] != "N/A")
+                    & (self.events["Location ID"] == location_id)
+                ]
+
+                curr_depth = 0
+                callpath = ""
+
+                """
+                Instead of iterating over the DataFrame columns,
+                we save them as lists and iterate over those as
+                that is more efficient.
+                """
+                df_indices = list(location_df.index)
+                function_names = list(location_df["Name"])
+                event_types = list(location_df["Event Type"])
+
+                # stacks used to iterate through the trace and add nodes to the cct
+                functions_stack, nodes_stack = [], []
+
+                # iterating over the events of the current location id's trace
+                for i in range(len(location_df)):
+                    curr_df_index, evt_type, function_name = (
+                        df_indices[i],
+                        event_types[i],
+                        function_names[i],
+                    )
+
+                    # encounter a new function through its entry point.
+                    if evt_type == "Enter":
+                        # add the function to the stack and get the call path
+                        functions_stack.append(function_name)
+                        callpath = "->".join(functions_stack)
+
+                        # get the parent node of the function if it exists
+                        if curr_depth == 0:
+                            parent_node = None
+                        else:
+                            parent_node = nodes_stack[-1]
+
+                        if callpath in callpath_to_node:
+                            """
+                            if a node with the call path
+                            exists, don't create a new one
+                            """
+                            curr_node = callpath_to_node[callpath]
+                        else:
+                            """
+                            create a new node with the call path
+                            if it doesn't exist yet
+                            """
+                            curr_node = Node(
+                                node_id, function_name, parent_node, curr_depth
+                            )
+                            callpath_to_node[callpath] = curr_node
+                            node_id += 1
+
+                            if curr_depth == 0:
+                                """
+                                add the newly created node as a
+                                root to the cct if the depth is 0
+                                """
+                                graph.add_root(curr_node)
+                            else:
+                                """
+                                add the newly created node as a child
+                                of its parent if it is not a root
+                                """
+                                parent_node.add_child(curr_node)
+
+                        """
+                        add the Enter DataFrame index as a calling context id
+                        to the node (multiple function invocations with the
+                        same call path)
+                        """
+                        curr_node.add_calling_context_id(curr_df_index)
+
+                        """
+                        maps the Enter DataFrame index to the node
+
+                        note:
+                        this seems redundant because the node will already
+                        exist in the row's Graph_Node column
+                        """
+                        graph.add_to_map(curr_df_index, curr_node)
+
+                        # Update nodes stack, column, and current depth
+                        nodes_stack.append(curr_node)
+                        graph_nodes[curr_df_index] = curr_node
+                        curr_depth += 1
+                    else:
+                        """
+                        Once you encounter the Leave event for a function,
+                        get the corresponding node from the top of the nodes stack.
+                        """
+                        curr_node = nodes_stack.pop()
+                        graph_nodes[curr_df_index] = curr_node
+
+                        # Update functions stack and current depth
+                        functions_stack.pop()
+                        curr_depth -= 1
+
+            # Update the Trace with the generated cct
+            self.events["Graph_Node"] = graph_nodes
+            self.cct = graph
+
+    def comm_matrix(self, comm_type="bytes"):
+        """
+        Communication Matrix for Peer-to-Peer (P2P) MPI messages
+
+        Arguments:
+
+        1) comm_type -
+        string to choose whether the communication volume should be measured
+        by bytes transferred between two processes or the number of messages
+        sent (two choices - "bytes" or "counts")
+
+        Returns:
+        A 2D Numpy Array that represents the communication matrix for all P2P
+        messages of the given trace
+
+        Note:
+        The first dimension of the returned 2d array
+        is senders and the second dimension is receivers
+        ex) comm_matrix[sender_rank][receiver_rank]
+        """
+
+        # get the list of ranks/process ids
+        # (mpi messages are sent between processes)
+        ranks = set(
+            self.events.loc[self.events["Location Group Type"] == "PROCESS"][
+                "Location Group ID"
+            ]
+        )
+
+        # create a 2d numpy array that will be returned
+        # at the end of the function
+        communication_matrix = np.zeros(shape=(len(ranks), len(ranks)))
+
+        # filter the dataframe by MPI Send and Isend events
+        sender_dataframe = self.events.loc[
+            self.events["Event Type"].isin(["MpiSend", "MpiIsend"]),
+            ["Location Group ID", "Attributes"],
+        ]
+
+        # get the mpi ranks of all the sender processes
+        sender_ranks = sender_dataframe["Location Group ID"].to_list()
+
+        # get the corresponding mpi ranks of the receivers
+        receiver_ranks = (
+            sender_dataframe["Attributes"]
+            .apply(lambda attrDict: attrDict["receiver"])
+            .to_list()
+        )
+
+        # number of bytes communicated
+        if comm_type == "bytes":
+            # (1 communication is a single row in the sender dataframe)
+            message_volumes = (
+                sender_dataframe["Attributes"]
+                .apply(lambda attrDict: attrDict["msg_length"])
+                .to_list()
+            )
+        elif comm_type == "counts":
+            # 1 message between the pairs of processes
+            # for each row in the sender dataframe
+            message_volumes = np.full(len(sender_dataframe), 1)
+
+        for i in range(len(sender_ranks)):
+            """
+            loops through all the communication events and adds the
+            message volumes to the corresponding entry of the 2d array
+            using the sender and receiver ranks
+            """
+            communication_matrix[sender_ranks[i], receiver_ranks[i]] += message_volumes[
+                i
+            ]
+
+        return communication_matrix