diff --git a/src/converter/converter.py b/src/converter/converter.py
index acc85dab..df65dae3 100644
--- a/src/converter/converter.py
+++ b/src/converter/converter.py
@@ -6,8 +6,8 @@
 import traceback
 from logging import FileHandler
 
-from .pytorch2chakra_converter import PyTorch2ChakraConverter
-from .text2chakra_converter import Text2ChakraConverter
+from .pytorch_converter import PyTorchConverter
+from .text_converter import TextConverter
 
 
 def get_logger(log_filename: str) -> logging.Logger:
@@ -52,12 +52,12 @@ def main() -> None:
 
     try:
         if args.input_type == "Text":
-            converter = Text2ChakraConverter(
+            converter = TextConverter(
                 args.input_filename, args.output_filename, args.num_npus, args.num_passes, logger
             )
             converter.convert()
         elif args.input_type == "PyTorch":
-            converter = PyTorch2ChakraConverter(args.input_filename, args.output_filename, logger)
+            converter = PyTorchConverter(args.input_filename, args.output_filename, logger)
             converter.convert()
         else:
             logger.error(f"{args.input_type} unsupported")
diff --git a/src/converter/pytorch2chakra_converter.py b/src/converter/pytorch2chakra_converter.py
index 2c552cff..37224ae6 100644
--- a/src/converter/pytorch2chakra_converter.py
+++ b/src/converter/pytorch2chakra_converter.py
@@ -27,7 +27,7 @@
 from .pytorch_node import PyTorchNode, PyTorchNodeType
 
 
-class PyTorch2ChakraConverter:
+class PyTorchConverter:
     """
     Converter class for transforming PyTorch execution traces into Chakra format.
 
diff --git a/src/converter/pytorch_converter.py b/src/converter/pytorch_converter.py
new file mode 100644
index 00000000..37224ae6
--- /dev/null
+++ b/src/converter/pytorch_converter.py
@@ -0,0 +1,684 @@
+#!/usr/bin/env python3
+
+import json
+import logging
+from typing import Dict, List, Optional, Set, Tuple
+
+from ....schema.protobuf.et_def_pb2 import (
+    ALL_GATHER,
+    ALL_REDUCE,
+    ALL_TO_ALL,
+    BROADCAST,
+    COMM_COLL_NODE,
+    COMP_NODE,
+    REDUCE_SCATTER,
+    GlobalMetadata,
+)
+from ....schema.protobuf.et_def_pb2 import (
+    AttributeProto as ChakraAttr,
+)
+from ....schema.protobuf.et_def_pb2 import (
+    Node as ChakraNode,
+)
+from ....schema.protobuf.et_def_pb2 import (
+    NodeType as ChakraNodeType,
+)
+from ..third_party.protolib import encodeMessage as encode_message
+from .pytorch_node import PyTorchNode, PyTorchNodeType
+
+
+class PyTorchConverter:
+    """
+    Converter class for transforming PyTorch execution traces into Chakra format.
+
+    This class is responsible for converting the execution traces collected
+    from PyTorch into a format that is compatible with Chakra, a performance
+    analysis tool. It handles the intricate mappings and transformations
+    required to accurately represent the execution in a different format.
+
+    Attributes:
+        input_filename (str): Input file name containing PyTorch execution trace.
+        output_filename (str): Output file name for the converted Chakra trace.
+        chakra_et (IO[bytes]): File handle for the Chakra execution trace output file.
+        logger (logging.Logger): Logger for logging information during conversion.
+        pytorch_schema (Optional[str]): Schema info of the PyTorch trace.
+        pytorch_pid (Optional[int]): Process ID associated with the PyTorch trace.
+        pytorch_time (Optional[str]): Time info of the PyTorch trace.
+        pytorch_start_ts (Optional[int]): Start timestamp of the PyTorch trace.
+        pytorch_finish_ts (Optional[int]): Finish timestamp of the PyTorch trace.
+        pytorch_nodes (Dict[int, Any]): Map of PyTorch node IDs to nodes.
+        pytorch_root_nids (List[int]): List of root node IDs in the PyTorch trace.
+        pytorch_cpu_node_id_gpu_node_map (Dict[int, List[int]]): Map of PyTorch
+            CPU node IDs to GPU node IDs.
+        chakra_nodes (Dict[int, Any]): Map of Chakra node IDs to nodes.
+        parent_to_children_map (Dict[int, List[int]]): Map of Chakra parent node
+                                                       IDs to their child node
+                                                       IDs. Used to simulate
+                                                       execution based on data
+                                                       dependencies.
+    """
+
+    def __init__(self, input_filename: str, output_filename: str, logger: logging.Logger) -> None:
+        """
+        Stores the file names and logger, then resets all conversion state.
+
+        No file is opened here; the output handle starts out as None.
+
+        Args:
+            input_filename (str): Path of the PyTorch execution trace to read.
+            output_filename (str): Path of the Chakra execution trace to write.
+            logger (logging.Logger): Logger used for messages during conversion.
+        """
+        self.logger = logger
+        self.chakra_et = None
+        self.input_filename, self.output_filename = input_filename, output_filename
+        self.initialize_attributes()
+
+    def initialize_attributes(self) -> None:
+        """Resets trace metadata, node maps, and dependency maps to empty defaults."""
+        # Node containers start empty; pytorch_nodes stays None until a trace is loaded
+        self.parent_to_children_map = {}
+        self.chakra_nodes = {}
+        self.pytorch_cpu_node_id_gpu_node_map = {}
+        self.pytorch_root_nids = []
+        self.pytorch_nodes = None
+
+        # Trace-level metadata is unknown until the input file has been parsed
+        self.pytorch_schema = None
+        self.pytorch_pid = None
+        self.pytorch_time = None
+        self.pytorch_start_ts = None
+        self.pytorch_finish_ts = None
+
+    def convert(self) -> None:
+        """
+        Converts a PyTorch execution trace into the Chakra format.
+
+        Loads the input trace, opens the output file, converts every CPU/label
+        node together with its GPU children, rewrites control dependencies as
+        data dependencies, prunes dangling nodes, checks for cycles, writes the
+        trace, and finally simulates execution of the converted graph.
+
+        The output file is closed even when a step fails, so an aborted
+        conversion does not leak the open file handle.
+        """
+        self.load_pytorch_execution_traces()
+        self.open_chakra_execution_trace()
+        try:
+            for pytorch_node in self.pytorch_nodes.values():
+                if pytorch_node.get_op_type() not in (PyTorchNodeType.CPU_OP, PyTorchNodeType.LABEL):
+                    continue
+
+                chakra_node = self.convert_to_chakra_node(pytorch_node)
+                self.chakra_nodes[chakra_node.id] = chakra_node
+
+                for pytorch_gpu_node in pytorch_node.gpu_children:
+                    chakra_gpu_node = self.convert_to_chakra_node(pytorch_gpu_node)
+                    # Only GPU children of a collective CPU op get comm attributes
+                    if chakra_node.type == COMM_COLL_NODE:
+                        collective_comm_type = self.get_collective_comm_type(pytorch_gpu_node.name)
+                        chakra_gpu_node.attr.extend(
+                            [
+                                ChakraAttr(name="comm_type", int64_val=collective_comm_type),
+                                ChakraAttr(name="comm_size", int64_val=pytorch_gpu_node.comm_size),
+                            ]
+                        )
+                    self.chakra_nodes[chakra_gpu_node.id] = chakra_gpu_node
+
+            for root_node in [node for node in self.chakra_nodes.values() if self.is_root_node(node)]:
+                self.convert_ctrl_dep_to_data_dep(root_node)
+
+            self.remove_dangling_nodes()
+            self.update_parent_to_children_map()
+            self.identify_cyclic_dependencies()
+            self.write_chakra_et()
+        finally:
+            self.close_chakra_execution_trace()
+
+        self.simulate_execution()
+
+    def load_pytorch_execution_traces(self) -> None:
+        """
+        Reads the PyTorch execution trace JSON and builds the node objects.
+
+        The parsed JSON is handed to _parse_and_instantiate_nodes.
+
+        Raises:
+            Exception: If an IOError occurs while opening or processing the file.
+        """
+        self.logger.info("Loading PyTorch execution traces from file.")
+        trace_path = self.input_filename
+        try:
+            with open(trace_path, "r") as trace_file:
+                trace_data = json.load(trace_file)
+            self._parse_and_instantiate_nodes(trace_data)
+        except IOError as e:
+            self.logger.error(f"Error opening file {trace_path}: {e}")
+            raise Exception(f"Could not open file {trace_path}") from e
+
+    def _parse_and_instantiate_nodes(self, pytorch_et_data: Dict) -> None:
+        """
+        Copies trace metadata from the parsed JSON and instantiates its nodes.
+
+        One PyTorchNode is created per entry of the "nodes" list, keyed by the
+        entry's "id"; the resulting map is then passed on so parent-child
+        relationships can be established.
+
+        Args:
+            pytorch_et_data (Dict): The execution trace data.
+        """
+        self.logger.info("Extracting and processing node data from execution trace.")
+        schema = pytorch_et_data["schema"]
+        self.pytorch_schema = schema
+        self.pytorch_pid = pytorch_et_data["pid"]
+        self.pytorch_time = pytorch_et_data["time"]
+        self.pytorch_start_ts = pytorch_et_data["start_ts"]
+        self.pytorch_finish_ts = pytorch_et_data["finish_ts"]
+
+        # Key each node object by the ID found in its trace entry
+        nodes_by_id = {raw["id"]: PyTorchNode(schema, raw) for raw in pytorch_et_data["nodes"]}
+        self._establish_parent_child_relationships(nodes_by_id)
+
+    def _establish_parent_child_relationships(self, pytorch_node_objects: Dict[int, PyTorchNode]) -> None:  # noqa: C901
+        """
+        Links every PyTorch node to its parent and tallies node categories.
+
+        Nodes whose parent ID is present in the map are registered as a child
+        (and, where applicable, as the GPU child, record_param_comms node, or
+        NCCL node) of that parent. Thread root nodes are collected into
+        pytorch_root_nids, per-category counts are logged, and the map is
+        stored as pytorch_nodes.
+
+        Args:
+            pytorch_node_objects (Dict[int, PyTorchNode]): Dictionary of PyTorch
+            node objects.
+        """
+        root_names = (
+            "[pytorch|profiler|execution_graph|thread]",
+            "[pytorch|profiler|execution_trace|thread]",
+        )
+        # Insertion order here fixes the order in which the counts are logged
+        counts = {
+            "total_op": 0,
+            "cpu_op": 0,
+            "gpu_op": 0,
+            "record_param_comms_op": 0,
+            "nccl_op": 0,
+            "root_op": 0,
+        }
+
+        for node in pytorch_node_objects.values():
+            parent = pytorch_node_objects.get(node.parent)
+            if parent is not None:
+                parent.add_child(node)
+                if node.is_gpu_op():
+                    parent.add_gpu_child(node)
+                if node.is_record_param_comms_op():
+                    parent.record_param_comms_node = node
+                if node.is_nccl_op():
+                    parent.nccl_node = node
+
+            if node.name in root_names:
+                self.pytorch_root_nids.append(node.id)
+                counts["root_op"] += 1
+
+            # Tally the node under every category it belongs to
+            counts["total_op"] += 1
+            if node.is_cpu_op():
+                counts["cpu_op"] += 1
+            if node.is_gpu_op():
+                counts["gpu_op"] += 1
+            if node.is_record_param_comms_op():
+                counts["record_param_comms_op"] += 1
+            if node.is_nccl_op():
+                counts["nccl_op"] += 1
+
+        for label, total in counts.items():
+            self.logger.info(f"{label}: {total}")
+
+        self.pytorch_nodes = pytorch_node_objects
+
+    def open_chakra_execution_trace(self) -> None:
+        """
+        Opens output_filename in binary write mode and keeps the handle in chakra_et.
+
+        Raises:
+            Exception: If an IOError occurs while opening the file.
+        """
+        self.logger.info(f"Opening Chakra execution trace file: {self.output_filename}")
+        try:
+            self.chakra_et = open(self.output_filename, "wb")  # noqa: SIM115
+        except IOError as io_error:
+            message = f"Error opening file {self.output_filename}: {io_error}"
+            self.logger.error(message)
+            raise Exception(message) from io_error
+
+    def convert_to_chakra_node(self, pytorch_node: PyTorchNode) -> ChakraNode:
+        """
+        Builds the ChakraNode counterpart of a PyTorchNode.
+
+        ID, name, type, duration, stringified inputs/outputs, and a fixed set
+        of attributes are copied over. The parent is recorded as a control
+        dependency only if it has already been added to chakra_nodes.
+
+        Args:
+            pytorch_node (PyTorchNode): The PyTorch node to convert.
+
+        Returns:
+            ChakraNode: The converted Chakra node.
+        """
+        self.logger.debug(f"Converting PyTorch node ID {pytorch_node.id} to Chakra node.")
+
+        chakra_node = ChakraNode()
+        chakra_node.id = pytorch_node.id
+        chakra_node.name = pytorch_node.name
+        chakra_node.type = self.get_chakra_node_type_from_pytorch_node(pytorch_node)
+        if pytorch_node.parent in self.chakra_nodes:
+            chakra_node.ctrl_deps.append(pytorch_node.parent)
+        chakra_node.duration_micros = int(pytorch_node.exclusive_dur)
+
+        # Input/output values, shapes, and types are stored as their str() form
+        for io_name in ("inputs", "outputs"):
+            source, target = getattr(pytorch_node, io_name), getattr(chakra_node, io_name)
+            for field in ("values", "shapes", "types"):
+                setattr(target, field, str(source[field]))
+
+        # Integer attributes are copied under their PyTorchNode attribute names
+        int64_attrs = ("rf_id", "fw_parent", "seq_id", "scope", "tid", "fw_tid")
+        attrs = [ChakraAttr(name=key, int64_val=getattr(pytorch_node, key)) for key in int64_attrs]
+        attrs.append(ChakraAttr(name="op_schema", string_val=pytorch_node.op_schema))
+        attrs.append(ChakraAttr(name="is_cpu_op", int32_val=not pytorch_node.is_gpu_op()))
+        chakra_node.attr.extend(attrs)
+
+        return chakra_node
+
+    def get_chakra_node_type_from_pytorch_node(self, pytorch_node: PyTorchNode) -> ChakraNodeType:
+        """
+        Classifies a PyTorch node as a collective-communication or compute node.
+
+        Args:
+            pytorch_node (PyTorchNode): The PyTorch node to determine the type of.
+
+        Returns:
+            int: COMM_COLL_NODE for a GPU op named after an NCCL kernel, or for any
+            node whose name contains "c10d::" or "nccl:"; COMP_NODE otherwise.
+        """
+        name = pytorch_node.name
+        if pytorch_node.is_gpu_op() and ("ncclKernel" in name or "ncclDevKernel" in name):
+            return COMM_COLL_NODE
+        if "c10d::" in name or "nccl:" in name:
+            return COMM_COLL_NODE
+        return COMP_NODE
+
+    def get_collective_comm_type(self, name: str) -> int:
+        """
+        Maps a node name onto its collective communication type.
+
+        Matching ignores case, "_" and "-"; the first keyword found below wins.
+
+        Args:
+            name (str): The name of the node.
+
+        Raises:
+            ValueError: If the communication type is not found in the mapping.
+
+        Returns:
+            int: The collective communication type of the node.
+        """
+        keyword_to_comm_type = (
+            ("allreduce", ALL_REDUCE),
+            ("alltoall", ALL_TO_ALL),
+            ("allgather", ALL_GATHER),
+            ("reducescatter", REDUCE_SCATTER),
+            ("broadcast", BROADCAST),
+            # Additional cases can be added here
+        )
+        squashed = name.lower().replace("_", "").replace("-", "")
+        for keyword, comm_type in keyword_to_comm_type:
+            if keyword in squashed:
+                return comm_type
+        raise ValueError(
+            f"'{name}' not found in collective communication mapping. "
+            "Please add this collective communication name to the mapping."
+        )
+
+    def is_root_node(self, node) -> bool:
+        """
+        Determines whether a given node is a root node in the execution trace.
+
+        Root nodes are identified purely by name: a node is a root when its name
+        equals one of the two thread-level marker names listed below (execution
+        graph thread or execution trace thread).
+
+        Args:
+            node (ChakraNode): The node to be evaluated.
+
+        Returns:
+            bool: True if the node is a root node, False otherwise. A real
+            False (never None) is returned for non-root nodes.
+        """
+        return node.name in (
+            "[pytorch|profiler|execution_graph|thread]",
+            "[pytorch|profiler|execution_trace|thread]",
+        )
+
+    def convert_ctrl_dep_to_data_dep(self, chakra_node: ChakraNode) -> None:  # noqa: C901
+        """
+        Traverses nodes based on control dependencies (parent nodes) and encodes
+        data dependencies appropriately. This method is crucial for converting the
+        dependency structure from PyTorch execution traces to Chakra execution
+        traces. In PyTorch traces, control dependencies are represented by a
+        parent field in each node, denoting the parent node ID. This structure
+        indicates which functions (operators) are called by a particular operator.
+
+        In contrast, Chakra execution traces, while retaining control dependencies
+        for compatibility, primarily rely on data dependencies to represent
+        relationships between nodes. Data dependencies in Chakra are more broadly
+        defined compared to those in PyTorch, where they are implicitly encoded in
+        tensor input-output relationships. In Chakra, data dependencies are explicit
+        and represent a general dependency between nodes.
+
+        To convert PyTorch's control dependencies to Chakra's data dependencies, an
+        iterative Depth-First Search (DFS) with an explicit stack is performed. The
+        traversal starts from the given Chakra node and descends through the
+        children of the matching PyTorch node, visiting siblings in ascending ID
+        order. During traversal, data dependencies are encoded by linking nodes
+        that have been visited in sequence. These dependencies form a chain,
+        mirroring the function call order from the PyTorch trace.
+
+        Special attention is given to the types of nodes involved. CPU and label
+        nodes (non-GPU) in PyTorch can only depend on other CPU or label nodes.
+        However, GPU nodes can depend on any type of node. For CPU and label nodes,
+        the dependency is therefore only established with the last visited non-GPU
+        node, while a GPU node establishes a data dependency with the node recorded
+        in last_visited_any.
+
+        After a GPU node has been processed, last_visited_any is reset to the last
+        visited non-GPU node. As a result, consecutive GPU nodes are each linked to
+        the preceding non-GPU node and not to one another; this method does not add
+        any per-stream ordering between GPU operators.
+
+        Furthermore, inter-thread dependencies are explicitly encoded in the Chakra
+        execution traces: when the PyTorch counterpart of a non-GPU node has a
+        truthy inter_thread_dep, that node ID is appended to the node's data
+        dependencies (unless it is already present).
+
+        Chakra nodes that have no entry in pytorch_nodes are marked as visited
+        but otherwise skipped, and children without a Chakra node are ignored.
+
+        Args:
+            chakra_node (ChakraNode): The starting node for the traversal and
+            dependency processing.
+        """
+        visited: Set[int] = set()
+        stack: List[ChakraNode] = [chakra_node]
+        last_visited_non_gpu: Optional[ChakraNode] = None
+        last_visited_any: Optional[ChakraNode] = None
+
+        while stack:
+            current_node = stack.pop()
+            if current_node.id in visited:
+                continue
+
+            visited.add(current_node.id)
+
+            # Look up the PyTorch counterpart; nodes without one are skipped
+            pytorch_node = self.pytorch_nodes.get(current_node.id)
+            if not pytorch_node:
+                continue
+
+            node_op_type = pytorch_node.get_op_type()
+
+            if node_op_type == PyTorchNodeType.GPU_OP:
+                if (last_visited_any) and (last_visited_any.id not in current_node.data_deps):
+                    current_node.data_deps.append(last_visited_any.id)
+                    self.logger.debug(
+                        f"GPU Node ID {current_node.id} now has a data " f"dependency on Node ID {last_visited_any.id}"
+                    )
+                # The next node is chained to the last non-GPU node, not to this GPU node
+                last_visited_any = last_visited_non_gpu
+            else:
+                if pytorch_node.inter_thread_dep:
+                    id = pytorch_node.inter_thread_dep
+                    if id not in current_node.data_deps:
+                        current_node.data_deps.append(id)
+                        self.logger.debug(
+                            f"CPU Node ID {current_node.id} now has an inter-thread data dependency on Node ID {id}"
+                        )
+
+                if (last_visited_non_gpu) and (last_visited_non_gpu.id not in current_node.data_deps):
+                    current_node.data_deps.append(last_visited_non_gpu.id)
+                    self.logger.debug(
+                        f"CPU Node ID {current_node.id} now has a data "
+                        f"dependency on non-GPU Node ID {last_visited_non_gpu.id}"
+                    )
+                last_visited_non_gpu = current_node
+                last_visited_any = current_node
+
+            # Push children in descending ID order so they are popped in ascending order
+            children_chakra_ids = [child.id for child in pytorch_node.children]
+            for child_chakra_id in sorted(children_chakra_ids, reverse=True):
+                child_chakra_node = self.chakra_nodes.get(child_chakra_id)
+                if child_chakra_node and child_chakra_node.id not in visited:
+                    stack.append(child_chakra_node)
+
+    def remove_dangling_nodes(self) -> None:
+        """
+        Drops Chakra nodes that take no part in any data dependency.
+
+        A node is dangling when it has no data dependencies and no other node
+        depends on it; it is removed from chakra_nodes and pytorch_nodes and logged.
+        """
+        referenced_ids = {dep_id for node in self.chakra_nodes.values() for dep_id in node.data_deps}
+        dangling = [
+            (node_id, node)
+            for node_id, node in self.chakra_nodes.items()
+            if node_id not in referenced_ids and not node.data_deps
+        ]
+        for node_id, _ in dangling:
+            del self.chakra_nodes[node_id]
+            self.pytorch_nodes.pop(node_id, None)
+
+        if dangling:
+            self.logger.info(f"Identified and removed {len(dangling)} dangling nodes:")
+            for _, node in dangling:
+                self.logger.info(f" - Node ID {node.id}: {node.name}")
+
+    def update_parent_to_children_map(self) -> None:
+        """
+        Records, for every data dependency, the dependent node under its parent.
+
+        Each ID found in a node's data_deps becomes a key of
+        parent_to_children_map whose list gains that node's ID.
+        """
+        children_of = self.parent_to_children_map
+        for child_id, child in self.chakra_nodes.items():
+            for parent_id in child.data_deps:
+                children_of.setdefault(parent_id, []).append(child_id)
+
+    def identify_cyclic_dependencies(self) -> None:
+        """
+        Identifies if there are any cyclic dependencies among Chakra nodes.
+
+        The data-dependency graph is walked with a depth-first search (DFS). The
+        search keeps its own explicit stack instead of recursing, so a long chain
+        of dependencies cannot exceed Python's recursion limit. When a node is
+        reached again while it is still on the current DFS path, the cycle is
+        logged as an error and an exception is raised, ensuring the graph is a
+        Directed Acyclic Graph (DAG).
+
+        Raises:
+            Exception: If a cyclic dependency is detected among the Chakra nodes.
+            KeyError: If a data dependency refers to an ID missing from chakra_nodes.
+        """
+        visited: Set[int] = set()
+
+        for start_id in self.chakra_nodes:
+            if start_id in visited:
+                continue
+            visited.add(start_id)
+            path: List[int] = [start_id]  # node IDs on the current DFS path, in order
+            on_path: Set[int] = {start_id}  # same IDs as a set for O(1) membership tests
+            # One iterator per path entry, yielding that node's unexplored dependencies
+            pending = [iter(self.chakra_nodes[start_id].data_deps)]
+
+            while pending:
+                dep_id = next(pending[-1], None)
+                if dep_id is None:
+                    # Every dependency of the deepest node is explored: backtrack
+                    pending.pop()
+                    on_path.remove(path.pop())
+                    continue
+
+                if dep_id in on_path:
+                    cycle_nodes = " -> ".join(self.chakra_nodes[n].name for n in path + [dep_id])
+                    self.logger.error(f"Cyclic dependency detected: {cycle_nodes}")
+                    start_name = self.chakra_nodes[start_id].name
+                    raise Exception(f"Cyclic dependency detected starting from node {start_name}")
+                if dep_id in visited:
+                    continue
+
+                visited.add(dep_id)
+                path.append(dep_id)
+                on_path.add(dep_id)
+                pending.append(iter(self.chakra_nodes[dep_id].data_deps))
+
+    def write_chakra_et(self) -> None:
+        """
+        Writes the complete Chakra execution trace to the open output file.
+
+        The global metadata is written first, followed by the Chakra nodes;
+        a log message marks the start and the end of the write.
+        """
+        self.logger.info("Writing Chakra execution trace.")
+        for write_section in (self._write_global_metadata, self._encode_and_write_nodes):
+            write_section()
+        self.logger.info("Chakra execution trace writing completed.")
+
+    def _write_global_metadata(self) -> None:
+        """
+        Encodes the trace-level metadata and writes it to the Chakra trace file.
+
+        The schema and time are stored as string attributes; the process ID and
+        the start/finish timestamps are stored as unsigned 64-bit attributes.
+        """
+        self.logger.info("Encoding global metadata for Chakra execution trace.")
+
+        metadata_attrs = [
+            ChakraAttr(name="schema", string_val=self.pytorch_schema),
+            ChakraAttr(name="pid", uint64_val=self.pytorch_pid),
+            ChakraAttr(name="time", string_val=self.pytorch_time),
+            ChakraAttr(name="start_ts", uint64_val=self.pytorch_start_ts),
+            ChakraAttr(name="finish_ts", uint64_val=self.pytorch_finish_ts),
+        ]
+        global_metadata = GlobalMetadata(attr=metadata_attrs)
+        encode_message(self.chakra_et, global_metadata)
+
+    def _encode_and_write_nodes(self) -> None:
+        """
+        Encodes and writes nodes for the Chakra execution trace.
+
+        Every node stored in chakra_nodes is encoded and written to the
+        open output file, one message per node, in ascending order of
+        node ID.
+
+        Node IDs are the keys of the chakra_nodes dict and are therefore
+        unique, so no duplicate-ID check is needed while writing.
+        """
+        self.logger.info("Encoding and writing nodes for Chakra execution trace.")
+
+        # Iterating the sorted dict keys keeps the written node order deterministic
+        for nid in sorted(self.chakra_nodes):
+            chakra_node = self.chakra_nodes[nid]
+            encode_message(self.chakra_et, chakra_node)
+
+    def close_chakra_execution_trace(self) -> None:
+        """
+        Closes the Chakra trace file handle; does nothing beyond logging when
+        the handle is unset or already closed.
+        """
+        self.logger.info("Closing Chakra execution trace file.")
+        if not self.chakra_et or self.chakra_et.closed:
+            return
+        self.chakra_et.close()
+
+    def simulate_execution(self) -> None:
+        """
+        Simulates the execution of Chakra nodes based on data dependencies.
+
+        At most one CPU node and one GPU node are in flight at a time. The clock
+        advances by 1us per loop iteration, and a node's children have their
+        dependency on it removed in the iteration in which the node is issued.
+        """
+        self.logger.info("Simulating execution of Chakra nodes based on data " "dependencies.")
+
+        # Nodes without data dependencies are ready immediately, split by CPU/GPU
+        ready_cpu_nodes = [
+            (node_id, self.chakra_nodes[node_id])
+            for node_id in self.chakra_nodes
+            if not self.chakra_nodes[node_id].data_deps and not self.pytorch_nodes[node_id].is_gpu_op()
+        ]
+        ready_gpu_nodes = [
+            (node_id, self.chakra_nodes[node_id])
+            for node_id in self.chakra_nodes
+            if not self.chakra_nodes[node_id].data_deps and self.pytorch_nodes[node_id].is_gpu_op()
+        ]
+        ready_cpu_nodes.sort(key=lambda x: x[1].id)
+        ready_gpu_nodes.sort(key=lambda x: x[1].id)
+
+        issued_nodes: Set[int] = set()
+        current_cpu_node: Optional[Tuple[int, int]] = None  # (node ID, issue time)
+        current_gpu_node: Optional[Tuple[int, int]] = None  # (node ID, issue time)
+
+        current_time: int = 0  # Simulated global clock in microseconds
+
+        while any([ready_cpu_nodes, ready_gpu_nodes, current_cpu_node, current_gpu_node]):
+            if ready_cpu_nodes and not current_cpu_node:
+                cpu_node_id, cpu_node = ready_cpu_nodes.pop(0)
+                current_cpu_node = (cpu_node_id, current_time)
+                issued_nodes.add(cpu_node_id)
+                self.logger.info(
+                    f"Issuing CPU Node ID {cpu_node_id} ({cpu_node.name}) at "
+                    f"{current_time}us with duration {cpu_node.duration_micros}us"
+                )
+
+            if ready_gpu_nodes and not current_gpu_node:
+                gpu_node_id, gpu_node = ready_gpu_nodes.pop(0)
+                current_gpu_node = (gpu_node_id, current_time)
+                issued_nodes.add(gpu_node_id)
+                self.logger.info(
+                    f"Issuing GPU Node ID {gpu_node_id} ({gpu_node.name}) at "
+                    f"{current_time}us with duration {gpu_node.duration_micros}us"
+                )
+            # Advance the simulated clock by one microsecond per iteration
+            current_time += 1
+
+            if (
+                current_cpu_node
+                and current_time - current_cpu_node[1] >= self.chakra_nodes[current_cpu_node[0]].duration_micros
+            ):
+                self.logger.info(f"CPU Node ID {current_cpu_node[0]} completed at {current_time}us")
+                current_cpu_node = None
+
+            if (
+                current_gpu_node
+                and current_time - current_gpu_node[1] >= self.chakra_nodes[current_gpu_node[0]].duration_micros
+            ):
+                self.logger.info(f"GPU Node ID {current_gpu_node[0]} completed at {current_time}us")
+                current_gpu_node = None
+            # Release children of the nodes issued in this iteration (mutates their data_deps)
+            for node_id in list(issued_nodes):
+                children_ids = self.parent_to_children_map.get(node_id, [])
+                for child_id in children_ids:
+                    child_node = self.chakra_nodes[child_id]
+                    child_node.data_deps.remove(node_id)
+                    if not child_node.data_deps:
+                        if not self.pytorch_nodes[child_id].is_gpu_op():
+                            ready_cpu_nodes.append((child_id, child_node))
+                        else:
+                            ready_gpu_nodes.append((child_id, child_node))
+
+            issued_nodes.clear()
+
+        self.logger.info("Simulation of Chakra node execution completed.")
diff --git a/src/converter/text2chakra_converter.py b/src/converter/text2chakra_converter.py
index 3c15c35b..1c229a02 100644
--- a/src/converter/text2chakra_converter.py
+++ b/src/converter/text2chakra_converter.py
@@ -50,7 +50,7 @@ def __init__(self, line: str) -> None:
             raise ValueError(f'Cannot parse the following layer -- "{line}"')
 
 
-class Text2ChakraConverter:
+class TextConverter:
     def __init__(
         self, input_filename: str, output_filename: str, num_npus: int, num_passes: int, logger: logging.Logger
     ) -> None:
diff --git a/src/converter/text_converter.py b/src/converter/text_converter.py
new file mode 100644
index 00000000..1c229a02
--- /dev/null
+++ b/src/converter/text_converter.py
@@ -0,0 +1,445 @@
+#!/usr/bin/env python3
+
+import logging
+from io import TextIOWrapper
+from typing import Any, List
+
+from ....schema.protobuf.et_def_pb2 import (
+    ALL_GATHER,
+    ALL_REDUCE,
+    ALL_TO_ALL,
+    COMM_COLL_NODE,
+    COMP_NODE,
+    REDUCE_SCATTER,
+    GlobalMetadata,
+    Node,
+    NodeType,
+    AttributeProto as ChakraAttr,
+)
+from ..third_party.protolib import encodeMessage as encode_message
+
+
+class Layer:
+    """One row of the text workload: per-phase compute times, collective types and sizes."""
+
+    def __init__(self, line: str) -> None:
+        """Parse the whitespace-separated columns of `line`; raise ValueError if that fails."""
+        try:
+            col = line.strip().split()
+            self.name = col[0]  # col[1] is never read
+            # forward (the *_node slots are filled in later by TextConverter)
+            self.fwd_comp_time = int(col[2])
+            self.fwd_comm_type = str(col[3])
+            self.fwd_comm_size = int(col[4])
+            self.fwd_comp_node = None
+            self.fwd_comm_node = None
+            # backward input gradient
+            self.bwd_ig_comp_time = int(col[5])
+            self.bwd_ig_comm_type = str(col[6])
+            self.bwd_ig_comm_size = int(col[7])
+            self.bwd_ig_comp_node = None
+            self.bwd_ig_comm_node = None
+            # backward weight gradient
+            self.bwd_wg_comp_time = int(col[8])
+            self.bwd_wg_comm_type = str(col[9])
+            self.bwd_wg_comm_size = int(col[10])
+            self.bwd_wg_update_time = str(col[11])
+            self.bwd_wg_comp_node = None
+            self.bwd_wg_comm_node = None
+        except Exception as err:
+            raise ValueError(f'Cannot parse the following layer -- "{line}"') from err
+
+
+class TextConverter:
+    def __init__(
+        self, input_filename: str, output_filename: str, num_npus: int, num_passes: int, logger: logging.Logger
+    ) -> None:
+        """Store the conversion settings and start node-ID numbering at zero."""
+        self.input_filename, self.output_filename = input_filename, output_filename
+        self.num_npus, self.num_passes = num_npus, num_passes
+        self.logger = logger
+        # get_node() hands out IDs sequentially from this counter.
+        self.next_node_id = 0
+
+    def get_global_metadata(self):
+        """Build the GlobalMetadata message holding the schema string and the full input text."""
+        with open(self.input_filename, "r") as src:
+            contents = src.read()
+        return GlobalMetadata(
+            attr=[
+                ChakraAttr(name="schema", string_val="1.0.2-chakra.0.0.4"),
+                ChakraAttr(name="input_file", string_val=contents),
+            ]
+        )
+
+    def get_layers(self, f: TextIOWrapper, num_layers: int) -> List[Layer]:
+        """Parse each remaining non-blank line of `f` into a Layer; `num_layers` is not consulted."""
+        # Whitespace-only lines (e.g. a trailing newline at EOF) are skipped instead of
+        # being handed to Layer(), which would reject them with ValueError.
+        return [Layer(line) for line in f if line.strip()]
+
+    def get_node(self, name: str, node_type: NodeType) -> Any:
+        """Return a new Node with the next sequential ID and the given name and type."""
+        fresh = Node()
+        fresh.id = self.next_node_id
+        self.next_node_id += 1
+        fresh.name, fresh.type = name, node_type
+        return fresh
+
+    def get_comp_node(self, layer_name: str, phase: str, comp_time: int) -> Any:
+        comp = self.get_node(f"COMP_NODE_{layer_name}_{phase}", COMP_NODE)  # name encodes layer and phase
+        comp.duration_micros = comp_time  # stored unchanged as the node duration
+        return comp
+
+    def get_comm_type(self, comm_type: str) -> int:
+        """Map a collective name from the text format to its et_def_pb2 constant."""
+        known = {
+            "ALLREDUCE": ALL_REDUCE,
+            "ALLTOALL": ALL_TO_ALL,
+            "ALLGATHER": ALL_GATHER,
+            "REDUCESCATTER": REDUCE_SCATTER,
+        }
+        # Any other name maps to 0.
+        return known.get(comm_type, 0)
+
+    def get_comm_coll_node(self, layer_name: str, comm_type: str, comm_size: int) -> Any:
+        coll = self.get_node(f"COMM_COLL_NODE_{layer_name}_{comm_type}", COMM_COLL_NODE)  # collective node
+        type_attr = ChakraAttr(name="comm_type", int64_val=self.get_comm_type(comm_type))  # 0 if unrecognised
+        coll.attr.extend([type_attr, ChakraAttr(name="comm_size", uint64_val=comm_size)])
+        return coll
+
+    def add_parent(self, child_node: Any, parent_node: Any) -> None:
+        child_node.data_deps.append(parent_node.id)  # the child now lists the parent's ID as a data dependency
+
+    def convert(self) -> None:
+        """Read the two header lines of the input file and run the matching converter."""
+        simple_handlers = {
+            "MICRO": self.convert_microbenchmark,
+            "DATA": self.convert_data_parallel,
+            "MODEL": self.convert_model_parallel,
+            "HYBRID_DATA_MODEL": self.convert_hybrid_data_model,
+            "HYBRID_MODEL_DATA": self.convert_hybrid_model_data,
+        }
+        with open(self.input_filename, "r") as f:
+            # Line 1: parallelism type (plus one extra field for the DLRM types); line 2: layer count.
+            header = f.readline().strip().split()
+            kind = header[0]
+            layer_count = int(f.readline().strip())
+
+            if kind in simple_handlers:
+                simple_handlers[kind](f, layer_count)
+            elif kind in ("HYBRID_DLRM", "HYBRID_DLRM_ENHANCED"):
+                self.convert_hybrid_dlrm(f, layer_count, int(header[1]))
+            else:
+                raise ValueError(f"Unsupported parallelism type, {kind}")
+
+    def convert_microbenchmark(self, f: TextIOWrapper, num_layers: int) -> None:
+        """Write one "{output_filename}.{npu_id}.et" file per NPU with only weight-gradient collectives."""
+        layers = self.get_layers(f, num_layers)
+        for npu_id in range(self.num_npus):
+            trace_path = "%s.%d.et" % (self.output_filename, npu_id)
+            with open(trace_path, "wb") as out:
+                # Every file begins with the global metadata record.
+                encode_message(out, self.get_global_metadata())
+                for _ in range(self.num_passes):
+                    # One collective per layer per pass, in input order.
+                    for layer in layers:
+                        coll = self.get_comm_coll_node(layer.name, layer.bwd_wg_comm_type, layer.bwd_wg_comm_size)
+                        encode_message(out, coll)
+
+    def convert_data_parallel(self, f: TextIOWrapper, num_layers: int) -> None:
+        """Emit per-NPU traces for the DATA type: only weight-gradient collectives are generated."""
+        layers = self.get_layers(f, num_layers)
+        for npu_id in range(self.num_npus):
+            trace_path = "%s.%d.et" % (self.output_filename, npu_id)
+            with open(trace_path, "wb") as out:
+                encode_message(out, self.get_global_metadata())
+                for _ in range(self.num_passes):
+                    fwd = None
+
+                    # Forward: each layer follows the previous layer's forward compute and,
+                    # from the second pass on, its own weight-gradient collective.
+                    for pos, layer in enumerate(layers):
+                        fwd = self.get_comp_node(layer.name, "FWD", layer.fwd_comp_time)
+                        if pos > 0:
+                            self.add_parent(fwd, layers[pos - 1].fwd_comp_node)
+                        if layer.bwd_wg_comm_node is not None:
+                            self.add_parent(fwd, layer.bwd_wg_comm_node)
+                        layer.fwd_comp_node = fwd
+                        encode_message(out, fwd)
+
+                    # Backward: walk the layers last to first.
+                    for step, layer in enumerate(reversed(layers)):
+                        wg_comp = self.get_comp_node(layer.name, "BWD_WG", layer.bwd_wg_comp_time)
+                        if step > 0:
+                            # layers[-step] is the layer handled in the previous iteration.
+                            self.add_parent(wg_comp, layers[-step].bwd_ig_comp_node)
+                        elif fwd is None:
+                            raise ValueError("fwd_comp_node is None")
+                        else:
+                            self.add_parent(wg_comp, fwd)
+                        encode_message(out, wg_comp)
+
+                        wg_comm = self.get_comm_coll_node(layer.name, layer.bwd_wg_comm_type, layer.bwd_wg_comm_size)
+                        self.add_parent(wg_comm, wg_comp)
+                        layer.bwd_wg_comm_node = wg_comm
+                        encode_message(out, wg_comm)
+
+                        if step != len(layers) - 1:
+                            ig_comp = self.get_comp_node(layer.name, "BWD_IG", layer.bwd_ig_comp_time)
+                            self.add_parent(ig_comp, wg_comp)
+                            layer.bwd_ig_comp_node = ig_comp
+                            encode_message(out, ig_comp)
+
+                # Clear the cross-pass links so the next NPU's first pass starts without them.
+                for layer in layers:
+                    layer.bwd_wg_comm_node = None
+
+    def convert_model_parallel(self, f: TextIOWrapper, num_layers: int) -> None:
+        """Emit per-NPU traces for the MODEL type: forward and input-gradient collectives only."""
+        layers = self.get_layers(f, num_layers)
+        for npu_id in range(self.num_npus):
+            output_filename = "%s.%d.et" % (self.output_filename, npu_id)
+            with open(output_filename, "wb") as g:
+                global_metadata = self.get_global_metadata()
+                encode_message(g, global_metadata)
+                for _ in range(self.num_passes):
+                    fwd_comm_node = None
+                    # forward pass: each layer's compute waits on the previous layer's collective
+                    for idx, layer in enumerate(layers):
+                        fwd_comp_node = self.get_comp_node(layer.name, "FWD", layer.fwd_comp_time)
+                        if idx != 0:
+                            self.add_parent(fwd_comp_node, layers[idx - 1].fwd_comm_node)
+                        if layer.bwd_wg_comp_node is not None:
+                            self.add_parent(fwd_comp_node, layer.bwd_wg_comp_node)
+                        layer.fwd_comp_node = fwd_comp_node
+                        encode_message(g, fwd_comp_node)
+
+                        fwd_comm_node = self.get_comm_coll_node(layer.name, layer.fwd_comm_type, layer.fwd_comm_size)
+                        layer.fwd_comm_node = fwd_comm_node
+                        self.add_parent(fwd_comm_node, fwd_comp_node)
+                        encode_message(g, fwd_comm_node)
+
+                    # backward pass: layers are visited last to first
+                    for idx, layer in enumerate(reversed(layers)):
+                        bwd_ig_comp_node = self.get_comp_node(layer.name, "BWD_IG", layer.bwd_ig_comp_time)
+                        if idx == 0:
+                            if fwd_comm_node is None:
+                                raise ValueError("fwd_comm_node is None")
+                            self.add_parent(bwd_ig_comp_node, fwd_comm_node)
+                        else:
+                            self.add_parent(bwd_ig_comp_node, layers[len(layers) - idx].bwd_wg_comp_node)
+                            self.add_parent(bwd_ig_comp_node, layers[len(layers) - idx].bwd_ig_comm_node)
+                        encode_message(g, bwd_ig_comp_node)
+                        # No collective for the first layer; test the parsed count, not the header's num_layers.
+                        if idx != (len(layers) - 1):
+                            bwd_ig_comm_node = self.get_comm_coll_node(
+                                layer.name, layer.bwd_ig_comm_type, layer.bwd_ig_comm_size
+                            )
+                            self.add_parent(bwd_ig_comm_node, bwd_ig_comp_node)
+                            layer.bwd_ig_comm_node = bwd_ig_comm_node
+                            encode_message(g, bwd_ig_comm_node)
+
+                        bwd_wg_comp_node = self.get_comp_node(layer.name, "BWD_WG", layer.bwd_wg_comp_time)
+                        self.add_parent(bwd_wg_comp_node, bwd_ig_comp_node)
+                        layer.bwd_wg_comp_node = bwd_wg_comp_node
+                        encode_message(g, bwd_wg_comp_node)
+
+                for layer in layers:
+                    layer.bwd_wg_comp_node = None
+
+    def convert_hybrid_data_model(self, f: TextIOWrapper, num_layers: int) -> None:
+        """Emit per-NPU HYBRID_DATA_MODEL traces: forward, input-gradient and weight-gradient collectives."""
+        layers = self.get_layers(f, num_layers)
+        for npu_id in range(self.num_npus):
+            output_filename = "%s.%d.et" % (self.output_filename, npu_id)
+            with open(output_filename, "wb") as g:
+                global_metadata = self.get_global_metadata()
+                encode_message(g, global_metadata)
+                for _ in range(self.num_passes):
+                    fwd_comm_node = None
+                    # forward pass: a compute node followed by a collective for every layer
+                    for idx, layer in enumerate(layers):
+                        fwd_comp_node = self.get_comp_node(layer.name, "FWD", layer.fwd_comp_time)
+                        if layer.bwd_wg_comm_node is not None:
+                            self.add_parent(fwd_comp_node, layer.bwd_wg_comm_node)
+                        if idx != 0:
+                            self.add_parent(fwd_comp_node, layers[idx - 1].fwd_comm_node)
+                        encode_message(g, fwd_comp_node)
+
+                        fwd_comm_node = self.get_comm_coll_node(layer.name, layer.fwd_comm_type, layer.fwd_comm_size)
+                        self.add_parent(fwd_comm_node, fwd_comp_node)
+                        layer.fwd_comm_node = fwd_comm_node
+                        encode_message(g, fwd_comm_node)
+
+                    # backward pass: layers are visited last to first
+                    for idx, layer in enumerate(reversed(layers)):
+                        bwd_ig_comp_node = self.get_comp_node(layer.name, "BWD_IG", layer.bwd_ig_comp_time)
+                        if idx == 0:
+                            if fwd_comm_node is None:
+                                raise ValueError("fwd_comm_node is None")
+                            self.add_parent(bwd_ig_comp_node, fwd_comm_node)
+                        else:
+                            self.add_parent(bwd_ig_comp_node, layers[len(layers) - idx].bwd_wg_comp_node)
+                            self.add_parent(bwd_ig_comp_node, layers[len(layers) - idx].bwd_ig_comm_node)
+                        encode_message(g, bwd_ig_comp_node)
+                        # No IG collective for the first layer; test the parsed count, not the header's num_layers.
+                        if idx != len(layers) - 1:
+                            bwd_ig_comm_node = self.get_comm_coll_node(
+                                layer.name + "_IG_COMM_", layer.bwd_ig_comm_type, layer.bwd_ig_comm_size
+                            )
+                            self.add_parent(bwd_ig_comm_node, bwd_ig_comp_node)
+                            layer.bwd_ig_comm_node = bwd_ig_comm_node
+                            encode_message(g, bwd_ig_comm_node)
+
+                        bwd_wg_comp_node = self.get_comp_node(layer.name, "BWD_WG", layer.bwd_wg_comp_time)
+                        self.add_parent(bwd_wg_comp_node, bwd_ig_comp_node)
+                        layer.bwd_wg_comp_node = bwd_wg_comp_node
+                        encode_message(g, bwd_wg_comp_node)
+
+                        bwd_wg_comm_node = self.get_comm_coll_node(
+                            layer.name, layer.bwd_wg_comm_type, layer.bwd_wg_comm_size
+                        )
+                        self.add_parent(bwd_wg_comm_node, bwd_wg_comp_node)
+                        layer.bwd_wg_comm_node = bwd_wg_comm_node
+                        encode_message(g, bwd_wg_comm_node)
+
+                for layer in layers:
+                    layer.bwd_wg_comm_node = None
+
+    def convert_hybrid_model_data(self, f: TextIOWrapper, num_layers: int) -> None:
+        """Emit per-NPU HYBRID_MODEL_DATA traces: forward, input-gradient and weight-gradient collectives."""
+        layers = self.get_layers(f, num_layers)
+        for npu_id in range(self.num_npus):
+            output_filename = "%s.%d.et" % (self.output_filename, npu_id)
+            with open(output_filename, "wb") as g:
+                global_metadata = self.get_global_metadata()
+                encode_message(g, global_metadata)
+                for _ in range(self.num_passes):
+                    fwd_comm_node = None
+                    # forward pass: a compute node followed by a collective for every layer
+                    for idx, layer in enumerate(layers):
+                        fwd_comp_node = self.get_comp_node(layer.name, "FWD", layer.fwd_comp_time)
+                        if layer.bwd_wg_comm_node is not None:
+                            self.add_parent(fwd_comp_node, layer.bwd_wg_comm_node)
+                        if idx != 0:
+                            self.add_parent(fwd_comp_node, layers[idx - 1].fwd_comm_node)
+                        encode_message(g, fwd_comp_node)
+
+                        fwd_comm_node = self.get_comm_coll_node(layer.name, layer.fwd_comm_type, layer.fwd_comm_size)
+                        self.add_parent(fwd_comm_node, fwd_comp_node)
+                        layer.fwd_comm_node = fwd_comm_node
+                        encode_message(g, fwd_comm_node)
+
+                    # backward pass: layers are visited last to first
+                    for idx, layer in enumerate(reversed(layers)):
+                        bwd_ig_comp_node = self.get_comp_node(layer.name, "BWD_IG", layer.bwd_ig_comp_time)
+                        if idx == 0:
+                            if fwd_comm_node is None:
+                                raise ValueError("fwd_comm_node is None")
+                            self.add_parent(bwd_ig_comp_node, fwd_comm_node)
+                        else:
+                            self.add_parent(bwd_ig_comp_node, layers[len(layers) - idx].bwd_wg_comp_node)
+                            self.add_parent(bwd_ig_comp_node, layers[len(layers) - idx].bwd_ig_comm_node)
+                        encode_message(g, bwd_ig_comp_node)
+                        # No IG collective for the first layer; test the parsed count, not the header's num_layers.
+                        if idx != len(layers) - 1:
+                            bwd_ig_comm_node = self.get_comm_coll_node(
+                                layer.name, layer.bwd_ig_comm_type, layer.bwd_ig_comm_size
+                            )
+                            self.add_parent(bwd_ig_comm_node, bwd_ig_comp_node)
+                            layer.bwd_ig_comm_node = bwd_ig_comm_node
+                            encode_message(g, bwd_ig_comm_node)
+
+                        bwd_wg_comp_node = self.get_comp_node(layer.name, "BWD_WG", layer.bwd_wg_comp_time)
+                        self.add_parent(bwd_wg_comp_node, bwd_ig_comp_node)
+                        layer.bwd_wg_comp_node = bwd_wg_comp_node
+                        encode_message(g, bwd_wg_comp_node)
+
+                        bwd_wg_comm_node = self.get_comm_coll_node(
+                            layer.name, layer.bwd_wg_comm_type, layer.bwd_wg_comm_size
+                        )
+                        self.add_parent(bwd_wg_comm_node, bwd_wg_comp_node)
+                        layer.bwd_wg_comm_node = bwd_wg_comm_node
+                        encode_message(g, bwd_wg_comm_node)
+
+                for layer in layers:
+                    layer.bwd_wg_comm_node = None
+
+    def convert_hybrid_dlrm(self, f: TextIOWrapper, num_layers: int, last_bottom_layer: int) -> None:
+        """Emit per-NPU traces for the HYBRID_DLRM types; `last_bottom_layer` is an index into the layers."""
+        layers = self.get_layers(f, num_layers)
+        for npu_id in range(self.num_npus):
+            output_filename = "%s.%d.et" % (self.output_filename, npu_id)
+            with open(output_filename, "wb") as g:
+                global_metadata = self.get_global_metadata()
+                encode_message(g, global_metadata)
+                for i in range(self.num_passes):
+                    fwd_comp_node = None
+                    # forward pass: layers in input order
+                    for idx, layer in enumerate(layers):
+                        fwd_comp_node = self.get_comp_node(layer.name, "FWD", layer.fwd_comp_time)
+                        if layer.bwd_wg_comm_node is not None:  # left over from the previous pass
+                            self.add_parent(fwd_comp_node, layer.bwd_wg_comm_node)
+                        elif layer.bwd_wg_comp_node is not None:
+                            self.add_parent(fwd_comp_node, layer.bwd_wg_comp_node)
+                        if idx != 0:
+                            self.add_parent(fwd_comp_node, layers[idx - 1].fwd_comp_node)
+                        if idx == last_bottom_layer:  # this layer also waits on layer 0's forward collective
+                            self.add_parent(fwd_comp_node, layers[0].fwd_comm_node)
+                        layer.fwd_comp_node = fwd_comp_node
+                        encode_message(g, fwd_comp_node)
+
+                        if layer.fwd_comm_type == "ALLTOALL":  # no forward collective for any other type
+                            fwd_comm_node = self.get_comm_coll_node(
+                                layer.name, layer.fwd_comm_type, layer.fwd_comm_size
+                            )
+                            self.add_parent(fwd_comm_node, fwd_comp_node)
+                            layer.fwd_comm_node = fwd_comm_node
+                            encode_message(g, fwd_comm_node)
+
+                    # backward pass: layers are visited last to first
+                    for idx, layer in enumerate(reversed(layers)):
+                        bwd_wg_comp_node = self.get_comp_node(layer.name, "BWD_WG", layer.bwd_wg_comp_time)
+                        if idx == 0:
+                            if fwd_comp_node is None:
+                                raise ValueError("fwd_comp_node is None")
+                            self.add_parent(bwd_wg_comp_node, fwd_comp_node)
+                        else:
+                            if layers[len(layers) - idx].bwd_ig_comp_node is not None:  # previous iteration's layer
+                                self.add_parent(bwd_wg_comp_node, layers[len(layers) - idx].bwd_ig_comp_node)
+                            if layers[len(layers) - idx - 1].bwd_ig_comm_node is not None:  # i.e. the current layer
+                                self.add_parent(bwd_wg_comp_node, layers[len(layers) - idx - 1].bwd_ig_comm_node)
+                        layer.bwd_wg_comp_node = bwd_wg_comp_node
+                        encode_message(g, bwd_wg_comp_node)
+
+                        if layer.bwd_wg_comm_type != "NONE":  # "NONE" means no weight-gradient collective
+                            bwd_wg_comm_node = self.get_comm_coll_node(
+                                layer.name, layer.bwd_wg_comm_type, layer.bwd_wg_comm_size
+                            )
+                            self.add_parent(bwd_wg_comm_node, bwd_wg_comp_node)
+                            layer.bwd_wg_comm_node = bwd_wg_comm_node
+                            encode_message(g, bwd_wg_comm_node)
+
+                        bwd_ig_comp_node = None
+                        if idx != (len(layers) - 1):  # every layer except layers[0]
+                            bwd_ig_comp_node = self.get_comp_node(layer.name, "BWD_IG", layer.bwd_ig_comp_time)
+                            self.add_parent(bwd_ig_comp_node, bwd_wg_comp_node)
+                            layer.bwd_ig_comp_node = bwd_ig_comp_node
+                            encode_message(g, bwd_ig_comp_node)
+
+                        if (len(layers) - idx - 1) == (last_bottom_layer + 1):  # collective is built from layers[0]
+                            bwd_ig_comm_node = self.get_comm_coll_node(
+                                layers[0].name, layers[0].bwd_ig_comm_type, layers[0].bwd_ig_comm_size
+                            )
+                            if bwd_ig_comp_node is None:
+                                raise ValueError("bwd_ig_comp_node is None")
+                            self.add_parent(bwd_ig_comm_node, bwd_ig_comp_node)
+                            layers[0].bwd_ig_comm_node = bwd_ig_comm_node
+                            encode_message(g, bwd_ig_comm_node)
+
+                for layer in layers:  # clear per-layer backward links before the next NPU's file
+                    layer.bwd_wg_comm_node = None
+                    layer.bwd_wg_comp_node = None
+                    layer.bwd_ig_comm_node = None
+                    layer.bwd_ig_comp_node = None