diff --git a/causy/sample_generator.py b/causy/sample_generator.py
index 9d5a32d..1ea1dcb 100644
--- a/causy/sample_generator.py
+++ b/causy/sample_generator.py
@@ -1,5 +1,7 @@
 import abc
+from dataclasses import dataclass
 from types import SimpleNamespace
+
 import torch

 from causy.graph import Graph
@@ -18,35 +20,39 @@ def random() -> torch.Tensor:
     return torch.randn(1, dtype=torch.float32).item()


-class SampleEdge:
+@dataclass
+class NodeReference:
     """
-    Represents an edge in a sample graph - defines a directed edge from source to target
-
-    Example:
-    SampleEdge("X", "Y") defines an edge from X to Y
-
+    A reference to a node in the sample generator
     """

-    def __init__(self, source, target):
-        self.source = source
-        self.target = target
+    node: str
+
+    def __str__(self):
+        return self.node


-class SampleLaggedEdge(SampleEdge):
+@dataclass
+class TimeAwareNodeReference(NodeReference):
+    """
+    A reference to a node in the sample generator at a specific point in time
     """
-    Represents a lagged edge in a time series sample graph.
-    Defines a directed edge from source to target with a lag of lag. The lag is the number of time steps between the
-    source and the target.
-    Example:
-    SampleLaggedEdge("X", "Y", 1) defines an edge from X to Y with a lag of 1

+    point_in_time: int = 0
+    def __str__(self):
+        return f"{self.node} - t{self.point_in_time}"
+
+
+@dataclass
+class SampleEdge:
+    """
+    An edge in the sample generator that connects two node references with a coefficient (value)
     """

-    def __init__(self, source, target, lag):
-        super().__init__(source, target)
-        self.lag = lag
+    from_node: NodeReference
+    to_node: NodeReference
+    value: float = 0


 class TimeTravelingError(Exception):
@@ -57,190 +63,218 @@ class TimeTravelingError(Exception):
     pass


-class TimeProxy:
-    """
-    A proxy object that allows to access past values of a variable by using the t() method.
-
-    Example:
-    >>> tp = TimeProxy(5)
-    >>> tp.set_current_time(1)
-    >>> tp.t(-1)
-    5
-    """
+class AbstractSampleGenerator(abc.ABC):
+    def __init__(
+        self,
+        edges: List[SampleEdge],
+        random: Callable = random,  # to make generation deterministic in tests, pass random=lambda: 0
+    ):
+        self._edges = edges
+        self._variables = self._find_variables_in_edges()
+        self.random_fn = random

-    def __init__(self, initial_value: torch.Tensor):
+    @abc.abstractmethod
+    def generate(self, size: int) -> SimpleNamespace:
         """
-        :param initial_value: the initial value of the variable
+        Generate data for a sample graph
+        :param size: the number of samples (or time steps) to generate
+        :return: the generated data and the sample graph
         """
-        if not isinstance(initial_value, torch.Tensor):
-            initial_value = torch.tensor(initial_value, dtype=torch.float32)
-        self._lst = [initial_value]
-        self._t = 0
+        pass

-    def set_current_time(self, t):
+    @abc.abstractmethod
+    def _generate_data(self, size: int) -> Dict[str, torch.Tensor]:
         """
-        Set the current time step which t will be relative to
-        :param t: time step as an integer
-        :return:
+        Generate data for a sample graph
+        :param size: the number of samples (or time steps) to generate
+        :return: the generated data
         """
-        self._t = t
+        pass

-    def t(self, t):
+    def _find_variables_in_edges(self):
         """
-        Return the value of the variable at time step t
-        :param t: the relative time step as a negative integer
-        :return: the value of the variable at time step t or a random number if t is too large
-        :raises TimeTravelingError: if t is positive
+        Find all variables in the edges of the sample generator. We need this to calculate the initial values for all
+        existing variables.
+        :return: a set of all variables submitted via the edges
         """
-        if t > 0:
-            raise TimeTravelingError(
-                f"Cannot travel into the future ({self._t + t} steps ahead)."
-            )
-        elif t + self._t < 0:
-            # TODO this might be a bad idea
-            return random()
-        return self._lst[self._t + t]
+        variables = set()
+        for edge in self._edges:
+            variables.add(edge.from_node.node)
+            variables.add(edge.to_node.node)
+        return variables
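The refactor above replaces the string-based SampleEdge/SampleLaggedEdge pair with small dataclasses. As a rough usage sketch (assuming this branch of causy is importable), edges are now declared through node references, and the variable set that AbstractSampleGenerator works with is simply the union of the names mentioned on either side of an edge:

    from causy.sample_generator import NodeReference, SampleEdge

    # X -> Y with coefficient 5 and Y -> Z with coefficient 7 (the values used in the tests below)
    edges = [
        SampleEdge(NodeReference("X"), NodeReference("Y"), 5),
        SampleEdge(NodeReference("Y"), NodeReference("Z"), 7),
    ]

    # _find_variables_in_edges() collects every node name mentioned by an edge
    variables = {e.from_node.node for e in edges} | {e.to_node.node for e in edges}
    print(sorted(variables))  # ['X', 'Y', 'Z']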

-    def append(self, value):
+    def _get_edges_for_node_to(self, node: str):
         """
-        Append a value to the list of values
-        :param value: the value to append
-        :return:
+        Get all edges that point to a specific node
+        :param node: the node to get the edges for
+        :return: a list of edges
         """
-        if not isinstance(value, torch.Tensor):
-            value = torch.tensor(value, dtype=torch.float32)
-        self._lst.append(value)
+        return [edge for edge in self._edges if edge.to_node.node == node]

-    def to_list(self):
-        """
-        Return the list of values
-        :return: the list
-        """
-        return torch.stack(self._lst)

-    def __repr__(self):
-        return f"{self._lst} at {self._t}"

+class IIDSampleGenerator(AbstractSampleGenerator):
+    """
+    A sample generator that generates data from i.i.d. multivariate Gaussians.
+
+    A variable cannot depend on itself.
+
+    Example:
+    >>> sg = IIDSampleGenerator(
+    >>>     edges=[
+    >>>         SampleEdge(NodeReference("X"), NodeReference("Y"), 5),
+    >>>         SampleEdge(NodeReference("Y"), NodeReference("Z"), 7),
+    >>>     ],
+    >>> )

-class CurrentElementProxy(float):
-    """
-    A proxy object that allows to access the current value of a variable. It is a subclass of float, so it can be used
-    as a float.
     """

-    # TODO: fix this class. Bug: IIDSampleGenerator only depends on the initial value, it should depend on the step
+    def topologic_sort(self, nodes: List[str]):
+        """
+        Sort the nodes topologically, so that every node comes after the nodes it depends on
+        :param nodes: list of nodes
+        :return: a list of sorted nodes
+        """
+        sorted_nodes = []
+        while nodes:
+            for node in nodes:
+                if set(
+                    [edge.from_node.node for edge in self._get_edges_for_node_to(node)]
+                ).issubset(set(sorted_nodes)):
+                    sorted_nodes.append(node)
+                    nodes.remove(node)
+                    break
+        return sorted_nodes
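The sort above is a simple Kahn-style loop: repeatedly emit a node whose parents have all been emitted already. A standalone sketch of the same idea (not the causy method itself, and copying the input so the caller's collection is not emptied):

    def topologic_sort(nodes, parents_of):
        """Repeatedly emit a node whose parents have all been emitted already."""
        nodes = list(nodes)  # work on a copy
        sorted_nodes = []
        while nodes:
            for node in nodes:
                if set(parents_of(node)).issubset(sorted_nodes):
                    sorted_nodes.append(node)
                    nodes.remove(node)
                    break
        return sorted_nodes

    parents = {"X": [], "Y": ["X"], "Z": ["Y"]}
    print(topologic_sort(["Z", "Y", "X"], lambda n: parents[n]))  # ['X', 'Y', 'Z']

As in the method above, a cyclic edge set would make this loop run forever; the generator does not guard against cycles.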

-    def __init__(self, initial_value: torch.Tensor):
-        if not isinstance(initial_value, torch.Tensor):
-            initial_value = torch.tensor(initial_value, dtype=torch.float32)
-        self.lst = [initial_value]
-        self.value = initial_value
+    def _generate_data(self, size):
+        """
+        Generate data for a sample graph without a time dimension
+        :param size: the number of samples to generate
+        :return: the generated data
+        """
+        internal_repr = {}

-    def append(self, value):
-        if not isinstance(value, torch.Tensor):
-            value = torch.tensor(value, dtype=torch.float32)
+        # Initialize the output dictionary by adding noise
+        for k in self._variables:
+            internal_repr[k] = torch.tensor(
+                [self.random_fn() for _ in range(size)], dtype=torch.float32
+            )

-        self.lst.append(value)
-        self.value = value
+        # Collect the ingoing edges for every node
+        ingoing_edges = {}

-    def to_list(self):
-        return torch.stack(self.lst)
+        for node_name in self._variables:
+            # Get the edges that point to this node
+            ingoing_edges[node_name] = self._get_edges_for_node_to(node_name)

+        # Topological sort: order the nodes such that every node comes after the nodes it depends on
+        sorted_nodes = self.topologic_sort(list(self._variables))

-class AbstractSampleGenerator(abc.ABC):
-    """
-    An abstract class for sample generators that generate data for a sample graph.
-    It is implemented by TimeseriesSampleGenerator and IIDSampleGenerator.
+        # Generate the data
+        for to_node in sorted_nodes:
+            for edge in ingoing_edges[to_node]:
+                from_node = edge.from_node.node
+                internal_repr[to_node] += edge.value * internal_repr[from_node]
+        return internal_repr

-    """
+    def generate(self, size):
+        """
+        Generate data for a sample graph without a time dimension
+        :param size: the number of samples to generate
+        :return: the generated data and the sample graph
+        """
+        output = self._generate_data(size)
+        graph = Graph()
+        for i in self._variables:
+            graph.add_node(
+                i,
+                output[i],
+                id_=i,
+                metadata={"variable": i},
+            )

-    def __init__(
-        self,
-        initial_values: Dict[str, any],
-        generators: Dict[str, Callable],
-        edges: List[Union[SampleLaggedEdge, SampleEdge]],
-        variables: Optional[Dict[str, any]] = None,
-    ):
-        self.initial_values = initial_values
-        self.generators = generators
-        self.edges = edges
-        if variables is None:
-            variables = {}
-        self.vars = variables
+        for edge in self._edges:
+            graph.add_directed_edge(
+                graph.nodes[edge.from_node.node],
+                graph.nodes[edge.to_node.node],
+                metadata={},
+            )

-    @abc.abstractmethod
-    def generate(self, size: int):
-        pass
+        return output, graph
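A minimal usage sketch for the i.i.d. generator, mirroring the tests further down: fixing the noise term makes the output deterministic, so every sample satisfies X = 1, Y = 5*X + 1 = 6 and Z = 7*Y + 1 = 43.

    import torch
    from causy.sample_generator import IIDSampleGenerator, NodeReference, SampleEdge

    sg = IIDSampleGenerator(
        edges=[
            SampleEdge(NodeReference("X"), NodeReference("Y"), 5),
            SampleEdge(NodeReference("Y"), NodeReference("Z"), 7),
        ],
    )
    sg.random_fn = lambda: torch.tensor(1, dtype=torch.float32)  # fixed "noise"

    data = sg._generate_data(100)  # generate() additionally returns the sample Graph
    print(float(data["X"][0]), float(data["Y"][0]), float(data["Z"][0]))  # 1.0 6.0 43.0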

+# TODO: Does not work for multiple lags properly yet and is numerically unstable for several cases (check why, fix it)
 class TimeseriesSampleGenerator(AbstractSampleGenerator):
     """
     A sample generator that generates data for a sample graph with a time dimension.

-    Generator functions are written as a lambda function that takes two arguments: the current timestep and the input.
-    The input is a SimpleNamespace object that contains the current values of all variables. Via the t(-n) method of the
-    TimeProxy class, the generator can access the values of the variables at previous time steps.
-
-    During generation, the generator functions are called in the order of the keys of the generators dictionary. This
-    means that the order of the keys determines the order in which the variables are generated. If a variable depends on
-    another variable, the generator function of the dependent variable should be defined after the generator function of
-    the variable it depends on.
+    Edges are defined as SampleEdges between TimeAwareNodeReferences, which define a directed edge from a source
+    node to a target node with a lag. The lag is the number of time steps between the source and the target.

-    A variable can depend on itself, but only on its past values (with a lag). This is useful for autoregressive models.
+    A variable can depend on itself, but only on its past values (with a lag). This corresponds to autoregressive models.

     Example:
     >>> sg = TimeseriesSampleGenerator(
-    >>>     initial_values={
-    >>>         "Z": random(),
-    >>>         "Y": random(),
-    >>>         "X": random(),
-    >>>     },
-    >>>     variables={
-    >>>         "alpha": 0.9,
-    >>>     },
-    >>>     # generate the dependencies of variables on past values of themselves and other variables
-    >>>     generators={
-    >>>         "Z": lambda t, i: i.Z.t(-1) * i.alpha + random(),
-    >>>         "Y": lambda t, i: i.Y.t(-1) * i.alpha + i.Z.t(-1) + random(),
-    >>>         "X": lambda t, i: i.X.t(-1) * i.alpha + i.Y.t(-1) + random()
-    >>>     },
     >>>     edges=[
-    >>>         SampleLaggedEdge("X", "X", 1),
-    >>>         SampleLaggedEdge("Y", "Y", 1),
-    >>>         SampleLaggedEdge("Z", "Z", 1),
-    >>>         SampleLaggedEdge("Y", "Z", 1),
-    >>>         SampleLaggedEdge("Y", "X", 4),
-    >>>     ]
+    >>>         SampleEdge(TimeAwareNodeReference("X", -1), TimeAwareNodeReference("X"), 0.9),
+    >>>         SampleEdge(TimeAwareNodeReference("Y", -1), TimeAwareNodeReference("Y"), 0.9),
+    >>>         SampleEdge(TimeAwareNodeReference("Z", -1), TimeAwareNodeReference("Z"), 0.9),
+    >>>         SampleEdge(TimeAwareNodeReference("Z", -1), TimeAwareNodeReference("Y"), 5),
+    >>>         SampleEdge(TimeAwareNodeReference("Y", -1), TimeAwareNodeReference("X"), 7),
+    >>>     ],
     >>> )

     """

+    def __init__(
+        self,
+        edges: List[SampleEdge],
+        random: Callable = random,  # to make generation deterministic in tests, pass random=lambda: 0
+    ):
+        super().__init__(edges, random)
+        self._longest_lag = max(
+            [abs(edge.from_node.point_in_time) for edge in self._edges]
+        )
+
+    _initial_distribution_fn: Callable = lambda self, x: torch.normal(0, x)
+
     def _generate_data(self, size):
         """
         Generate data for a sample graph with a time dimension
-        :param size:
-        :return:
+        :param size: the number of time steps to generate
+        :return: the generated data
         """
         internal_repr = {}
+        initial_values = self._calculate_initial_values()

         # Initialize the output dictionary
-        for i, v in self.initial_values.items():
-            internal_repr[i] = TimeProxy(v)
+        for k in self._variables:
+            internal_repr[k] = [initial_values[k]]

-        # Generate the data for each time step
         for t in range(1, size):
-            for value in self.generators.keys():
-                internal_repr[value].set_current_time(t)
-                generator_input = internal_repr
-                generator_input.update(self.vars)
-                internal_repr[value].append(
-                    self.generators[value](t, SimpleNamespace(**generator_input))
-                )
-
-        output = {}
-        for i in self.generators.keys():
-            output[i] = internal_repr[i].to_list()
-
-        return output
+            for node_name in self._variables:
+                # Get the edges that point to this node
+                edges = self._get_edges_for_node_to(node_name)
+                result = torch.tensor(0.0, dtype=torch.float32)
+                for edge in edges:
+                    if abs(edge.from_node.point_in_time) > t:
+                        result += (
+                            edge.value * initial_values[edge.from_node.node]
+                        )  # TODO(sofia): map here to the proper point in time
+                    else:
+                        result += (
+                            edge.value
+                            * internal_repr[edge.from_node.node][
+                                t + edge.from_node.point_in_time
+                            ]
+                        )
+
+                result += self.random_fn()
+                internal_repr[node_name].append(result)
+
+        for k, v in internal_repr.items():
+            internal_repr[k] = torch.stack(v)
+
+        return internal_repr
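The recursion above falls back to the pre-computed initial value whenever a lag reaches further back than the data generated so far. A hand-check of that behaviour for the two-lag model used in test_data_generator_multiple_autocorrelations below (X_t = 0.4*X_{t-1} + 0.4*X_{t-2}, noise fixed to 0, initial value fixed to 1):

    x = [1.0]  # X_0 comes from _initial_distribution_fn, which the test fixes to 1
    for t in range(1, 4):
        lag_1 = x[t - 1]
        lag_2 = x[t - 2] if t - 2 >= 0 else 1.0  # history missing -> fall back to the initial value
        x.append(0.4 * lag_1 + 0.4 * lag_2)
    print([round(v, 3) for v in x])  # [1.0, 0.8, 0.72, 0.608]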

     def generate(self, size):
         """
@@ -250,7 +284,7 @@ def generate(self, size):
         """
         output = self._generate_data(size)
         graph = Graph()
-        for i in self.generators.keys():
+        for i in self._variables:
             for t in range(size):
                 graph.add_node(
                     f"{i} - t{t}",
@@ -260,101 +294,131 @@ def generate(self, size):
         for t in range(1, size):
-            for edge in self.edges:
-                if t - edge.lag < 0:
+            for edge in self._edges:
+                if t - abs(edge.from_node.point_in_time) < 0:
                     logger.debug(
-                        f"Cannot generate data for {edge.source} at t={t}, "
-                        f"since it depends on {edge.lag}-steps-ago value"
+                        f"Cannot generate data for {edge.from_node.node} at t={t}, "
+                        f"since it depends on {abs(edge.from_node.point_in_time)}-steps-ago value"
                     )
                 else:
-                    graph.add_edge(
-                        graph.nodes[f"{edge.source}-t{t - edge.lag}"],
-                        graph.nodes[f"{edge.target}-t{t}"],
+                    graph.add_directed_edge(
+                        graph.nodes[
+                            f"{edge.from_node.node}-t{t - abs(edge.from_node.point_in_time)}"
+                        ],
+                        graph.nodes[f"{edge.to_node.node}-t{t}"],
                         metadata={},
                     )
-                    graph.remove_directed_edge(
-                        graph.nodes[f"{edge.target}-t{t}"],
-                        graph.nodes[f"{edge.source}-t{t - edge.lag}"],
-                    )

         return output, graph

+    def custom_block_diagonal(self, matrices):
+        # Get dimensions
+        num_matrices = len(matrices)
+        n = len(matrices[0])  # Assuming all matrices are of the same size

-class IIDSampleGenerator(AbstractSampleGenerator):
-    """
-    A sample generator that generates data for a sample graph without a time dimension.
+        # Compute total size of the block diagonal matrix
+        total_rows = num_matrices * n
+        total_cols = num_matrices * n

-    Generators are written as a lambda function that takes two arguments: the current step and the input.
-    The input is a SimpleNamespace object that contains the current values of all variables.
+        # Create an empty tensor to hold the block diagonal matrix
+        block_diag = torch.zeros(total_rows, total_cols)

-    A variable can not depend on itself.
+        # Fill the first block row with the input matrices
+        for i, matrix in enumerate(matrices):
+            block_diag[:n, i * n : (i + 1) * n] = torch.tensor(matrix)
+        # Fill the lower subdiagonal with identity matrices
+        row_start = n
+        col_start = 0
+        for i in range(1, num_matrices):
+            block_diag[
+                row_start : row_start + n, col_start : col_start + n
+            ] = torch.eye(n)
+            row_start += n
+            col_start += n

-    Example:
-    >>> sg = IIDSampleGenerator(
-    >>>     initial_values={
-    >>>         "Z": random(),
-    >>>         "Y": random(),
-    >>>         "X": random(),
-    >>>     },
-    >>>     variables={
-    >>>         "param1": 2,
-    >>>         "param2": 3,
-    >>>     },
-    >>>     # generate the dependencies of variables on values of themselves and other variables
-    >>>     generators={
-    >>>         "Z": lambda s, i: random(),
-    >>>         "Y": lambda s, i: i.param1 * i.Z + random(),
-    >>>         "X": lambda s, i: i.param2 * i.Y + random()
-    >>>     },
-    >>>     edges=[
-    >>>         SampleEdge("Z", "Y"),
-    >>>         SampleEdge("Y", "X"),
-    >>>     ]
-    >>> )
+        return block_diag
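Despite its name, custom_block_diagonal assembles the companion form of the lagged system: the first block row holds the per-lag coefficient matrices, and identity blocks on the subdiagonal shift the state back in time. A sketch for the one-variable, two-lag model used in the tests below (coefficient 0.4 at lag 1 and at lag 2), assuming this branch of causy is importable:

    from causy.sample_generator import (
        SampleEdge,
        TimeAwareNodeReference,
        TimeseriesSampleGenerator,
    )

    sg = TimeseriesSampleGenerator(
        edges=[
            SampleEdge(TimeAwareNodeReference("X", -1), TimeAwareNodeReference("X"), 0.4),
            SampleEdge(TimeAwareNodeReference("X", -2), TimeAwareNodeReference("X"), 0.4),
        ],
    )
    print(sg.custom_block_diagonal([[[0.4]], [[0.4]]]))
    # tensor([[0.4000, 0.4000],
    #         [1.0000, 0.0000]])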

-    """
+    def __generate_coefficient_matrix(self):
+        """
+        Generate the coefficient matrix for the sample generator graph
+        :return: the coefficient matrix
+        """

-    # TODO: fix this class. Bug: IIDSampleGenerator only depends on the initial value, it should depend on the step
-    def _generate_data(self, size):
-        internal_repr = {}
+        matrix: List[List[List[float]]] = [
+            [[0 for _ in self._variables] for _ in self._variables]
+            for _ in range(self._longest_lag)
+        ]

-        # Initialize the output dictionary
-        for i, v in self.initial_values.items():
-            internal_repr[i] = CurrentElementProxy(v)
-
-        # Generate the data for each time step
-        for step in range(1, size):
-            for value in self.generators.keys():
-                generator_input = internal_repr
-                generator_input.update(self.vars)
-                internal_repr[value].append(
-                    self.generators[value](step, SimpleNamespace(**generator_input))
-                )
-        output = {}
-        for i in self.generators.keys():
-            output[i] = internal_repr[i].to_list()
+        # Map the variables to matrix positions (indices 0..n-1)
+        values_map = self.__matrix_position_mapping()

-        return output
+        for edge in self._edges:
+            matrix[(edge.from_node.point_in_time * -1) - 1][
+                values_map[edge.to_node.node]
+            ][values_map[edge.from_node.node]] = edge.value

-    def generate(self, size):
-        """
-        Generate data for a sample graph without a time dimension
-        :param size: the number of data points to generate
-        :return: the generated data and the sample graph
+        # Assemble the block (companion) matrix and return it as a torch tensor
+        return self.custom_block_diagonal(matrix)
+
+    def vectorize_identity_block(self, n):
+        # Create an empty tensor
+        matrix = torch.zeros(n, n)
+
+        # Fill the upper left block with an identity matrix
+        matrix[: n // self._longest_lag, : n // self._longest_lag] = torch.eye(
+            n // self._longest_lag
+        )
+
+        # Flatten the matrix
+        vectorized_matrix = matrix.view(-1)
+
+        return vectorized_matrix
+
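vectorize_identity_block builds the (vectorized) covariance of the noise driving the stacked companion state: only the current-time block receives fresh unit-variance noise, the lagged copies receive none. Mirroring the helper for the one-variable, two-lag case (companion dimension n = 2, longest lag 2):

    import torch

    longest_lag, n = 2, 2
    noise_cov = torch.zeros(n, n)
    noise_cov[: n // longest_lag, : n // longest_lag] = torch.eye(n // longest_lag)
    print(noise_cov.view(-1))  # tensor([1., 0., 0., 0.])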
+    def _calculate_initial_values(self):
         """
-        output = self._generate_data(size)
-        graph = Graph()
+        Calculate the initial values for the sample generator graph using the covariance matrix of the noise terms.

-        for i in self.generators.keys():
-            graph.add_node(f"{i}", output[i], id_=f"{i}")
+        coefficient_matrix = [[a, 0], [b, a]], i.e.
+        coefficient_matrix[0][0] is the coefficient of X_t-1 in the equation for X_t, here a
+        coefficient_matrix[0][1] is the coefficient of Y_t-1 in the equation for X_t (here: no edge, that means zero)
+        coefficient_matrix[1][1] is the coefficient of Y_t-1 in the equation for Y_t, here a
+        coefficient_matrix[1][0] is the coefficient of X_t-1 in the equation for Y_t, here b

-        for edge in self.edges:
-            graph.add_edge(
-                graph.nodes[f"{edge.source}"], graph.nodes[f"{edge.target}"], value={}
-            )
-            graph.remove_directed_edge(
-                graph.nodes[f"{edge.target}"], graph.nodes[f"{edge.source}"]
-            )
+        The entries of the resulting covariance matrix mirror these positions: if entry [0][0] of the coefficient
+        matrix corresponds to X_{t-1} -> X_t, then entry [0][0] of the covariance matrix is the variance of X_t,
+        i.e. V(X_t), and an off-diagonal entry such as [1][0] is the covariance of the corresponding pair,
+        i.e. Cov(Y_t, X_t).

-        return output, graph
+        :return: the initial values for the sample generator graph as a dictionary
+        """
+        coefficient_matrix = self.__generate_coefficient_matrix()
+        n, _ = coefficient_matrix.shape
+
+        kronecker_product = torch.kron(coefficient_matrix, coefficient_matrix)
+        identity_matrix = torch.eye(n**2)
+        cov_matrix_noise_terms_vectorized = self.vectorize_identity_block(n)
+        inv_identity_minus_kronecker_product = torch.linalg.pinv(
+            identity_matrix - kronecker_product
+        )
+        vectorized_covariance_matrix = torch.matmul(
+            inv_identity_minus_kronecker_product,
+            cov_matrix_noise_terms_vectorized,
+        )
+        vectorized_covariance_matrix = vectorized_covariance_matrix.reshape(n, n)
+
+        initial_values: Dict[str, torch.Tensor] = {}
+        values = torch.diagonal(vectorized_covariance_matrix, offset=0)
+        for k, i in self.__matrix_position_mapping().items():
+            initial_values[k] = self._initial_distribution_fn(torch.sqrt(values[i]))
+        return initial_values
+
+    def __matrix_position_mapping(self):
+        """
+        Map the variables to indices 0..n-1. This is needed to build the coefficient matrix and to read off the
+        initial values for the sample generator graph.
+        :return: a dictionary mapping each variable name to its matrix position
+        """
+        values_map = {}
+        for i, k in enumerate(self._variables):
+            values_map[k] = i
+        return values_map
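In other words, _calculate_initial_values solves the stationary-covariance (discrete Lyapunov) equation Sigma = A Sigma A^T + Q in its vectorized form, vec(Sigma) = (I - A kron A)^{-1} vec(Q), and feeds the resulting standard deviations into _initial_distribution_fn. For a single autoregression X_t = 0.9*X_{t-1} + noise this reduces to Var(X) = 1/(1 - 0.9^2) ~ 5.263, the value asserted in test_generating_initial_values below. A minimal sketch of the same computation:

    import torch

    A = torch.tensor([[0.9]])  # companion matrix of X_t = 0.9 * X_{t-1} + noise
    Q = torch.eye(1)           # unit-variance noise
    n = A.shape[0]
    vec_sigma = torch.linalg.pinv(torch.eye(n**2) - torch.kron(A, A)) @ Q.reshape(-1)
    print(vec_sigma.reshape(n, n))  # tensor([[5.2632]]), i.e. 1 / (1 - 0.9**2)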
diff --git a/tests/test_sample_generator.py b/tests/test_sample_generator.py
index 4772f2c..e26ac9d 100644
--- a/tests/test_sample_generator.py
+++ b/tests/test_sample_generator.py
@@ -1,95 +1,144 @@
 import unittest

 import torch
+import numpy as np

 from causy.sample_generator import (
     TimeseriesSampleGenerator,
     random,
-    SampleLaggedEdge,
+    SampleEdge,
     IIDSampleGenerator,
+    TimeAwareNodeReference,
+    NodeReference,
 )

 from causy.sample_generator import SampleEdge


+def set_random_seed(seed):
+    # Ensure reproducibility across operating systems
+    torch.manual_seed(seed)
+    torch.cuda.manual_seed(seed)
+    torch.backends.cudnn.deterministic = True
+    torch.backends.cudnn.benchmark = False
+    np.random.seed(seed)
+
+
 class TimeSeriesSampleGeneratorTest(unittest.TestCase):
+    def test_iid_sample_generator(self):
+        model = IIDSampleGenerator(
+            edges=[
+                SampleEdge(NodeReference("X"), NodeReference("Y"), 5),
+                SampleEdge(NodeReference("Y"), NodeReference("Z"), 7),
+            ]
+        )
+        result = model._generate_data(100)
+        self.assertEqual(list(result["X"].shape), [100])
+
     def test_iid_sample_generator_without_randomness(self):
-        self.assertTrue(True)
-        # TODO: fix bug in iid sample generator and write test
-
-    def test_timeseries_sample_generator(self):
-        MODEL_ONE = TimeseriesSampleGenerator(
-            initial_values={
-                "Z": 1,
-                "Y": 2,
-                "X": 3,
-            },
-            variables={
-                "alpha": 0.9,
-                "beta": 0.9,
-                "gamma": 0.9,
-                "param_1": 5,
-                "param_2": 7,
-            },
-            # generate the dependencies of variables on past values of themselves and other variables
-            generators={
-                "Z": lambda t, i: i.Z.t(-1) * i.alpha,
-                "Y": lambda t, i: i.Y.t(-1) * i.beta + i.param_1 * i.Z.t(-1),
-                "X": lambda t, i: i.X.t(-1) * i.gamma + i.param_2 * i.Y.t(-1),
-            },
+        model = IIDSampleGenerator(
+            edges=[
+                SampleEdge(NodeReference("X"), NodeReference("Y"), 5),
+                SampleEdge(NodeReference("Y"), NodeReference("Z"), 7),
+            ]
+        )
+        model.random_fn = lambda: torch.tensor(1, dtype=torch.float32)
+
+        result = model._generate_data(100)
+        self.assertEqual(list(result["X"].shape), [100])
+        self.assertEqual(result["X"][0], 1)
+        self.assertEqual(result["X"][20], 1)
+        self.assertEqual(result["Y"][0], 6)
+        self.assertEqual(result["Y"][20], 6)
+        self.assertEqual(result["Z"][0], 43)
+        self.assertEqual(result["Z"][20], 43)
+
+    def test_iid_sample_generator_more_complex_case_without_randomness(self):
+        model = IIDSampleGenerator(
             edges=[
-                SampleLaggedEdge("X", "X", 1),
-                SampleLaggedEdge("Y", "Y", 1),
-                SampleLaggedEdge("Z", "Z", 1),
-                SampleLaggedEdge("Z", "Y", 1),
-                SampleLaggedEdge("Y", "X", 1),
+                SampleEdge(NodeReference("X"), NodeReference("Y"), 5),
+                SampleEdge(NodeReference("Y"), NodeReference("Z"), 1),
+                SampleEdge(NodeReference("W"), NodeReference("Y"), 5),
+            ]
+        )
+        model.random_fn = lambda: torch.tensor(1, dtype=torch.float32)
+
+        result = model._generate_data(100)
+        self.assertEqual(list(result["X"].shape), [100])
+        self.assertEqual(result["X"][0], 1)
+        self.assertEqual(result["X"][20], 1)
+        self.assertEqual(result["W"][0], 1)
+        self.assertEqual(result["W"][20], 1)
+        self.assertEqual(result["Y"][0], 11)
+        self.assertEqual(result["Y"][20], 11)
+        self.assertEqual(result["Z"][0], 12)
+        self.assertEqual(result["Z"][20], 12)
+
+    def test_timeseries_sample_generator_fixed_initial_distribution(self):
+        model_one = TimeseriesSampleGenerator(
+            edges=[
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("X"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Y", -1), TimeAwareNodeReference("Y"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Z", -1), TimeAwareNodeReference("Z"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Z", -1), TimeAwareNodeReference("Y"), 5
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Y", -1), TimeAwareNodeReference("X"), 7
+                ),
             ],
+            random=lambda: 0,
+        )
+
+        model_one._initial_distribution_fn = lambda x: torch.tensor(
+            1, dtype=torch.float32
+        )

-        result, graph = MODEL_ONE.generate(100)
-        result_10_samples, _ = MODEL_ONE.generate(10)
+        result, graph = model_one.generate(100)
+        result_10_samples, _ = model_one.generate(10)
         self.assertEqual(len(result["X"]), 100)
         list_of_ground_truth_values = [
-            3.0000,
-            16.7000,
-            62.6300,
-            130.7070,
-            212.8923,
-            302.8484,
-            395.6479,
-            487.5262,
-            575.6727,
-            658.0551,
+            1.0000e00,
+            7.9000e00,
+            4.8410e01,
+            1.1224e02,
+            1.9117e02,
+            2.7870e02,
+            3.6978e02,
+            4.6053e02,
+            5.4803e02,
+            6.3016e02,
         ]
         for i in range(10):
             self.assertAlmostEqual(
                 result_10_samples["X"].tolist()[i],
                 list_of_ground_truth_values[i],
-                delta=0.0005,
+                delta=0.005,
             )

     def test_without_randomness(self):
-        MODEL = TimeseriesSampleGenerator(
-            initial_values={
-                "X": 1,
-                "Y": 1,
-            },
-            variables={
-                "alpha": 0.9,
-                "beta": 0.9,
-                "param_1": 5,
-            },
-            # generate the dependencies of variables on past values of themselves and other variables
-            generators={
-                "X": lambda t, i: i.X.t(-1) * i.alpha,
-                "Y": lambda t, i: i.Y.t(-1) * i.beta + i.param_1 * i.X.t(-1),
-            },
+        model = TimeseriesSampleGenerator(
             edges=[
-                SampleLaggedEdge("X", "X", 1),
-                SampleLaggedEdge("Y", "Y", 1),
-                SampleLaggedEdge("X", "Y", 1),
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("X"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Y", -1), TimeAwareNodeReference("Y"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("Y"), 5
+                ),
             ],
+            random=lambda: 0,
         )

-        result, graph = MODEL.generate(100)
+        model._initial_distribution_fn = lambda x: torch.tensor(1, dtype=torch.float32)
+
+        result, graph = model.generate(100)
         self.assertEqual(len(result["X"]), 100)
         self.assertEqual(len(result["Y"]), 100)
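The ground-truth list in test_timeseries_sample_generator_fixed_initial_distribution above can be checked by hand: with the noise fixed to 0 and every initial value forced to 1, the model is Z_t = 0.9*Z_{t-1}, Y_t = 0.9*Y_{t-1} + 5*Z_{t-1}, X_t = 0.9*X_{t-1} + 7*Y_{t-1}.

    x, y, z = [1.0], [1.0], [1.0]
    for t in range(1, 4):
        z.append(0.9 * z[t - 1])
        y.append(0.9 * y[t - 1] + 5 * z[t - 1])
        x.append(0.9 * x[t - 1] + 7 * y[t - 1])
    print([round(v, 2) for v in x])  # [1.0, 7.9, 48.41, 112.24] -- the first entries of the list above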
@@ -99,3 +148,77 @@ def test_without_randomness(self):
         self.assertAlmostEqual(result["Y"][1].item(), 5.9, places=2)
         self.assertAlmostEqual(result["X"][2].item(), 0.81, places=2)
         self.assertAlmostEqual(result["Y"][2].item(), 9.81, places=2)
+
+    def test_data_generator_multiple_autocorrelations(self):
+        set_random_seed(1)
+        model_multi_autocorr = TimeseriesSampleGenerator(
+            edges=[
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("X"), 0.4
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("X", -2), TimeAwareNodeReference("X"), 0.4
+                ),
+            ],
+            random=lambda: torch.tensor(0, dtype=torch.float32),
+        )
+
+        model_multi_autocorr._initial_distribution_fn = lambda x: torch.tensor(
+            1, dtype=torch.float32
+        )
+
+        result, graph = model_multi_autocorr.generate(100)
+        self.assertEqual(len(result["X"]), 100)
+        self.assertAlmostEqual(result["X"][0].item(), 1, places=2)
+        self.assertAlmostEqual(result["X"][1].item(), 0.8, places=2)
+        self.assertAlmostEqual(result["X"][2].item(), 0.72, places=2)
+        self.assertAlmostEqual(result["X"][3].item(), 0.608, places=2)
+
+    def test_generating_initial_values(self):
+        set_random_seed(1)
+        model = TimeseriesSampleGenerator(
+            edges=[
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("X"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Y", -1), TimeAwareNodeReference("Y"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("Y"), 5
+                ),
+            ],
+        )
+        model._initial_distribution_fn = lambda x: x
+        initial_values = model._calculate_initial_values()
+
+        self.assertAlmostEqual(float(initial_values["X"] ** 2), 5.2630, places=0)
+        self.assertAlmostEqual(float(initial_values["Y"] ** 2), 6602.2842, places=0)
+
+    def test_generating_initial_values_additional_variable(self):
+        set_random_seed(1)
+        model = TimeseriesSampleGenerator(
+            edges=[
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("X"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Y", -1), TimeAwareNodeReference("Y"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("Z", -1), TimeAwareNodeReference("Z"), 0.9
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("Y"), 5
+                ),
+                SampleEdge(
+                    TimeAwareNodeReference("X", -1), TimeAwareNodeReference("Z"), 5
+                ),
+            ],
+        )
+        model._initial_distribution_fn = lambda x: x
+        initial_values = model._calculate_initial_values()
+
+        self.assertAlmostEqual(float(initial_values["X"] ** 2), 5.2630, places=0)
+        # TODO: this is a bit of a hack, we have to fix numerical stability and then reduce the places
+        self.assertAlmostEqual(float(initial_values["Y"] ** 2), 6602.2842, places=-2)
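For reference, the expected variances in test_generating_initial_values can also be derived in closed form from the stationary-covariance equation Sigma = A Sigma A^T + I for the state (X_t, Y_t) with A = [[0.9, 0], [5, 0.9]]; the hand-derived numbers agree with the float32 values asserted above to within the places=0 / places=-2 tolerances the tests use:

    var_x = 1 / (1 - 0.9**2)                                        # ~5.263
    cov_xy = 0.9 * 5 * var_x / (1 - 0.9**2)                         # ~124.65
    var_y = (25 * var_x + 2 * 0.9 * 5 * cov_xy + 1) / (1 - 0.9**2)  # ~6602.4
    print(round(var_x, 4), round(var_y, 1))  # 5.2632 6602.4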