models

`navis.models.BayesianTraversalModel` #

Model for traversing a network starting with given seed nodes.

This model is a Bayes net version of navis.models.network_models.TraversalModel that propagates traversal probabilities through the network and converges to a distribution of time of traversal for each node, rather than stochastically sampling.

Unlike TraversalModel, this model should only be run once. Note alse that traversal_func should be a function returing probabilities of traversal, rather than a random boolean of traversal.

PARAMETER	DESCRIPTION
`edges`	DataFrame representing an edge list. Must minimally have a `source` and `target` column. TYPE: `pandas.DataFrame`
`seeds`	Seed nodes for traversal. Nodes that aren't found in `edges['source']` will be (silently) removed. TYPE: `iterable`
`weights`	Name of a column in `edges` used as weights. If not provided, all edges will be given a weight of 1. If using the default activation function the weights need to be between 0 and 1. TYPE: `str`
`max_steps`	`Limits the number of steps for each iteration.` TYPE: `int`
`traversal_func`	Function returning probability whether a given edge will be traversed or not in a given step. Must take numpy array (N, 1) of edge weights and return an array with probabilities of equal size. Defaults to [`navis.models.network_models.linear_activation_p`][] which will linearly scale probability of traversal from 0 to 100% between edges weights 0 to 0.3. TYPE: `callable` DEFAULT: `None`

Examples:

>>> from navis.models import BayesianTraversalModel
>>> import networkx as nx
>>> import numpy as np
>>> # Generate a random graph
>>> G = nx.fast_gnp_random_graph(1000, .2, directed=True)
>>> # Turn into edge list
>>> edges = nx.to_pandas_edgelist(G)
>>> # Add random edge weights
>>> edges['weight'] = np.random.random(edges.shape[0])
>>> # Initialize model
>>> model = BayesianTraversalModel(edges, seeds=list(G.nodes)[:10])
>>> # Run model
>>> res = model.run()
>>> # Get a summary
>>> model.summary.tail()
      layer_min  layer_max  layer_mean  layer_median
node
995           2          2        2.00             2
996           2          3        2.33             2
997           2          2        2.00             2
998           2          2        2.00             2
999           2          2        2.00             2

Above Graph was traversed quickly (3 steps max). Let's adjust the traversal function:

>>> from navis.models import linear_activation_p
>>> # Use a lower probability for activation
>>> def my_act(x):
...     return linear_activation_p(x, max_w=10)
>>> model = BayesianTraversalModel(edges, seeds=list(G.nodes)[:10],
...                                traversal_func=my_act)
>>> res = model.run()
>>> res.tail()
      layer_min  layer_max  layer_mean  layer_median
node
995           2          4       3.210           3.0
996           2          4       3.280           3.0
997           2          4       3.260           3.0
998           2          4       3.320           3.0
999           2          4       3.195           3.0

Source code in navis/models/network_models.py

class BayesianTraversalModel(TraversalModel):
    """Model for traversing a network starting with given seed nodes.

    This model is a Bayes net version of
    [`navis.models.network_models.TraversalModel`][] that propagates
    traversal probabilities through the network and converges to a
    distribution of time of traversal for each node, rather than
    stochastically sampling.

    Unlike `TraversalModel`, this model should only be run once.
    Note alse that `traversal_func` should be a function returing
    probabilities of traversal, rather than a random boolean of traversal.

    Parameters
    ----------
    edges :             pandas.DataFrame
                        DataFrame representing an edge list. Must minimally have
                        a `source` and `target` column.
    seeds :             iterable
                        Seed nodes for traversal. Nodes that aren't found in
                        `edges['source']` will be (silently) removed.
    weights :           str, optional
                        Name of a column in `edges` used as weights. If not
                        provided, all edges will be given a weight of 1. If using
                        the default activation function the weights need to be
                        between 0 and 1.
    max_steps :         int
                        Limits the number of steps for each iteration.
    traversal_func :    callable, optional
                        Function returning probability whether a given edge will be
                        traversed or not in a given step. Must take numpy array
                        (N, 1) of edge weights and return an array with
                        probabilities of equal size. Defaults to
                        [`navis.models.network_models.linear_activation_p`][]
                        which will linearly scale probability of traversal
                        from 0 to 100% between edges weights 0 to 0.3.

    Examples
    --------
    >>> from navis.models import BayesianTraversalModel
    >>> import networkx as nx
    >>> import numpy as np
    >>> # Generate a random graph
    >>> G = nx.fast_gnp_random_graph(1000, .2, directed=True)
    >>> # Turn into edge list
    >>> edges = nx.to_pandas_edgelist(G)
    >>> # Add random edge weights
    >>> edges['weight'] = np.random.random(edges.shape[0])
    >>> # Initialize model
    >>> model = BayesianTraversalModel(edges, seeds=list(G.nodes)[:10])
    >>> # Run model
    >>> res = model.run()
    >>> # Get a summary
    >>> model.summary.tail()                                    # doctest: +SKIP
          layer_min  layer_max  layer_mean  layer_median
    node
    995           2          2        2.00             2
    996           2          3        2.33             2
    997           2          2        2.00             2
    998           2          2        2.00             2
    999           2          2        2.00             2

    Above Graph was traversed quickly (3 steps max). Let's adjust the
    traversal function:

    >>> from navis.models import linear_activation_p
    >>> # Use a lower probability for activation
    >>> def my_act(x):
    ...     return linear_activation_p(x, max_w=10)
    >>> model = BayesianTraversalModel(edges, seeds=list(G.nodes)[:10],
    ...                                traversal_func=my_act)
    >>> res = model.run()
    >>> res.tail()                                              # doctest: +SKIP
          layer_min  layer_max  layer_mean  layer_median
    node
    995           2          4       3.210           3.0
    996           2          4       3.280           3.0
    997           2          4       3.260           3.0
    998           2          4       3.320           3.0
    999           2          4       3.195           3.0

    """

    def __init__(self,
                 *args,
                 traversal_func: Optional[Callable] = None,
                 **kwargs):
        """Initialize model."""
        super().__init__(*args, **kwargs)

        if isinstance(traversal_func, type(None)):
            self.traversal_func = linear_activation_p
        elif callable(traversal_func):
            self.traversal_func = traversal_func
        else:
            raise ValueError('`traversal_func` must be None or a callable')

    def make_summary(self) -> pd.DataFrame:
        """Generate summary."""
        if not self.has_results:
            logger.error('Must run simulation first.')

        cmfs = np.stack(self.results.cmf)
        layer_min = (cmfs != 0).argmax(axis=1)
        valid = np.any(cmfs != 0, axis=1)
        layer_max = (cmfs == 1.).argmax(axis=1)
        layer_max[~np.any(cmfs == 1., axis=1)] = cmfs.shape[1]
        layer_median = (cmfs >= .5).argmax(axis=1).astype(float)
        pmfs = np.diff(cmfs, axis=1, prepend=0.)
        layer_pmfs = pmfs * np.arange(pmfs.shape[1])
        layer_mean = np.sum(layer_pmfs, axis=1)

        summary = pd.DataFrame({
                'layer_min': layer_min + 1,
                'layer_max': layer_max + 1,
                'layer_mean': layer_mean + 1,
                'layer_median': layer_median + 1,
            }, index=self.results.node)

        # Discard nodes that are never activated
        summary = summary[valid]

        self._summary = summary
        return self._summary

    def run(self, **kwargs) -> pd.DataFrame:
        """Run model (single process)."""

        # For some reason this is required for progress bars in Jupyter to show
        print(' ', end='', flush=True)
        # For faster access, use the raw array
        edges = self.edges[[self.source, self.target, self.weights]].values
        id_type = self.edges[self.source].dtype
        # Transform weights to traversal probabilities
        edges[:, 2] = self.traversal_func(edges[:, 2])

        # Change node IDs into indices in [0, len(nodes))
        ids, edges_idx = np.unique(edges[:, :2], return_inverse=True)
        ids = ids.astype(id_type)
        edges_idx = edges_idx.reshape((edges.shape[0], 2))
        edges_idx = np.concatenate(
            (edges_idx, np.expand_dims(edges[:, 2], axis=1)),
            axis=1)

        cmfs = np.zeros((len(ids), self.max_steps), dtype=np.float64)
        seed_idx = np.searchsorted(ids, self.seeds)
        cmfs[seed_idx, :] = 1.
        changed = set(edges_idx[np.isin(edges_idx[:, 0], seed_idx), 1].astype(id_type))

        with config.tqdm(
                total=0,
                disable=config.pbar_hide,
                leave=config.pbar_leave,
                position=kwargs.get('position', 0)) as pbar:
            while len(changed):
                next_changed = []

                pbar.total += len(changed)
                pbar.refresh()

                for idx in changed:
                    cmf = cmfs[idx, :]
                    inbound = edges_idx[edges_idx[:, 1] == idx, :]
                    pre = inbound[:, 0].astype(np.int64)

                    # Traversal probability for each inbound edge at each time.
                    posteriors = cmfs[pre, :] * np.expand_dims(inbound[:, 2], axis=1)
                    # At each time, compute the probability that at least one inbound edge
                    # is traversed.
                    new_pmf = 1 - np.prod(1 - posteriors, axis=0)
                    new_cmf = cmf.copy()
                    # Offset the time-cumulative probability by 1 to account for traversal iteration.
                    # Use maximum of previous CMF as it is monotonic and to include fixed seed traversal.
                    new_cmf[1:] = np.maximum(cmf[1:], 1 - np.cumprod(1 - new_pmf[:-1]))
                    np.clip(new_cmf, 0., 1., out=new_cmf)

                    if np.allclose(cmf, new_cmf):
                        continue

                    cmfs[idx, :] = new_cmf

                    # Notify downstream nodes that they have changed next iteration.
                    post_idx = edges_idx[edges_idx[:, 0] == idx, 1].astype(id_type)
                    next_changed.extend(list(post_idx))

                pbar.update(len(changed))
                changed = set(next_changed)

        self.iterations = 1
        self.results = pd.DataFrame({'node': ids, 'cmf': list(cmfs)})
        return self.results

    def run_parallel(self, *args, **kwargs) -> None:
        warnings.warn(f"{self.__class__.__name__} should not be run in parallel. Falling back to run.")
        self.run(**kwargs)

`init` #

Initialize model.

Source code in navis/models/network_models.py

def __init__(self,
             *args,
             traversal_func: Optional[Callable] = None,
             **kwargs):
    """Initialize model."""
    super().__init__(*args, **kwargs)

    if isinstance(traversal_func, type(None)):
        self.traversal_func = linear_activation_p
    elif callable(traversal_func):
        self.traversal_func = traversal_func
    else:
        raise ValueError('`traversal_func` must be None or a callable')

`make_summary` #

Generate summary.

Source code in navis/models/network_models.py

def make_summary(self) -> pd.DataFrame:
    """Generate summary."""
    if not self.has_results:
        logger.error('Must run simulation first.')

    cmfs = np.stack(self.results.cmf)
    layer_min = (cmfs != 0).argmax(axis=1)
    valid = np.any(cmfs != 0, axis=1)
    layer_max = (cmfs == 1.).argmax(axis=1)
    layer_max[~np.any(cmfs == 1., axis=1)] = cmfs.shape[1]
    layer_median = (cmfs >= .5).argmax(axis=1).astype(float)
    pmfs = np.diff(cmfs, axis=1, prepend=0.)
    layer_pmfs = pmfs * np.arange(pmfs.shape[1])
    layer_mean = np.sum(layer_pmfs, axis=1)

    summary = pd.DataFrame({
            'layer_min': layer_min + 1,
            'layer_max': layer_max + 1,
            'layer_mean': layer_mean + 1,
            'layer_median': layer_median + 1,
        }, index=self.results.node)

    # Discard nodes that are never activated
    summary = summary[valid]

    self._summary = summary
    return self._summary

`run` #

Run model (single process).

Source code in navis/models/network_models.py

def run(self, **kwargs) -> pd.DataFrame:
    """Run model (single process)."""

    # For some reason this is required for progress bars in Jupyter to show
    print(' ', end='', flush=True)
    # For faster access, use the raw array
    edges = self.edges[[self.source, self.target, self.weights]].values
    id_type = self.edges[self.source].dtype
    # Transform weights to traversal probabilities
    edges[:, 2] = self.traversal_func(edges[:, 2])

    # Change node IDs into indices in [0, len(nodes))
    ids, edges_idx = np.unique(edges[:, :2], return_inverse=True)
    ids = ids.astype(id_type)
    edges_idx = edges_idx.reshape((edges.shape[0], 2))
    edges_idx = np.concatenate(
        (edges_idx, np.expand_dims(edges[:, 2], axis=1)),
        axis=1)

    cmfs = np.zeros((len(ids), self.max_steps), dtype=np.float64)
    seed_idx = np.searchsorted(ids, self.seeds)
    cmfs[seed_idx, :] = 1.
    changed = set(edges_idx[np.isin(edges_idx[:, 0], seed_idx), 1].astype(id_type))

    with config.tqdm(
            total=0,
            disable=config.pbar_hide,
            leave=config.pbar_leave,
            position=kwargs.get('position', 0)) as pbar:
        while len(changed):
            next_changed = []

            pbar.total += len(changed)
            pbar.refresh()

            for idx in changed:
                cmf = cmfs[idx, :]
                inbound = edges_idx[edges_idx[:, 1] == idx, :]
                pre = inbound[:, 0].astype(np.int64)

                # Traversal probability for each inbound edge at each time.
                posteriors = cmfs[pre, :] * np.expand_dims(inbound[:, 2], axis=1)
                # At each time, compute the probability that at least one inbound edge
                # is traversed.
                new_pmf = 1 - np.prod(1 - posteriors, axis=0)
                new_cmf = cmf.copy()
                # Offset the time-cumulative probability by 1 to account for traversal iteration.
                # Use maximum of previous CMF as it is monotonic and to include fixed seed traversal.
                new_cmf[1:] = np.maximum(cmf[1:], 1 - np.cumprod(1 - new_pmf[:-1]))
                np.clip(new_cmf, 0., 1., out=new_cmf)

                if np.allclose(cmf, new_cmf):
                    continue

                cmfs[idx, :] = new_cmf

                # Notify downstream nodes that they have changed next iteration.
                post_idx = edges_idx[edges_idx[:, 0] == idx, 1].astype(id_type)
                next_changed.extend(list(post_idx))

            pbar.update(len(changed))
            changed = set(next_changed)

    self.iterations = 1
    self.results = pd.DataFrame({'node': ids, 'cmf': list(cmfs)})
    return self.results

`navis.models.TraversalModel` #

Model for traversing a network starting with given seed nodes.

What this does:

Grab all already visited nodes (starting with seeds in step 1)
Find all downstream nodes of these
Probabilistically traverse based on the weight of the connecting edges
Add those newly visited nodes to the pool & repeat from beginning
Stop when every (connected) neuron was visited or we reached max_steps

PARAMETER	DESCRIPTION
`edges`	DataFrame representing an edge list. Must minimally have a `source` and `target` column. TYPE: `pandas.DataFrame`
`seeds`	Seed nodes for traversal. Nodes that aren't found in `edges['source']` will be (silently) removed. TYPE: `iterable`
`weights`	Name of a column in `edges` used as weights. If not provided, all edges will be given a weight of 1. If using the default activation function the weights need to be between 0 and 1. TYPE: `str` DEFAULT: `'weight'`
`max_steps`	`Limits the number of steps for each iteration.` TYPE: `int` DEFAULT: `15`
`traversal_func`	Function that determines whether a given edge will be traversed or not in a given step. Must take numpy array (N, 1) of edge weights and return an array with True/False of equal size. Defaults to [`navis.models.network_models.random_linear_activation_function`][] which will linearly scale probability of traversal from 0 to 100% between edges weights 0 to 0.3. TYPE: `callable` DEFAULT: `None`

Examples:

>>> from navis.models import TraversalModel
>>> import networkx as nx
>>> import numpy as np
>>> # Generate a random graph
>>> G = nx.fast_gnp_random_graph(1000, .2, directed=True)
>>> # Turn into edge list
>>> edges = nx.to_pandas_edgelist(G)
>>> # Add random edge weights
>>> edges['weight'] = np.random.random(edges.shape[0])
>>> # Initialize model
>>> model = TraversalModel(edges, seeds=list(G.nodes)[:10])
>>> # Run model on 2 cores
>>> model.run_parallel(n_cores=2, iterations=100)
>>> # Get a summary
>>> model.summary.tail()
      layer_min  layer_max  layer_mean  layer_median
node
995           2          2        2.00             2
996           2          3        2.33             2
997           2          2        2.00             2
998           2          2        2.00             2
999           2          2        2.00             2

Above Graph was traversed quickly (3 steps max). Let's adjust the traversal function:

>>> from navis.models import random_linear_activation_function
>>> # Use a lower probability for activation
>>> def my_act(x):
...     return random_linear_activation_function(x, max_w=10)
>>> model = TraversalModel(edges, seeds=list(G.nodes)[:10],
...                        traversal_func=my_act)
>>> res = model.run(iterations=100)
>>> res.tail()
      layer_min  layer_max  layer_mean  layer_median
node
995           2          4       3.210           3.0
996           2          4       3.280           3.0
997           2          4       3.260           3.0
998           2          4       3.320           3.0
999           2          4       3.195           3.0

Source code in navis/models/network_models.py

class TraversalModel(BaseNetworkModel):
    """Model for traversing a network starting with given seed nodes.

    What this does:

      1. Grab all already visited nodes (starting with `seeds` in step 1)
      2. Find all downstream nodes of these
      3. Probabilistically traverse based on the weight of the connecting edges
      4. Add those newly visited nodes to the pool & repeat from beginning
      5. Stop when every (connected) neuron was visited or we reached `max_steps`

    Parameters
    ----------
    edges :             pandas.DataFrame
                        DataFrame representing an edge list. Must minimally have
                        a `source` and `target` column.
    seeds :             iterable
                        Seed nodes for traversal. Nodes that aren't found in
                        `edges['source']` will be (silently) removed.
    weights :           str, optional
                        Name of a column in `edges` used as weights. If not
                        provided, all edges will be given a weight of 1. If using
                        the default activation function the weights need to be
                        between 0 and 1.
    max_steps :         int
                        Limits the number of steps for each iteration.
    traversal_func :    callable, optional
                        Function that determines whether a given edge will be
                        traversed or not in a given step. Must take numpy array
                        (N, 1) of edge weights and return an array with
                        True/False of equal size. Defaults to
                        [`navis.models.network_models.random_linear_activation_function`][]
                        which will linearly scale probability of traversal
                        from 0 to 100% between edges weights 0 to 0.3.

    Examples
    --------
    >>> from navis.models import TraversalModel
    >>> import networkx as nx
    >>> import numpy as np
    >>> # Generate a random graph
    >>> G = nx.fast_gnp_random_graph(1000, .2, directed=True)
    >>> # Turn into edge list
    >>> edges = nx.to_pandas_edgelist(G)
    >>> # Add random edge weights
    >>> edges['weight'] = np.random.random(edges.shape[0])
    >>> # Initialize model
    >>> model = TraversalModel(edges, seeds=list(G.nodes)[:10])
    >>> # Run model on 2 cores
    >>> model.run_parallel(n_cores=2, iterations=100)
    >>> # Get a summary
    >>> model.summary.tail()                                    # doctest: +SKIP
          layer_min  layer_max  layer_mean  layer_median
    node
    995           2          2        2.00             2
    996           2          3        2.33             2
    997           2          2        2.00             2
    998           2          2        2.00             2
    999           2          2        2.00             2

    Above Graph was traversed quickly (3 steps max). Let's adjust the
    traversal function:

    >>> from navis.models import random_linear_activation_function
    >>> # Use a lower probability for activation
    >>> def my_act(x):
    ...     return random_linear_activation_function(x, max_w=10)
    >>> model = TraversalModel(edges, seeds=list(G.nodes)[:10],
    ...                        traversal_func=my_act)
    >>> res = model.run(iterations=100)
    >>> res.tail()                                              # doctest: +SKIP
          layer_min  layer_max  layer_mean  layer_median
    node
    995           2          4       3.210           3.0
    996           2          4       3.280           3.0
    997           2          4       3.260           3.0
    998           2          4       3.320           3.0
    999           2          4       3.195           3.0

    """

    def __init__(self,
                 edges: pd.DataFrame,
                 seeds: Iterable[Union[str, int]],
                 source: str = 'source',
                 target: str = 'target',
                 weights: Optional[str] = 'weight',
                 max_steps: int = 15,
                 traversal_func: Optional[Callable] = None):
        """Initialize model."""
        super().__init__(edges=edges, source=source, target=target)

        if not weights:
            edges['weight'] = 1
            weights = 'weight'

        assert weights in edges.columns, f'"{weights}" must be column in edge list'

        # Remove seeds that don't exist
        self.seeds = edges[edges[self.source].isin(seeds)][self.source].unique()

        if len(self.seeds) == 0:
            raise ValueError('None of the seeds where among edge list sources.')

        self.weights = weights
        self.max_steps = max_steps

        if isinstance(traversal_func, type(None)):
            self.traversal_func = random_linear_activation_function
        elif callable(traversal_func):
            self.traversal_func = traversal_func
        else:
            raise ValueError('`traversal_func` must be None or a callable')

    @property
    def summary(self) -> pd.DataFrame:
        """Per-node summary."""
        return getattr(self, '_summary', self.make_summary())

    def __str__(self):
        return self.__repr__()

    def __repr__(self):
        s = f'{self.__class__}: {self.edges.shape[0]} edges; {self.n_nodes}' \
            f' unique nodes; {len(self.seeds)} seeds;' \
            f' traversal_func {self.traversal_func}.'
        if self.has_results:
            s += f' Model ran with {self.iterations} iterations.'
        else:
            s += ' Model has not yet been run.'
        return s

    def make_summary(self) -> pd.DataFrame:
        """Generate summary."""
        if not self.has_results:
            logger.error('Must run simulation first.')

        summary = self.results.groupby('node',
                                       as_index=False).steps.agg(['min',
                                                                  'max',
                                                                  'mean',
                                                                  'median'])

        summary.rename({'min': 'layer_min',
                        'mean': 'layer_mean',
                        'max': 'layer_max',
                        'median': 'layer_median'}, axis=1, inplace=True)

        self._summary = summary
        return self._summary

    def run(self, iterations: int = 100, return_iterations=False, **kwargs) -> pd.DataFrame:
        """Run model (single process).

        Use `.run_parallel` to use parallel processes.

        """
        # For some reason this is required for progress bars in Jupyter to show
        print(' ', end='', flush=True)
        # For faster access, use the raw array
        # Note: we're splitting the columns in case we have different datatypes
        # (e.g. int64 for IDs and float for weights)
        sources = self.edges[self.source].values
        targets = self.edges[self.target].values
        weights = self.edges[self.weights].values

        # For some reason the progress bar does not show unless we have a print here
        all_enc_nodes = None
        for it in config.trange(1, iterations + 1,
                                disable=config.pbar_hide,
                                leave=config.pbar_leave,
                                position=kwargs.get('position', 0)):
            # Set seeds as encountered in step 1
            enc_nodes = self.seeds
            enc_steps = np.repeat(1, len(self.seeds))
            if return_iterations:
                enc_it = np.repeat(it, len(self.seeds))

            # Start with all edges
            this_weights = weights
            this_sources = sources
            this_targets = targets
            for i in range(2, self.max_steps + 1):
                # Which edges have their presynaptic node already traversed?
                pre_trav = np.isin(this_sources, enc_nodes)
                # Among those, which edges have the postsynaptic node traversed?
                post_trav = np.isin(this_targets[pre_trav], enc_nodes)

                # Combine conditions to find edges where the presynaptic node
                # has been traversed but not the postsynaptic node
                pre_not_post = np.where(pre_trav)[0][~post_trav]
                out_targets = this_targets[pre_not_post]
                out_weights = this_weights[pre_not_post]

                # Drop edges that have already been traversed - speeds up things
                pre_and_post = np.where(pre_trav)[0][post_trav]
                this_targets = np.delete(this_targets, pre_and_post, axis=0)
                this_sources = np.delete(this_sources, pre_and_post, axis=0)
                this_weights = np.delete(this_weights, pre_and_post, axis=0)

                # Stop if we traversed the entire (reachable) graph
                if out_targets.size == 0:
                    break

                # Edges traversed in this round
                trav = self.traversal_func(out_weights)
                if not trav.sum():
                    continue

                trav_targets = out_targets[trav]

                # Keep track
                new_trav = np.unique(trav_targets)

                # Store results
                enc_nodes = np.concatenate((enc_nodes, new_trav))
                enc_steps = np.concatenate((enc_steps, np.repeat(i, len(new_trav))))
                if return_iterations:
                    enc_it = np.concatenate((enc_it, np.repeat(it, len(new_trav))))

            # Save this round of traversal
            if all_enc_nodes is None:
                all_enc_nodes = enc_nodes
                all_enc_steps = enc_steps
                if return_iterations:
                    all_enc_it = enc_it
            else:
                all_enc_nodes = np.concatenate((all_enc_nodes, enc_nodes))
                all_enc_steps = np.concatenate((all_enc_steps, enc_steps))
                if return_iterations:
                    all_enc_it = np.concatenate((all_enc_it, enc_it))

        self.iterations = iterations

        # Combine results into DataFrame
        self.results = pd.DataFrame()
        self.results['steps'] = all_enc_steps
        self.results['node'] = all_enc_nodes
        if return_iterations:
            self.results['iteration'] = all_enc_it

        return self.results

`summary: pd.DataFrame` `property` #

Per-node summary.

`init` #

Initialize model.

Source code in navis/models/network_models.py

def __init__(self,
             edges: pd.DataFrame,
             seeds: Iterable[Union[str, int]],
             source: str = 'source',
             target: str = 'target',
             weights: Optional[str] = 'weight',
             max_steps: int = 15,
             traversal_func: Optional[Callable] = None):
    """Initialize model."""
    super().__init__(edges=edges, source=source, target=target)

    if not weights:
        edges['weight'] = 1
        weights = 'weight'

    assert weights in edges.columns, f'"{weights}" must be column in edge list'

    # Remove seeds that don't exist
    self.seeds = edges[edges[self.source].isin(seeds)][self.source].unique()

    if len(self.seeds) == 0:
        raise ValueError('None of the seeds where among edge list sources.')

    self.weights = weights
    self.max_steps = max_steps

    if isinstance(traversal_func, type(None)):
        self.traversal_func = random_linear_activation_function
    elif callable(traversal_func):
        self.traversal_func = traversal_func
    else:
        raise ValueError('`traversal_func` must be None or a callable')

`make_summary` #

Generate summary.

Source code in navis/models/network_models.py

def make_summary(self) -> pd.DataFrame:
    """Generate summary."""
    if not self.has_results:
        logger.error('Must run simulation first.')

    summary = self.results.groupby('node',
                                   as_index=False).steps.agg(['min',
                                                              'max',
                                                              'mean',
                                                              'median'])

    summary.rename({'min': 'layer_min',
                    'mean': 'layer_mean',
                    'max': 'layer_max',
                    'median': 'layer_median'}, axis=1, inplace=True)

    self._summary = summary
    return self._summary

`run` #

Run model (single process).

Use .run_parallel to use parallel processes.

Source code in navis/models/network_models.py

def run(self, iterations: int = 100, return_iterations=False, **kwargs) -> pd.DataFrame:
    """Run model (single process).

    Use `.run_parallel` to use parallel processes.

    """
    # For some reason this is required for progress bars in Jupyter to show
    print(' ', end='', flush=True)
    # For faster access, use the raw array
    # Note: we're splitting the columns in case we have different datatypes
    # (e.g. int64 for IDs and float for weights)
    sources = self.edges[self.source].values
    targets = self.edges[self.target].values
    weights = self.edges[self.weights].values

    # For some reason the progress bar does not show unless we have a print here
    all_enc_nodes = None
    for it in config.trange(1, iterations + 1,
                            disable=config.pbar_hide,
                            leave=config.pbar_leave,
                            position=kwargs.get('position', 0)):
        # Set seeds as encountered in step 1
        enc_nodes = self.seeds
        enc_steps = np.repeat(1, len(self.seeds))
        if return_iterations:
            enc_it = np.repeat(it, len(self.seeds))

        # Start with all edges
        this_weights = weights
        this_sources = sources
        this_targets = targets
        for i in range(2, self.max_steps + 1):
            # Which edges have their presynaptic node already traversed?
            pre_trav = np.isin(this_sources, enc_nodes)
            # Among those, which edges have the postsynaptic node traversed?
            post_trav = np.isin(this_targets[pre_trav], enc_nodes)

            # Combine conditions to find edges where the presynaptic node
            # has been traversed but not the postsynaptic node
            pre_not_post = np.where(pre_trav)[0][~post_trav]
            out_targets = this_targets[pre_not_post]
            out_weights = this_weights[pre_not_post]

            # Drop edges that have already been traversed - speeds up things
            pre_and_post = np.where(pre_trav)[0][post_trav]
            this_targets = np.delete(this_targets, pre_and_post, axis=0)
            this_sources = np.delete(this_sources, pre_and_post, axis=0)
            this_weights = np.delete(this_weights, pre_and_post, axis=0)

            # Stop if we traversed the entire (reachable) graph
            if out_targets.size == 0:
                break

            # Edges traversed in this round
            trav = self.traversal_func(out_weights)
            if not trav.sum():
                continue

            trav_targets = out_targets[trav]

            # Keep track
            new_trav = np.unique(trav_targets)

            # Store results
            enc_nodes = np.concatenate((enc_nodes, new_trav))
            enc_steps = np.concatenate((enc_steps, np.repeat(i, len(new_trav))))
            if return_iterations:
                enc_it = np.concatenate((enc_it, np.repeat(it, len(new_trav))))

        # Save this round of traversal
        if all_enc_nodes is None:
            all_enc_nodes = enc_nodes
            all_enc_steps = enc_steps
            if return_iterations:
                all_enc_it = enc_it
        else:
            all_enc_nodes = np.concatenate((all_enc_nodes, enc_nodes))
            all_enc_steps = np.concatenate((all_enc_steps, enc_steps))
            if return_iterations:
                all_enc_it = np.concatenate((all_enc_it, enc_it))

    self.iterations = iterations

    # Combine results into DataFrame
    self.results = pd.DataFrame()
    self.results['steps'] = all_enc_steps
    self.results['node'] = all_enc_nodes
    if return_iterations:
        self.results['iteration'] = all_enc_it

    return self.results

`navis.models.linear_activation_p` #

Linear activation probability.

PARAMETER	DESCRIPTION
`w`	`(N, 1) array containing the edge weights.` TYPE: `np.ndarray`
`min_w`	Value of `w` at which probability of activation is 0%. TYPE: `float` DEFAULT: `0`
`max_w`	Value of `w` at which probability of activation is 100%. TYPE: `float` DEFAULT: `0.3`

RETURNS	DESCRIPTION
`np.ndarray`	Probability of activation for each edge.

Source code in navis/models/network_models.py

def linear_activation_p(
    w: np.ndarray,
    min_w: float = 0,
    max_w: float = .3,
) -> np.ndarray:
    """Linear activation probability.

    Parameters
    ----------
    w :     np.ndarray
            (N, 1) array containing the edge weights.
    min_w : float
            Value of `w` at which probability of activation is 0%.
    max_w : float
            Value of `w` at which probability of activation is 100%.

    Returns
    -------
    np.ndarray
            Probability of activation for each edge.

    """
    return np.clip((w - min_w) / (max_w - min_w), 0., 1.)

`navis.models.random_linear_activation_function` #

Random linear activation function.

PARAMETER	DESCRIPTION
`w`	`(N, 1) array containing the edge weights.` TYPE: `np.ndarray`
`min_w`	Value of `w` at which probability of activation is 0%. TYPE: `float` DEFAULT: `0`
`max_w`	Value of `w` at which probability of activation is 100%. TYPE: `float` DEFAULT: `0.3`

RETURNS	DESCRIPTION
`np.ndarray`	True or False values for each edge.

Source code in navis/models/network_models.py

def random_linear_activation_function(w: np.ndarray,
                                      min_w: float = 0,
                                      max_w: float = .3) -> np.ndarray:
    """Random linear activation function.

    Parameters
    ----------
    w :     np.ndarray
            (N, 1) array containing the edge weights.
    min_w : float
            Value of `w` at which probability of activation is 0%.
    max_w : float
            Value of `w` at which probability of activation is 100%.

    Returns
    -------
    np.ndarray
            True or False values for each edge.

    """
    return random_activation_function(w, lambda w: linear_activation_p(w, min_w, max_w))

models

navis.models.BayesianTraversalModel #

__init__ #

make_summary #

run #

navis.models.TraversalModel #

summary: pd.DataFrame property #

__init__ #

make_summary #

run #

navis.models.linear_activation_p #

navis.models.random_linear_activation_function #

`navis.models.BayesianTraversalModel` #

`init` #

`make_summary` #

`run` #

`navis.models.TraversalModel` #

`summary: pd.DataFrame` `property` #

`init` #

`make_summary` #

`run` #

`navis.models.linear_activation_p` #

`navis.models.random_linear_activation_function` #