genet.utils.graph_operations

`Filter(conditions=None, how=any, mixed_dtypes=True)` #

Helps filtering on specified attributes.

PARAMETER	DESCRIPTION
`conditions`	{'attribute_key': 'target_value'} or nested {'attribute_key': {'another_key': {'yet_another_key': 'target_value'}}}, where 'target_value' could be: single value, string, int, float, where the edge_data[key] == value (if mixed_dtypes==True and in case of set/list edge_data[key], value is in edge_data[key]) list or set of single values as above, where edge_data[key] in [value1, value2] (if mixed_dtypes==True and in case of set/list edge_data[key], set(edge_data[key]) & set([value1, value2]) is non-empty) for int or float values, two-tuple bound (lower_bound, upper_bound) where lower_bound <= edge_data[key] <= upper_bound (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in edge_data[key] satisfies lower_bound <= item <= upper_bound) function that returns a boolean given the value e.g. `def below_exclusive_upper_bound(value): return value < 100` (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in edge_data[key] returns True after applying function) TYPE: `Union[list, dict]` DEFAULT: `None`
`how`	The level of rigour used to match conditions. Defaults to any. - all: means all conditions need to be met - any: means at least one condition needs to be met TYPE: `Callable` DEFAULT: `any`
`mixed_dtypes`	If True, will consider the intersection of single values or lists of values in queried dictionary keys, e.g. as in simplified networks. Defaults to True. TYPE: `bool` DEFAULT: `True`

Source code in src/genet/utils/graph_operations.py

def __init__(
    self,
    conditions: Optional[
        Union[
            list,
            dict[
                str,
                Union[
                    dict,
                    str,
                    int,
                    float,
                    list,
                    set,
                    tuple,
                    Callable[[Union[str, int, float]], bool],
                ],
            ],
        ]
    ] = None,
    how: Callable = any,
    mixed_dtypes: bool = True,
):
    """Helps filtering on specified attributes.

    The constructor only stores its arguments; the conditions are evaluated later,
    against each attribute dictionary passed to `satisfies_conditions`.

    Args:
        conditions (Union[list, dict]):
            A single condition dictionary, a list of condition dictionaries, or None
            (None means every item satisfies the filter).
            A condition is {'attribute_key': 'target_value'} or nested
            {'attribute_key': {'another_key': {'yet_another_key': 'target_value'}}},
            where 'target_value' could be:

            - single value, string, int, float, where the edge_data[key] == value
            (if mixed_dtypes==True and in case of set/list edge_data[key], value is in edge_data[key])

            - list or set of single values as above, where edge_data[key] in [value1, value2]
            (if mixed_dtypes==True and in case of set/list edge_data[key],
            set(edge_data[key]) & set([value1, value2]) is non-empty)

            - for int or float values, two-tuple bound (lower_bound, upper_bound) where
            lower_bound <= edge_data[key] <= upper_bound
            (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in
            edge_data[key] satisfies lower_bound <= item <= upper_bound)

            - function that takes the stored value and returns a boolean, e.g.
            ```python
            def below_exclusive_upper_bound(value):
                return value < 100
            ```
            (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in
            edge_data[key] returns True after applying function)

        how (Callable, optional):
            The level of rigour used to match conditions. Defaults to any.
            It is called with the list of per-condition results, so it is only used
            when `conditions` is a list.
            - all: means all conditions need to be met
            - any: means at least one condition needs to be met

        mixed_dtypes (bool, optional):
            If True, will consider the intersection of single values or lists of values in queried dictionary keys, e.g. as in simplified networks.
            Defaults to True.
    """

    self.conditions = conditions
    self.how = how
    self.mixed_dtypes = mixed_dtypes

`conditions = conditions` `instance-attribute` #

`how = how` `instance-attribute` #

`mixed_dtypes = mixed_dtypes` `instance-attribute` #

`evaluate_condition(condition, data_dict)` #

Source code in src/genet/utils/graph_operations.py

def evaluate_condition(self, condition, data_dict):
    """Checks whether `data_dict` satisfies a single, possibly nested, condition dictionary.

    Keys of `condition` that are missing from `data_dict` are skipped silently, as not all
    items are expected to carry every attribute. Every key that is present is evaluated in
    turn and each evaluation replaces the previous result, so for a condition with several
    keys the returned value reflects the last key found in `data_dict`. To combine several
    attribute checks explicitly, pass a list of single-key conditions to the filter and
    choose `how`.

    When `self.mixed_dtypes` is True and the stored value is a list or set, the condition is
    met if at least one of the stored items meets it.

    Args:
        condition (dict):
            {'attribute_key': target} where target is a nested condition dictionary,
            a single value (int, float, str), a list/set of accepted values,
            a two-tuple (lower_bound, upper_bound) or a callable returning a boolean.
            Targets of any other type are ignored.
        data_dict (dict): Attribute dictionary to test.

    Raises:
        AttributeError: If a tuple target does not have exactly two items.

    Returns:
        Result of the check; False if no key of `condition` could be evaluated.
    """
    satisfies = False
    for key, val in condition.items():
        if key not in data_dict:
            # not all items are required to have the attribute
            continue
        data = data_dict[key]

        if isinstance(val, dict):
            # nested condition, keep descending
            satisfies = self.evaluate_condition(val, data)
            continue

        # stored value is a collection and any one of its items may satisfy the condition
        match_any_item = isinstance(data, (list, set)) and self.mixed_dtypes

        if isinstance(val, (int, float, str)):
            satisfies = (val in data) if match_any_item else (data == val)
        elif isinstance(val, (list, set)):
            if match_any_item:
                # always assign, so that a non-match is not masked by an earlier key's result
                satisfies = bool(set(data) & set(val))
            else:
                # value is one of the items in the list
                satisfies = data in val
        elif isinstance(val, tuple):
            if len(val) != 2:
                raise AttributeError(
                    "Tuple defining the bound has to be a two-tuple: (lower_bound, upper_bound)"
                )
            lower_bound, upper_bound = val
            if match_any_item:
                # assign rather than return, so that remaining keys are still evaluated
                satisfies = any(lower_bound <= item <= upper_bound for item in data)
            else:
                try:
                    # value is within the bound
                    satisfies = lower_bound <= data <= upper_bound
                except TypeError:
                    # types not suitable for this condition cannot satisfy it
                    satisfies = False
        elif callable(val):
            if match_any_item:
                # assign rather than return, so that remaining keys are still evaluated
                satisfies = any(val(item) for item in data)
            else:
                # value is a function of the stored data that returns a bool
                satisfies = val(data)
    return satisfies

`satisfies_conditions(data_dict)` #

Source code in src/genet/utils/graph_operations.py

def satisfies_conditions(self, data_dict):
    """Tells whether `data_dict` passes the conditions stored on this filter.

    - no conditions (None): every item passes
    - a single condition dictionary: the result of evaluating that condition
    - a list of condition dictionaries: each one is evaluated and the list of results
      is reduced with `self.how` (e.g. `any` or `all`)

    Conditions of any other type yield None.
    """
    conditions = self.conditions
    if conditions is None:
        return True
    if isinstance(conditions, dict):
        return self.evaluate_condition(conditions, data_dict)
    if isinstance(conditions, list):
        outcomes = [self.evaluate_condition(single, data_dict) for single in conditions]
        return self.how(outcomes)
    # unsupported conditions type: fall through and return None

`apply_function_to_attributes(iterator, function, location)` #

Source code in src/genet/utils/graph_operations.py

def apply_function_to_attributes(iterator, function, location):
    """Applies `function` to each attribute dictionary and stores the result under `location`.

    `iterator` yields (item id, attribute dictionary) pairs. The returned dictionary maps
    item id to `{location: function(attributes)}`. Items for which `function` raises a
    KeyError are left out: not every item is expected to carry the data the function needs.
    """
    results = {}
    for identifier, attributes in iterator:
        try:
            value = function(attributes)
        except KeyError:
            # item is not relevant for this function, skip it quietly
            continue
        results[identifier] = {location: value}
    return results

`apply_mapping_to_attributes(iterator, mapping, location)` #

Source code in src/genet/utils/graph_operations.py

def apply_mapping_to_attributes(iterator, mapping, location):
    """Translates the value stored under `location` of each item through `mapping`.

    `iterator` yields (item id, attribute dictionary) pairs. The value is read from, and the
    mapped value reported under, the same `location` key. Items without the `location` key,
    or whose value is not a key of `mapping`, are left out of the result.

    A warning is logged if a non-empty mapping produced no changes at all.
    """
    mapped = {}
    for identifier, attributes in iterator:
        try:
            mapped[identifier] = {location: mapping[attributes[location]]}
        except KeyError:
            # either the item has no such attribute or its value is not being mapped
            continue

    if mapping and not mapped:
        logging.warning(
            f"Mapping attributes resulted in 0 changes. Ensure your location variable: {location} exists "
            f"as keys in the input dictionaries. Only dictionaries with location={location} keys will be "
            "mapped."
        )
    return mapped

`apply_to_attributes(iterator, to_apply, location)` #

Source code in src/genet/utils/graph_operations.py

def apply_to_attributes(iterator, to_apply, location):
    """Dispatches to the mapping or the function variant depending on the type of `to_apply`.

    A dictionary is treated as a value mapping (`apply_mapping_to_attributes`); anything else
    is treated as a function of the attribute dictionary (`apply_function_to_attributes`).
    """
    handler = (
        apply_mapping_to_attributes
        if isinstance(to_apply, dict)
        else apply_function_to_attributes
    )
    return handler(iterator, to_apply, location)

`build_attribute_dataframe(iterator, keys, index_name=None)` #

Builds a pandas.DataFrame from data in iterator.

PARAMETER	DESCRIPTION
`iterator`	iterator or list of tuples (id, dictionary data with keys of interest). TYPE: `Iterable`
`keys`	keys to extract data from. Can be a string, list or dictionary/list of dictionaries if accessing nested dictionaries, for example on using dictionaries see `get_attribute_data_under_key` docstring. TYPE: `Union[list, dict, str]`
`index_name`	Name of returned dataframe index. Defaults to None. TYPE: `Optional[str]` DEFAULT: `None`

RETURNS	DESCRIPTION
`DataFrame`	pd.DataFrame: Attribute dataframe.

Source code in src/genet/utils/graph_operations.py

def build_attribute_dataframe(
    iterator: Iterable, keys: Union[list, dict, str], index_name: Optional[str] = None
) -> pd.DataFrame:
    """Builds a pandas.DataFrame from data in iterator.

    One column is built per key and the columns are outer-joined on the item ids, so items
    missing some of the keys still get a row.

    Args:
        iterator (Iterable): iterator or list of tuples (id, dictionary data with keys of interest).
        keys (Union[list, dict, str]):
            keys to extract data from.
            Can be a string, a dictionary (if accessing nested dictionaries), or a list of strings and/or dictionaries.
            For examples of using dictionaries see `get_attribute_data_under_key` docstring.
        index_name (Optional[str], optional): Name of returned dataframe index. Defaults to None.

    Returns:
        pd.DataFrame: Attribute dataframe.
    """
    df = pd.DataFrame()
    if isinstance(keys, (str, dict)):
        # A lone key, plain or nested, is a one-element list of keys. Iterating a dictionary
        # directly would only yield its top-level keys and lose the nested path.
        keys = [keys]
    if len(keys) > 1:
        # the data is read once per key, so a one-shot iterator has to be materialised
        iterator = list(iterator)
    for key in keys:
        if isinstance(key, dict):
            # consolidate nestedness to get a name for the column
            name = dict_support.dict_to_string(key)
        else:
            name = key

        attribute_data = get_attribute_data_under_key(iterator, key)
        col_series = pd.Series(attribute_data, dtype=pd_helpers.get_pandas_dtype(attribute_data))
        col_series.name = name

        df = df.merge(pd.DataFrame(col_series), left_index=True, right_index=True, how="outer")
    if index_name is not None:
        df.index = df.index.set_names([index_name])
    return df

`consolidate_link_indices(left, right)` #

Changes the link indexing in right to match left on modes stored on the links and resolves clashing link ids if they don't match.

This method assumes that the node ids of left vs right have already been consolidated (see consolidate_node_indices, which consolidates node ids).

PARAMETER	DESCRIPTION
`left`	GeNet network. TYPE: `Network`
`right`	GeNet network that needs to be updated to match left network. TYPE: `Network`

RETURNS	DESCRIPTION
`Network`	Updated `right` network. TYPE: `Network`

Source code in src/genet/utils/graph_operations.py

def consolidate_link_indices(left: Network, right: Network) -> Network:
    """Changes the link indexing in right to match left on modes stored on the links and resolves clashing link ids if they don't match.

    This method assumes that the node ids of left vs right have already been consolidated (see `consolidate_node_indices`, which consolidates node ids).

    Links are compared on their `from` node, `to` node and (order-insensitive) `modes`.
    `right` is modified in place (links are removed, reindexed and re-added) and returned.

    Args:
        left (Network): GeNet network.
        right (Network): GeNet network that needs to be updated to match left network.

    Returns:
        Network: Updated `right` network.
    """

    # Builds an order-insensitive string key from a list of modes.
    # NOTE(review): `.sort()` sorts the passed list in place; if that list is the same object
    # that is stored on the link, the link's modes get reordered as a side effect - confirm.
    def sort_and_hash(modes_list):
        modes_list.sort()
        return "_".join(modes_list)

    # Looks up the multi edge index recorded for a link id in the graph's link id mapping.
    def extract_multindex(link_id, graph):
        return graph.link_id_mapping[link_id]["multi_edge_idx"]

    # Callback for the groupby on (from, to) below. Returns the whole group when:
    # - any row matched on both sides (no missing values) has a different link id or a different
    #   multi index in left and right, or
    # - no row is matched on both sides but left and right share a multi index value.
    # Otherwise falls through and returns None.
    def get_edges_with_clashing_ids(group):
        if (
            (group.dropna()["link_id_right"] != group.dropna()["link_id_left"])
            | (group.dropna()["multi_idx_right"] != group.dropna()["multi_idx_left"])
        ).any():
            return group
        elif group.dropna().empty:
            clashing_multi_idx = set(group["multi_idx_right"].dropna()) & set(
                group["multi_idx_left"].dropna()
            )
            if clashing_multi_idx:
                return group

    # Row callback: remembers the data of the right link under the id of the left link it matched.
    def append_data_to_overlapping_links_data(row):
        if not row.empty:
            overlapping_links_data[row["link_id_left"]] = right.link(row["link_id_right"])

    # Row callback: remembers the data of a right link that has no counterpart in left,
    # under its own (right) link id.
    def append_data_to_unique_clashing_links_data(row):
        if not row.empty:
            unique_clashing_links_data[row["link_id_right"]] = right.link(row["link_id_right"])

    # Now consolidate link ids, we do a similar dataframe join as for nodes but on edge data and nodes the edges
    # connect instead of spatial
    left_df = left.link_attribute_data_under_keys(["modes", "from", "to", "id"], index_name="left")
    # extract multi index and hash modes
    left_df["multi_idx"] = left_df["id"].apply(lambda x: extract_multindex(x, left))
    left_df["modes"] = left_df["modes"].apply(lambda x: sort_and_hash(x))
    left_df = left_df.rename(columns={"id": "link_id"})
    right_df = right.link_attribute_data_under_keys(
        ["modes", "from", "to", "id"], index_name="right"
    )
    # extract multi index and hash modes
    right_df["multi_idx"] = right_df["id"].apply(lambda x: extract_multindex(x, right))
    right_df["modes"] = right_df["modes"].apply(lambda x: sort_and_hash(x))
    right_df = right_df.rename(columns={"id": "link_id"})

    # Outer join: rows found on one side only have missing values in the other side's columns.
    # After reset_index the named indices become the "left" and "right" columns.
    df = left_df.reset_index().merge(
        right_df.reset_index(),
        on=["modes", "from", "to"],
        how="outer",
        suffixes=("_left", "_right"),
    )

    # In the dataframe above we have combined to compare edges which have the same from and to nodes and the same modes
    # on the edge. Remember these graphs have multi edges, there could be more than one edge between two nodes.
    # There are a few different scenarios here, if edges have found a match on mode, and nodes
    # - link ids match and multi indices match
    # - link ids match but the multi indices dont match
    # - link ids dont match but multi indices do match
    # - neither link ids or multi indices match, but the edge is the same in terms of mode and from/to nodes
    # Similarly, there are a few scenarios if the edges didn't find a match
    # - remaining (unmatched) link ids for edges in right are unique, don't clash with left,
    # they will remain as they are
    # - link ids clash with left

    # remove all edges that match and clash, we will re-add them later
    # this includes multiedges of edges that may have matched only one multiedge or no multi edges at all, i.e. the
    # graphs that multi edges that are completely separate but clash in the multi index
    # ---this is to consolidate the multindices across left and right
    clashing_overlapping_edges = (
        df.groupby(["from", "to"]).apply(get_edges_with_clashing_ids).reset_index(drop=True)
    )
    # store the edge data from right
    overlapping_links_data: dict = {}
    unique_clashing_links_data: dict = {}
    if not clashing_overlapping_edges.empty:
        # rows present in both networks: keep right's data, keyed by left's link id
        clashing_overlapping_edges[
            clashing_overlapping_edges["link_id_right"].notna()
            & clashing_overlapping_edges["link_id_left"].notna()
        ].apply(lambda row: append_data_to_overlapping_links_data(row), axis=1)
        # rows present in right only: keep right's data, keyed by right's link id
        clashing_overlapping_edges[
            clashing_overlapping_edges["link_id_right"].notna()
            & clashing_overlapping_edges["link_id_left"].isna()
        ].apply(lambda row: append_data_to_unique_clashing_links_data(row), axis=1)

        # the data has been saved above; the links are re-added further down
        right.remove_links(set(clashing_overlapping_edges["link_id_right"].dropna()))

    # resolve clashing link ids for links in right which don't exist in left
    clashing_right_link_ids = set(df[df["left"].isna()]["link_id_right"]) & set(
        df["link_id_left"].dropna()
    )
    # some link ids could have been picked up before and deleted, only consider the ones which don't overlap
    clashing_right_link_ids = set(right.link_id_mapping.keys()) & clashing_right_link_ids
    if clashing_right_link_ids:
        # generate the index avoiding indices from left, that way they're unique across both graphs
        # (the list comprehension is used only for its side effect of reindexing)
        [
            right.reindex_link(
                link, right.generate_index_for_edge(set(left.link_id_mapping.keys()))
            )
            for link in clashing_right_link_ids
        ]

    # Impose link id and multi index if from left on right, basically add the links we deleted from right but using
    # left's indexing, keep the data from right using the dictionaries where we saved them
    for left_link_id, data in overlapping_links_data.items():
        u, v = left.link_id_mapping[left_link_id]["from"], left.link_id_mapping[left_link_id]["to"]
        multi_idx = left.link_id_mapping[left_link_id]["multi_edge_idx"]
        right.add_link(left_link_id, u, v, multi_idx, data, silent=True)

    # Re-add the removed links that only exist in right, under indices unused by either network
    for right_link_id, data in unique_clashing_links_data.items():
        u, v = data["from"], data["to"]
        # generate unique multi index, unique in both left and right
        right_multi_idx = set()
        if right.graph.has_edge(u, v):
            right_multi_idx = set(right.graph[u][v].keys())
        left_multi_idx = set()
        if left.graph.has_edge(u, v):
            left_multi_idx = set(left.graph[u][v].keys())
        existing_multi_edge_ids = right_multi_idx | left_multi_idx
        # smallest integer, counting up from 1, that is not yet used as a multi index between u and v
        multi_idx = next(filterfalse(set(existing_multi_edge_ids).__contains__, count(1)))
        # keep the original link id unless it is already taken in either network
        if right_link_id in set(left.link_id_mapping.keys()) | set(right.link_id_mapping.keys()):
            right_link_id = right.generate_index_for_edge(set(left.link_id_mapping.keys()))
        right.add_link(right_link_id, u, v, multi_idx, data, silent=True)

    logging.info("Finished consolidating link indexing between the two graphs")
    return right

`consolidate_node_indices(left, right)` #

Changes the node indexing in right to match left spatially and resolves clashing node ids if they don't match spatially.

The two networks need to be in matching coordinate systems.

PARAMETER	DESCRIPTION
`left`	GeNet network. TYPE: `Network`
`right`	GeNet network that needs to be updated to match left network. TYPE: `Network`

RAISES	DESCRIPTION
`RuntimeError`	Nodes must be spatially unique.

RETURNS	DESCRIPTION
`Network`	Updated `right` network. TYPE: `Network`

Source code in src/genet/utils/graph_operations.py

def consolidate_node_indices(left: Network, right: Network) -> Network:
    """Re-indexes the nodes of `right` so that they agree with `left`.

    Nodes are matched spatially, on their `s2_id`. A node of `right` that sits in the same
    place as a node of `left` takes the id of the `left` node. A node of `right` that has no
    spatial match but whose id is already used in `left` is given a newly generated id.
    `right` is modified in place and returned.

    The two networks need to be in matching coordinate systems.

    Args:
        left (Network): GeNet network.
        right (Network): GeNet network that needs to be updated to match left network.

    Raises:
        RuntimeError: Nodes must be spatially unique, in both networks.

    Returns:
        Network: Updated `right` network.
    """

    def spatial_ids(network, side):
        # s2 ids of all nodes in the network, named and indexed ready for the join below
        ids = network.node_attribute_data_under_key("s2_id")
        if len(ids) != len(ids.unique()):
            raise RuntimeError(
                "There is more than one node in one place in the network you are trying to add"
            )
        ids.name = "s2_id"
        ids.index = ids.index.set_names([side])
        return ids

    # right is extracted and validated first, then left
    right_ids = spatial_ids(right, "right")
    left_ids = spatial_ids(left, "left")

    # one row per spatial location, with the node id on either side (missing if absent there)
    right_frame = pd.DataFrame(right_ids).reset_index()
    left_frame = pd.DataFrame(left_ids).reset_index()
    s2_id_df = right_frame.merge(left_frame, on="s2_id", how="outer")

    # ids of right-only nodes that are already in use by (spatially different) nodes of left
    right_only_ids = set(s2_id_df[s2_id_df["left"].isna()]["right"])
    matched_left_ids = set(s2_id_df["left"].dropna())
    for node in right_only_ids & matched_left_ids:
        # generate the index avoiding indices from left, that way they're unique across both graphs
        right.reindex_node(node, right.generate_index_for_node([i for i, a in left.nodes()]))

    # finally change node ids for overlapping nodes
    # TODO check that a new index is not being generated if an index exists in right but hasnt been overwritten yet
    differing = s2_id_df.dropna()[s2_id_df["right"] != s2_id_df["left"]]
    for idx in differing.index:
        right.reindex_node(s2_id_df.loc[idx, "right"], s2_id_df.loc[idx, "left"])

    logging.info("Finished consolidating node indexing between the two graphs")
    return right

`convert_list_of_link_ids_to_network_nodes(network, link_ids)` #

Extracts nodes corresponding to link ids in the order of given link_ids list.

Useful for extracting network routes.

PARAMETER	DESCRIPTION
`network`	GeNet network. TYPE: `Network`
`link_ids`	Link IDs whose nodes are to be extracted. TYPE: `list`

RETURNS	DESCRIPTION
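`list`	List of paths, each path being a list of node IDs; a new path is started wherever consecutive links do not connect. TYPE: `list`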

Source code in src/genet/utils/graph_operations.py

def convert_list_of_link_ids_to_network_nodes(network: Network, link_ids: list) -> list:
    """Turns an ordered list of link ids into the node paths those links trace out.

    Consecutive links are chained into one path for as long as each link starts at the node
    where the previous one ended. A link that does not connect starts a new path.
    Useful for extracting network routes.

    Args:
        network (Network): GeNet network.
        link_ids (list): Link IDs whose nodes are to be extracted.

    Returns:
        list: List of paths, each path being a list of node IDs. An empty `link_ids` gives `[[]]`.
    """
    segments: list = []
    current: list = []
    for link_id in link_ids:
        endpoints = network.link_id_mapping[link_id]
        start, end = endpoints["from"], endpoints["to"]
        if current and current[-1] == start:
            # link continues the path being built
            current.append(end)
            continue
        if current:
            # link is disconnected from the path so far: close that path off
            segments.append(current)
        current = [start, end]
    segments.append(current)
    return segments

`extract_on_attributes(iterator, conditions, how=any, mixed_dtypes=True)` #

Extracts ids in iterator based on values of attributes attached to the items.

Fails silently, assumes not all items have those attributes. In the case where the attributes stored are a list or set, as in a simplified network (where some items hold sets of values and others hold single values), the condition is deemed satisfied by default if at least one of the stored values satisfies it. To disable this behaviour set mixed_dtypes to False.

PARAMETER	DESCRIPTION
`iterator`	list or set of two-tuples: (id of the item, attributes of the item) TYPE: `Iterator[tuple[str, dict]]`
`conditions`	{'attribute_key': 'target_value'} or nested {'attribute_key': {'another_key': {'yet_another_key': 'target_value'}}}, where 'target_value' could be: single value, string, int, float, where the edge_data[key] == value (if mixed_dtypes==True and in case of set/list edge_data[key], value is in edge_data[key]) list or set of single values as above, where edge_data[key] in [value1, value2] (if mixed_dtypes==True and in case of set/list edge_data[key], set(edge_data[key]) & set([value1, value2]) is non-empty) for int or float values, two-tuple bound (lower_bound, upper_bound) where lower_bound <= edge_data[key] <= upper_bound (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in edge_data[key] satisfies lower_bound <= item <= upper_bound) function that returns a boolean given the value e.g. `def below_exclusive_upper_bound(value): return value < 100` (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in edge_data[key] returns True after applying function) TYPE: `Union[list, dict]`
`how`	The level of rigour used to match conditions. Defaults to any. - all: means all conditions need to be met - any: means at least one condition needs to be met TYPE: `Callable` DEFAULT: `any`
`mixed_dtypes`	If True, will consider the intersection of single values or lists of values in queried dictionary keys, e.g. as in simplified networks. Defaults to True. TYPE: `bool` DEFAULT: `True`

RETURNS	DESCRIPTION
`list`	list of ids in input iterator satisfying conditions TYPE: `list`

Source code in src/genet/utils/graph_operations.py

def extract_on_attributes(
    iterator: Iterator[tuple[str, dict]],
    conditions: Union[list, dict],
    how: Callable = any,
    mixed_dtypes: bool = True,
) -> list:
    """Extracts ids in iterator based on values of attributes attached to the items.

    Fails silently, assumes not all items have those attributes.
    Where the stored attribute is a list or set, as in a simplified network
    (where some items hold sets of values and others hold single values),
    the condition is deemed satisfied if at least one of the stored values satisfies it.
    To disable this behaviour set mixed_dtypes to False.

    Args:
        iterator (Iterator[tuple[str, dict]]): list or set of two-tuples: (id of the item, attributes of the item)
        conditions (Union[list, dict]):
            A condition dictionary or a list of them.
            A condition is {'attribute_key': 'target_value'} or nested
            {'attribute_key': {'another_key': {'yet_another_key': 'target_value'}}},
            where 'target_value' could be:

            - single value, string, int, float, where the edge_data[key] == value
            (if mixed_dtypes==True and in case of set/list edge_data[key], value is in edge_data[key])

            - list or set of single values as above, where edge_data[key] in [value1, value2]
            (if mixed_dtypes==True and in case of set/list edge_data[key],
            set(edge_data[key]) & set([value1, value2]) is non-empty)

            - for int or float values, two-tuple bound (lower_bound, upper_bound) where
            lower_bound <= edge_data[key] <= upper_bound
            (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in
            edge_data[key] satisfies lower_bound <= item <= upper_bound)

            - function that returns a boolean given the value e.g.
            ```python
            def below_exclusive_upper_bound(value):
                return value < 100
            ```
            (if mixed_dtypes==True and in case of set/list edge_data[key], at least one item in
            edge_data[key] returns True after applying function)

        how (Callable, optional):
            The level of rigour used to match conditions. Defaults to any.
            - all: means all conditions need to be met
            - any: means at least one condition needs to be met

        mixed_dtypes (bool, optional):
            If True, will consider the intersection of single values or lists of values in queried dictionary keys, e.g. as in simplified networks.
            Defaults to True.

    Returns:
        list: list of ids in input iterator satisfying conditions
    """
    attribute_filter = Filter(conditions, how, mixed_dtypes)
    matching_ids = []
    for item_id, attributes in iterator:
        if attribute_filter.satisfies_conditions(attributes):
            matching_ids.append(item_id)
    return matching_ids

`find_shortest_path_link(link_attribute_dictionary, modes=None)` #

Finds link that is deemed quickest if freespeed present.

Relies on (link) id being stored on edge data (default if using genet Network's add_link or add_edge methods or reading data using genet's Network methods.) Throws a RuntimeError if a link id is not found.

PARAMETER	DESCRIPTION
`link_attribute_dictionary`	Link attribute dictionary, e.g. `{multi_index_id: {'length': 10}}`. TYPE: `dict`
`modes`	If passed and there is more than one possible edge that has the same length and speed, will also check if there is a link with modes that match exactly with `modes`. Defaults to None. TYPE: `Optional[Union[list, str]]` DEFAULT: `None`

RAISES	DESCRIPTION
`RuntimeError`	Link ID must exist.

RETURNS	DESCRIPTION
`str`	Shortest path link ID TYPE: `str`

Source code in src/genet/utils/graph_operations.py

def find_shortest_path_link(
    link_attribute_dictionary: dict, modes: Optional[Union[list, str]] = None
) -> str:
    """Picks one link id out of the (multi) links stored between two nodes.

    With a single link there is nothing to choose: its id is used.
    With several links:

    - if `modes` is given, the link whose set of modes equals `modes` exactly is chosen
      (the last such link if there are several);
    - otherwise, or if no link matched on modes, the link with the highest `freespeed` is
      chosen (the first one encountered in case of a tie). Links without `freespeed` are not considered.

    Relies on (link) id being stored on edge data (default if using genet Network's `add_link` or `add_edge` methods or reading data using genet's Network methods.)

    Args:
        link_attribute_dictionary (dict): Link attribute dictionary, e.g. `{multi_index_id: {'length': 10}}`.
        modes (Optional[Union[list, str]], optional):
            Mode or list of modes a link should match exactly to be preferred.
            Defaults to None.

    Raises:
        RuntimeError: No link id could be selected.

    Returns:
        str: Shortest path link ID
    """
    if len(link_attribute_dictionary) > 1:
        chosen = None
        candidates = link_attribute_dictionary.values()

        if modes:
            wanted_modes = [modes] if isinstance(modes, str) else modes
            for attributes in candidates:
                if "modes" in attributes and set(attributes["modes"]) == set(wanted_modes):
                    chosen = attributes["id"]

        if chosen is None:
            # no preference expressed or met through modes, fall back on the fastest link
            best_freespeed = None
            for attributes in candidates:
                if "freespeed" not in attributes:
                    continue
                freespeed = attributes["freespeed"]
                if best_freespeed is None or freespeed > best_freespeed:
                    best_freespeed = freespeed
                    chosen = attributes["id"]
    else:
        only_key = list(link_attribute_dictionary.keys())[0]
        chosen = link_attribute_dictionary[only_key]["id"]

    if chosen is None:
        raise RuntimeError("Failed to find suitable link_id for shortest path")
    return chosen

`get_attribute_data_under_key(iterator, key)` #

Returns all data stored under key in attribute dictionaries for iterators yielding (index, attribute_dictionary).

Inherits index from the iterator.

PARAMETER	DESCRIPTION
`iterator`	list or iterator yielding (index, attribute_dictionary) TYPE: `Iterable`
`key`	A string, e.g. 'modes'. A dictionary, if accessing nested information, e.g. `{'attributes': 'osm:way:name'}` or `{'attributes': {'osm:way:name': 'text'}}`. TYPE: `Union[str, dict]`

RETURNS	DESCRIPTION
`dict`	dictionary where keys are indices and values are data stored under the key TYPE: `dict`

Source code in src/genet/utils/graph_operations.py

def get_attribute_data_under_key(iterator: Iterable, key: Union[str, dict]) -> dict:
    """Collects the data found under `key` for every (index, attribute_dictionary) pair of the iterator.

    The indices of the output are those yielded by the iterator.
    Items whose attribute dictionary does not hold the requested key are left out of the output.

    Args:
        iterator (Iterable): list or iterator yielding (index, attribute_dictionary)
        key (Union[str, dict]):
            A string, e.g. 'modes'.
            A dictionary, if accessing nested information, e.g. `{'attributes': 'osm:way:name'}` or `{'attributes': {'osm:way:name': 'text'}}`.
            If a dictionary holds several entries that match, the data of the last matching entry is kept.

    Returns:
        dict: dictionary where keys are indices and values are data stored under the key
    """
    collected: dict = {}

    def _store_match(index, attribs, wanted):
        # plain key: direct lookup in the current attribute level
        if not isinstance(wanted, dict):
            if wanted in attribs:
                collected[index] = attribs[wanted]
            return

        # dictionary key: each entry describes one step down into the nested attributes
        for outer, inner in wanted.items():
            if outer not in attribs:
                continue
            nested = attribs[outer]
            if isinstance(inner, dict):
                _store_match(index, nested, inner)
            elif inner in nested:
                collected[index] = nested[inner]

    for index, attribs in iterator:
        _store_match(index, attribs, key)

    return collected

`get_attribute_schema(iterator, data=False)` #

Source code in src/genet/utils/graph_operations.py

def get_attribute_schema(iterator, data=False):
    """Builds a tree of the (nested) attribute keys found in the attribute dictionaries of the iterator.

    Each distinct key becomes a node under the node of the dictionary it was found in.
    Keys holding dictionaries are descended into, so nested keys become children of their parent key.

    Args:
        iterator: list or iterator yielding (index, attribute_dictionary)
        data (bool, optional):
            If True, nodes of keys holding non-dictionary values also gather the set of values seen under that key
            in their `values` attribute (items of lists and sets are added individually). Defaults to False.

    Returns:
        Node: root node, named "attribute", of the tree of attribute keys.
    """

    def find_child(parent, name):
        # first child of `parent` with the given name, None if there isn't one
        return next((child for child in parent.children if child.name == name), None)

    def as_value_set(value) -> set:
        # lists and sets contribute their items, anything else counts as a single value
        return set(value) if isinstance(value, (list, set)) else {value}

    def append_to_tree(d: dict, parent):
        for k, v in d.items():
            node = find_child(parent, k)
            if isinstance(v, dict):
                if node is None:
                    node = Node(k, parent=parent)
                append_to_tree(v, node)
            elif node is None:
                if data:
                    Node(k, parent=parent, values=as_value_set(v))
                else:
                    Node(k, parent=parent)
            elif data:
                # the existing node may have been created from a nested dictionary, in which case it
                # holds no `values` yet; start from an empty set rather than failing on the attribute
                node.values = getattr(node, "values", set()) | as_value_set(v)

    root = Node("attribute")

    for _id, _attribs in iterator:
        append_to_tree(_attribs, root)

    return root

`parse_leaf(leaf)` #

PARAMETER	DESCRIPTION
`leaf`	Leaf node. TYPE: `Node`

RETURNS	DESCRIPTION
`Union[str, dict]`	str or dictionary with string key value pairs, for use as keys to extraction methods.

Source code in src/genet/utils/graph_operations.py

def parse_leaf(leaf: Node) -> Union[str, dict]:
    """Turns a leaf node into the key describing where it sits in the (nested) attributes.

    Args:
        leaf (Node): Leaf node.

    Returns:
        Union[str, dict]: str or dictionary with string key value pairs, for use as keys to extraction methods.
    """
    if leaf.depth <= 1:
        # not nested: the name of the leaf is the key
        return leaf.name

    # index 0 of the path is skipped (presumably the root of the schema tree - confirm against caller);
    # the next two names form the innermost pair and any names further along are nested at the leaf
    lineage = leaf.path
    nested_key = {lineage[1].name: lineage[2].name}
    for deeper in lineage[3:]:
        nested_key = dict_support.nest_at_leaf(nested_key, deeper.name)
    return nested_key

`render_tree(root, data=False)` #

Source code in src/genet/utils/graph_operations.py

def render_tree(root, data=False):
    """Prints the tree under `root`, one node per line.

    Args:
        root: Root node of the tree to print.
        data (bool, optional):
            If True, nodes that have a `values` attribute are printed with up to five of those values.
            Defaults to False.
    """
    for prefix, _, node in RenderTree(root):
        line = f"{prefix!s}{node.name!s}"
        if hasattr(node, "values") and data:
            # only a sample of the values is shown to keep the output readable
            sample = list(node.values)[:5]
            line = f"{line}: {sample!s}"
        print(line)

genet.utils.graph_operations

Filter(conditions=None, how=any, mixed_dtypes=True) #

conditions = conditions instance-attribute #

how = how instance-attribute #

mixed_dtypes = mixed_dtypes instance-attribute #

evaluate_condition(condition, data_dict) #

satisfies_conditions(data_dict) #

apply_function_to_attributes(iterator, function, location) #

apply_mapping_to_attributes(iterator, mapping, location) #

apply_to_attributes(iterator, to_apply, location) #

build_attribute_dataframe(iterator, keys, index_name=None) #

consolidate_link_indices(left, right) #

consolidate_node_indices(left, right) #

convert_list_of_link_ids_to_network_nodes(network, link_ids) #

extract_on_attributes(iterator, conditions, how=any, mixed_dtypes=True) #

find_shortest_path_link(link_attribute_dictionary, modes=None) #

get_attribute_data_under_key(iterator, key) #

get_attribute_schema(iterator, data=False) #

parse_leaf(leaf) #

render_tree(root, data=False) #

`Filter(conditions=None, how=any, mixed_dtypes=True)` #

`conditions = conditions` `instance-attribute` #

`how = how` `instance-attribute` #

`mixed_dtypes = mixed_dtypes` `instance-attribute` #

`evaluate_condition(condition, data_dict)` #

`satisfies_conditions(data_dict)` #

`apply_function_to_attributes(iterator, function, location)` #

`apply_mapping_to_attributes(iterator, mapping, location)` #

`apply_to_attributes(iterator, to_apply, location)` #

`build_attribute_dataframe(iterator, keys, index_name=None)` #

`consolidate_link_indices(left, right)` #

`consolidate_node_indices(left, right)` #

`convert_list_of_link_ids_to_network_nodes(network, link_ids)` #

`extract_on_attributes(iterator, conditions, how=any, mixed_dtypes=True)` #

`find_shortest_path_link(link_attribute_dictionary, modes=None)` #

`get_attribute_data_under_key(iterator, key)` #

`get_attribute_schema(iterator, data=False)` #

`parse_leaf(leaf)` #

`render_tree(root, data=False)` #