directed_structures.py

from __future__ import absolute_import
import numpy as np
import itertools
from sys import hexversion
if hexversion >= 0x3080000:
    from functools import cached_property
elif hexversion >= 0x3060000:
    from backports.cached_property import cached_property
else:
    cached_property = property

from radix import bitarray_to_int
import networkx as nx
from utilities import stringify_in_set, stringify_in_list, partsextractor
from more_itertools import chunked

from functools import lru_cache, total_ordering
from adjmat_class import AdjMat

@lru_cache(maxsize=5)
def empty_digraph(n):
    baseg = nx.DiGraph()
    baseg.add_nodes_from(range(n))
    return baseg

# def transitive_closure(adjmat):
#     n=len(adjmat)
#     closure_mat = np.bitwise_or(np.asarray(adjmat, dtype=bool),np.identity(n, dtype=bool))
#     while n>0:
#         n = np.floor_divide(n,2)
#         next_closure_mat = np.matmul(closure_mat, closure_mat)
#         if np.array_equal(closure_mat,next_closure_mat):
#             break
#         else:
#             closure_mat=next_closure_mat
#     return np.bitwise_and(closure_mat,np.invert(np.identity(len(adjmat), dtype=bool)))
#
# def transitive_reduction(adjmat):
#     # n = len(adjmat)
#     closure_mat=transitive_closure(adjmat)
#     # closure_minus_identity = np.bitwise_and(transitive_closure(adjmat),np.invert(np.identity(n, dtype=bool)))
#     return np.bitwise_and(closure_mat, np.invert(np.matmul(closure_mat, closure_mat)))


@total_ordering
class DirectedStructure:
    """
    This class is NOT meant to encode mDAGs. As such, we do not get into an implementation of predecessors or successors here.
    """
    def __init__(self, numeric_edge_list, n):
        # assert all(isinstance(v, int) for v in
        #            set(itertools.chain.from_iterable(numeric_edge_list))), 'Somehow we have a non integer node!'+stringify_in_set(
        #     map(stringify_in_list, numeric_edge_list))
        self.number_of_visible = n
        self.visible_nodes = list(range(self.number_of_visible))
        self.as_set_of_tuples = set(map(tuple, numeric_edge_list))
        self.edge_list = sorted(set(self.as_set_of_tuples))
        self.as_tuples = tuple(self.edge_list)
        self.number_of_edges = len(self.edge_list)
        if self.edge_list:
            assert max(map(max, self.edge_list)) + 1 <= self.number_of_visible, "More nodes referenced than expected."


    @property
    def as_edges_array(self):
        return np.asarray(self.edge_list, dtype=int).reshape((-1,2)) #No sorting or deduplication.

    @cached_property
    def as_bit_square_matrix(self):
        r = np.zeros((self.number_of_visible, self.number_of_visible), dtype=bool)
        r[tuple(self.as_edges_array.T)] = True
        return r

    @cached_property
    def nodes_with_no_parents(self):
        return np.flatnonzero(np.logical_not(self.as_bit_square_matrix.any(axis=0)))

    @cached_property
    def nodes_with_no_children(self):
        return np.flatnonzero(np.logical_not(self.as_bit_square_matrix.any(axis=1)))

    @cached_property
    def as_bit_square_matrix_plus_eye(self):
        #Used for computing parents_plus
        return np.bitwise_or(self.as_bit_square_matrix, np.identity(self.number_of_visible, dtype=bool))


    @cached_property
    def observable_parentsplus_list(self):
        return list(map(frozenset, map(np.flatnonzero, self.as_bit_square_matrix_plus_eye.T)))

    @cached_property
    def adjMat(self):
        return AdjMat(self.as_bit_square_matrix)

    @cached_property
    def as_integer(self):
        return bitarray_to_int(self.as_bit_square_matrix)

    def permute_bit_square_matrix(self, perm):
        return self.as_bit_square_matrix[perm][:, perm]

    @cached_property
    def bit_square_matrix_permutations(self):
        return tuple(self.permute_bit_square_matrix(perm) for perm in map(list,itertools.permutations(self.visible_nodes)))

    @cached_property
    def as_integer_permutations(self):
        return tuple(bitarray_to_int(ba) for ba in self.bit_square_matrix_permutations)

    @cached_property
    def as_unlabelled_integer(self):
        return min(self.as_integer_permutations)

    @classmethod
    def directedStructure_from_bit_square_matrix(cls, bit_square_matrix):
        return cls(np.vstack(np.nonzero(bit_square_matrix)).T.tolist(), len(bit_square_matrix))

    @cached_property
    def equivalents_under_symmetry(self):
        return [self.directedStructure_from_bit_square_matrix(bitmat) for bitmat in
                np.take(self.bit_square_matrix_permutations,
                        np.unique(self.as_integer_permutations, return_index=True, axis=0)[-1],
                        axis=0)]

    @cached_property
    def as_string(self):
        return stringify_in_set(
            str(partsextractor(self.visible_nodes, i)) + ':' + stringify_in_list(partsextractor(self.visible_nodes, v))
                # for i, v in nx.to_dict_of_lists(self.DirectedStructure).items()
                for i, v in enumerate(map(np.flatnonzero, self.as_bit_square_matrix))
                )

    def __str__(self):
        return self.as_string

    def __repr__(self):
        return self.as_string

    def __hash__(self):
        return int(self.as_integer)

    def __eq__(self, other):
        """Whether the Monomial is equal to the ``other`` Monomial."""
        return self.__hash__() == other.__hash__()

    def __lt__(self, other):
        """Whether the Monomial is lexicographically smaller than the ``other``
        Monomial.
        """
        return self.__hash__() < other.__hash__()

    # @cached_property
    # def parents_of_for_supports_analysis(self):
    #     return list(map(np.flatnonzero, self.as_bit_square_matrix.T))

    #I'm hoping to eventually transition away from networkx entirely.
    @cached_property
    def as_networkx_graph(self):
        g = empty_digraph(self.number_of_visible).copy()
        g.add_edges_from(self.edge_list)
        return g

    def can_D1_minimally_simulate_D2(D1, D2):
        """
        D1 and D2 are networkx.DiGraph objects.
        We say that D1 can 'simulate' D2 if the edges of D2 are contained within those of D1.
        """
        # return D1.number_of_edges == D2.number_of_edges + 1 and D2.as_set_of_tuples.issubset(D1.as_set_of_tuples)
        if D1.number_of_edges == D2.number_of_edges + 1:
            return np.logical_or(np.logical_not(D2.as_bit_square_matrix), D1.as_bit_square_matrix).all()
        return False


    def is_D1_strictly_above_D2(D1, D2):
        """
        D1 and D2 are networkx.DiGraph objects.
        We say that D1 can 'simulate' D2 if the edges of D2 are contained within those of D1.
        """
        # return D1.number_of_edges > D2.number_of_edges and D2.as_set_of_tuples.issubset(D1.as_set_of_tuples)
        return np.logical_or(np.logical_not(D2.as_bit_square_matrix), D1.as_bit_square_matrix).all()


class LabelledDirectedStructure(DirectedStructure):
    """
    This class is NOT meant to encode mDAGs. As such, we do not get into an implementation of predecessors or successors here.
    """
    def __init__(self, variable_names, edge_list):
        self.variable_names = tuple(variable_names)
        self.variable_names_as_frozenset = frozenset(self.variable_names)
        self.number_of_variables = len(variable_names)
        assert self.number_of_variables == len(self.variable_names_as_frozenset), "A variable name appears in duplicate."

        implicit_variable_names = set(itertools.chain.from_iterable(edge_list))
        self.edge_list_with_variable_names = sorted(set(edge_list), key=str)
        if not implicit_variable_names.issubset(self.variable_names_as_frozenset):
            self.edge_list_with_variable_names = [edge for edge in self.edge_list_with_variable_names if self.variable_names_as_frozenset.issuperset(edge)]

        self.variables_as_range = tuple(range(self.number_of_variables))
        self.translation_dict = dict(zip(self.variable_names, self.variables_as_range))

        # self.variable_are_range = False
        # if all(isinstance(v, int) for v in self.variable_names):
        #     if np.array_equal(self.variable_names, self.variables_as_range):
        #         self.variable_are_range = True
        #         self.edge_list = self.edge_list_with_variable_names
        # if not self.variable_are_range:
        self.edge_list = list(chunked(partsextractor(self.translation_dict, tuple(
                    itertools.chain.from_iterable(self.edge_list_with_variable_names))), 2))

        assert set(self.variables_as_range).issuperset(itertools.chain.from_iterable(self.edge_list)), 'The translation to integers has failed.'
        super().__init__(self.edge_list, self.number_of_variables)

    @cached_property
    def as_string(self):
        return stringify_in_set(
            str(partsextractor(self.variable_names, i)) + ':' + stringify_in_list(partsextractor(self.variable_names, v))
                # for i, v in nx.to_dict_of_lists(self.DirectedStructure).items()
                for i, v in enumerate(map(np.flatnonzero, self.as_bit_square_matrix))
                )

    @cached_property
    def as_networkx_graph_arbitrary_names(self):
        g=nx.DiGraph()
        g.add_nodes_from(self.variable_names)
        g.add_edges_from(self.edge_list_with_variable_names)
        return g

    def __str__(self):
        return self.as_string

    def __repr__(self):
        return self.as_string