exact.py

"""
Module to compute exact lnZ of graphical model by enumeration of FVS and kacward solution

TODO:
"""

import torch
import networkx as nx
import numpy as np
from numba import jit


@jit()
def exact_config(D):
    config = np.empty((2 ** D, D))
    for i in range(2 ** D - 1, -1, -1):
        num = i
        for j in range(D - 1, -1, -1):
            config[i, D - j - 1] = num // 2 ** j
            if num - 2 ** j >= 0:
                num -= 2 ** j

    return config * 2.0 - 1.0


class exact:
    def __init__(self, G, J, h, beta, device, seed):
        self.G = G
        self.beta = beta
        self.device = device
        self.seed = seed
        self.dtype = torch.float64
        self.D = self.G.number_of_nodes()
        self.J = J
        # self.J = torch.from_numpy(nx.adjacency_matrix(self.G, np.arange(self.D)).todense()).to(self.dtype).to(
        #     self.device)
        self.h = h

    def FVS_decomposition(self):
        rng = np.random.RandomState(self.seed)
        G1 = self.G.copy()
        fvs = []
        while G1.number_of_nodes():
            flag = True
            while flag:
                temp = []
                flag = False
                for i in list(G1.node):
                    if G1.degree[i] <= 1:
                        temp.append(i)
                        flag = True
                if not flag:
                    break
                G1.remove_nodes_from(temp)
            if not G1.number_of_nodes():
                break
            degrees = np.array(G1.degree)
            degree_max = degrees[rng.choice(np.where(degrees[:, 1] == max(degrees[:, 1]))[0]), 0]
            fvs.append(degree_max)
            G1.remove_node(degree_max)

        tree_hierarchy, tree_order = self.tree_hierarchize(fvs)

        return fvs, tree_order, tree_hierarchy

    def tree_hierarchize(self, frozen_nodes):
        G1 = self.G.copy()
        G1.remove_nodes_from(frozen_nodes)
        ccs = list(nx.connected_components(G1))
        trees = {}.fromkeys(np.arange(len(ccs)))
        for key in trees.keys():
            trees[key] = []
        for l in range(len(ccs)):
            tree = self.G.subgraph(ccs[l]).copy()
            while tree.number_of_nodes():
                temp = []
                for j in list(tree.node):
                    if tree.number_of_nodes() == 1 or tree.number_of_nodes() == 2:
                        temp.append(j)
                        break
                    if tree.degree[j] == 1:
                        temp.append(j)
                tree.remove_nodes_from(temp)
                trees[l].append(temp)

        tree_order = []
        tree_hierarchy = []
        max_length = 0
        for key in trees.keys():
            l = len(trees[key])
            if l >= max_length:
                max_length = l

        for j in range(max_length):
            tree_hierarchy.append([])
            for key in trees.keys():
                if j < len(trees[key]):
                    tree_hierarchy[j] += trees[key][j]
            tree_order += tree_hierarchy[j]

        return tree_hierarchy, tree_order

    def effective_energy(self, sample, frozen_nodes, tree_order, tree_hierarchy):
        h = sample.matmul(self.J[frozen_nodes, :]) + self.h
        tree_energy = torch.zeros(sample.shape[0], device=self.device, dtype=sample.dtype)
        tree = torch.from_numpy(np.array(tree_order)).to(self.device)
        for layer in tree_hierarchy:
            index_matrix = torch.zeros(len(layer), 2, dtype=torch.int64,
                                       device=self.device)
            index_matrix[:, 0] = torch.arange(len(layer))
            if len(self.J[layer][:, tree].nonzero()) != 0:
                index_matrix.index_copy_(0,
                                         self.J[layer][:, tree].nonzero()[:, 0],
                                         self.J[layer][:, tree].nonzero())
            index = index_matrix[:, 1]
            root = tree[index]

            hpj = self.J[layer, root] + h[:, layer]
            hmj = -self.J[layer, root] + h[:, layer]

            tree_energy += -torch.log(2 * (torch.cosh(self.beta * hpj) *
                                           torch.cosh(self.beta * hmj)).sqrt()).sum(dim=1) / self.beta
            for k in range(len(root)):
                h[:, root[k]] += torch.log(torch.cosh(self.beta * hpj) /
                                           torch.cosh(self.beta * hmj))[:, k] / (2 * self.beta)
            tree = tree[len(layer):]

        batch = sample.shape[0]
        assert sample.shape[1] == len(frozen_nodes)
        J = self.J[frozen_nodes][:, frozen_nodes].to_sparse()
        fvs_energy = -torch.bmm(sample.view(batch, 1, len(frozen_nodes)),
                                torch.sparse.mm(J, sample.t()).t().view(batch, len(frozen_nodes), 1)).reshape(batch) / 2
        fvs_energy -= sample @ self.h[frozen_nodes]

        energy = fvs_energy + tree_energy

        return self.beta * energy

    '''
    def sum_up_tree(self, sample, J, frozen_set, tree1, tree_hierarchy):
        h = sample.matmul(J[frozen_set, :])
        fe_tree = torch.zeros(sample.shape[0], device=self.device, dtype=self.dtype)
        tree = torch.from_numpy(np.array(tree1)).to(self.device)
        for layer in tree_hierarchy:
            index_matrix = torch.zeros(len(layer), 2, dtype=torch.int64,
                                       device=self.device)
            index_matrix[:, 0] = torch.arange(len(layer))
            if len(J[layer][:, tree].nonzero()) != 0:
                index_matrix.index_copy_(0,
                                         J[layer][:, tree].nonzero()[:, 0],
                                         J[layer][:, tree].nonzero())
            index = index_matrix[:, 1]
            root = tree[index]

            hpj = J[layer, root] + h[:, layer]
            hmj = -J[layer, root] + h[:, layer]

            fe_tree += -torch.log(2 * (torch.cosh(self.beta * hpj) * torch.cosh(self.beta * hmj)).sqrt()).sum(
                dim=1) / self.beta
            for k in range(len(root)):
                h[:, root[k]] += torch.log(torch.cosh(self.beta * hpj) / torch.cosh(self.beta * hmj))[:, k] / (
                            2 * self.beta)
            tree = tree[len(layer):]

        return fe_tree
    '''

    def correlation(self):
        edges = list(self.G.edges)
        FVS, tree1, tree_hierarchy = self.FVS_decomposition()
        sample = torch.from_numpy(exact_config(len(FVS))).to(self.dtype).to(self.device)
        calc = sample.shape[0]
        effective_energy = self.effective_energy(sample, FVS, tree1, tree_hierarchy)
        lnZ = torch.logsumexp(-effective_energy, dim=0)
        config_prob = torch.exp(-effective_energy - lnZ)
        logZ = -effective_energy
        correlation = torch.empty(self.G.number_of_edges(), device=self.device, dtype=self.dtype)
        connected_correlation = torch.empty(self.G.number_of_edges(), device=self.device, dtype=self.dtype)
        sample_add = torch.ones([calc, 1], device=self.device, dtype=self.dtype)

        for i in range(self.G.number_of_edges()):
            m, n = edges[i][0], edges[i][1]
            frozen_nodes = list(FVS)
            if m not in frozen_nodes:
                frozen_nodes.append(m)
            if n not in frozen_nodes:
                frozen_nodes.append(n)
            frozen_tree_hierarchy, frozen_tree = self.tree_hierarchize(frozen_nodes)

            if len(frozen_nodes) - len(FVS) == 2:
                sample_prime = torch.empty([4, calc, len(frozen_nodes)],
                                           device=self.device, dtype=self.dtype)
                sample_prime[0] = torch.cat((sample, sample_add, sample_add), dim=1)
                sample_prime[1] = torch.cat((sample, -sample_add, -sample_add), dim=1)
                sample_prime[2] = torch.cat((sample, -sample_add, sample_add), dim=1)
                sample_prime[3] = torch.cat((sample, sample_add, -sample_add), dim=1)

                fe_tree_prime = torch.zeros([4, calc], device=self.device, dtype=self.dtype)
                for k in range(4):
                    fe_tree_prime[k] = self.effective_energy(sample_prime[k],
                                                             frozen_nodes,
                                                             frozen_tree,
                                                             frozen_tree_hierarchy)

                p11 = torch.exp(-fe_tree_prime[0] - lnZ).sum()
                p00 = torch.exp(-fe_tree_prime[1] - lnZ).sum()
                p01 = torch.exp(-fe_tree_prime[2] - lnZ).sum()
                p10 = torch.exp(-fe_tree_prime[3] - lnZ).sum()

                correlation[i] = p11 + p00 - p01 - p10
                connected_correlation[i] = p11 + p00 - p01 - p10 - (p11 + p10 - p01 - p00) * (p11 + p01 - p10 - p00)

            elif len(frozen_nodes) - len(FVS) == 1:
                sample_prime = torch.empty([2, calc, len(frozen_nodes)],
                                           device=self.device, dtype=self.dtype)
                if m in FVS:
                    FVS_node = m
                else:
                    FVS_node = n
                FVS_index = FVS.index(FVS_node)
                sample_prime[0] = torch.cat((sample, sample_add), dim=1)
                sample_prime[1] = torch.cat((sample, -sample_add), dim=1)

                fe_tree_prime = torch.zeros([2, calc], device=self.device, dtype=self.dtype)
                for k in range(2):
                    fe_tree_prime[k] = self.effective_energy(sample_prime[k],
                                                             frozen_nodes,
                                                             frozen_tree,
                                                             frozen_tree_hierarchy)
                p1 = torch.exp(-fe_tree_prime[0] - lnZ)
                p0 = torch.exp(-fe_tree_prime[1] - lnZ)
                correlation[i] = (sample[:, FVS_index] * (p1 - p0)).sum()
                connected_correlation[i] = (sample[:, FVS_index] * (p1 - p0)).sum() - \
                                           (p1 - p0).sum() * config_prob @ sample[:, FVS_index]

            else:
                correlation[i] = (sample[:, FVS.index(m)] * sample[:, FVS.index(n)] * config_prob).sum()
                connected_correlation[i] = (sample[:, FVS.index(m)] * sample[:, FVS.index(n)] * config_prob).sum() - \
                                           config_prob @ sample[:, FVS.index(m)] * config_prob @ sample[:, FVS.index(n)]

        return correlation, edges# , connected_correlation

    def magnetization(self):
        FVS, tree1, tree_hierarchy = self.FVS_decomposition()
        sample = torch.from_numpy(exact_config(len(FVS))).to(self.dtype).to(self.device)
        sample_size = sample.shape[0]
        sample_add = torch.ones([sample_size, 1],
                                dtype=self.dtype).to(self.device)
        FVS_energy = self.effective_energy(sample,
                                           FVS,
                                           tree1,
                                           tree_hierarchy)
        config_prob = torch.exp(-FVS_energy - torch.logsumexp(-FVS_energy, dim=0))

        sample_compeltion = torch.empty([sample_size, self.D],
                                        dtype=self.dtype).to(self.device)
        for i in range(self.D):
            if i not in FVS:
                frozen_nodes = list(FVS)
                frozen_nodes.append(i)
                tree_hierarchy, tree_order = self.tree_hierarchize(frozen_nodes)
                sample_positive = torch.cat((sample, sample_add), dim=1)
                sample_negative = torch.cat((sample, -sample_add), dim=1)

                energy_positive = self.effective_energy(sample_positive,
                                                        frozen_nodes,
                                                        tree_order,
                                                        tree_hierarchy)
                energy_negative = self.effective_energy(sample_negative,
                                                        frozen_nodes,
                                                        tree_order,
                                                        tree_hierarchy)
                p_positive = torch.exp(FVS_energy - energy_positive)
                p_negative = torch.exp(FVS_energy - energy_negative)
                sample_compeltion[:, i] = p_positive - p_negative
            else:
                sample_compeltion[:, i] = sample[:, FVS.index(i)]

        magnetization = config_prob @ sample_compeltion

        return magnetization

    def energy(self, sample, J, h):
        batch = sample.shape[0]
        D = sample.shape[1]
        J = J.to_sparse()
        energy = - torch.bmm(sample.view(batch, 1, D),
                             torch.sparse.mm(J, sample.t()).t().view(batch, D, 1)).reshape(batch) / 2 - sample @ h

        return energy

    def lnZ(self):
        config = torch.from_numpy(exact_config(self.D)).to(self.dtype).to(self.device)
        energy = self.energy(config, self.J, self.h)
        lnZ = torch.logsumexp(-self.beta * energy, dim=0)
        """
        config_prob = torch.exp(-self.beta * energy - lnZ)
        F = -lnZ / self.beta
        E = (energy * config_prob).sum()
        S = self.beta * E - F
        mag = config_prob @ config
        edges = list(self.G.edges)
        cor = torch.empty(len(edges), dtype=self.dtype, device=self.device)
        c_cor = torch.empty(len(edges), dtype=self.dtype, device=self.device)
        for i in range(len(edges)):
            m, n = edges[i]
            cor[i] = (config[:, m] * config[:, n] * config_prob).sum()
            c_cor[i] = (config[:, m] * config[:, n] * config_prob).sum() - mag[m] * mag[n]

        print(edges)
        print('cor:', cor)
        print('mag:', mag)
        print('connected_cor:', c_cor)
        """
        return lnZ.item()

    def lnZ_fvs(self):
        FVS, tree1, tree_hierarchy = self.FVS_decomposition()

        sample = torch.from_numpy(exact_config(len(FVS))).to(self.dtype).to(self.device)
        effective_energy = self.effective_energy(sample, FVS, tree1, tree_hierarchy)
        lnZ = torch.logsumexp(-effective_energy, dim=0)

        return lnZ.item()


class kacward:
    """
    Kac-Ward exact Ising
    See Theorem 1 of https://arxiv.org/abs/1011.3494
    """

    def __init__(self, L, J, beta):
        self.L = L
        self.beta = beta
        self.phi = np.array([[0., np.pi / 2, -np.pi / 2, np.nan],
                             [-np.pi / 2, 0.0, np.nan, np.pi / 2],
                             [np.pi / 2, np.nan, 0.0, -np.pi / 2],
                             [np.nan, -np.pi / 2, np.pi / 2, 0]
                             ])

        K = np.ones((self.L ** 2, 4)) * self.beta
        for i in range(self.L ** 2):
            for j in range(4):
                site = self.neighborsite(i, j)
                if site is not None:
                    K[i, j] *= J[i, site].item()
        self.lnZ = self.kacward_solution(K)

    def logcosh(self, x):
        xp = np.abs(x)
        if xp < 12:
            return np.log(np.cosh(x))
        else:
            return xp - np.log(2.)

    def neighborsite(self, i, n):
        """
        The coordinate system is geometrically left->right, down -> up
              y|
               |
               |
               |________ x
              (0,0)
        So as a definition, l means x-1, r means x+1, u means y+1, and d means y-1
        """
        x = i % self.L
        y = i // self.L  # y denotes
        site = None
        # ludr :
        if n == 0:
            if x - 1 >= 0:
                site = (x - 1) + y * self.L
        elif n == 1:
            if y + 1 < self.L:
                site = x + (y + 1) * self.L
        elif n == 2:
            if y - 1 >= 0:
                site = x + (y - 1) * self.L
        elif n == 3:
            if x + 1 < self.L:
                site = (x + 1) + y * self.L
        return site

    # K: ludr
    def kacward_solution(self, K):
        V = self.L ** 2  # number of vertex
        E = 2 * (V - self.L)  # number of edge

        D = np.zeros((2 * E, 2 * E), np.complex128)
        ij = 0
        ijdict = {}
        for i in range(V):
            for j in range(4):
                if self.neighborsite(i, j) is not None:
                    D[ij, ij] = np.tanh(K[i, j])
                    ijdict[(i, j)] = ij  # mapping for (site, neighbor) to index
                    ij += 1

        A = np.zeros((2 * E, 2 * E), np.complex128)
        for i in range(V):
            for j in range(4):
                for l in range(4):
                    k = self.neighborsite(i, j)
                    if (not np.isnan(self.phi[j, l])) and (k is not None) and (self.neighborsite(k, l) is not None):
                        ij = ijdict[(i, j)]
                        kl = ijdict[(k, l)]
                        A[ij, kl] = np.exp(1J * self.phi[j, l] / 2.)

        res = V * np.log(2)
        for i in range(V):
            for j in [1, 3]:  # only u, r to avoid double counting
                if self.neighborsite(i, j) is not None:
                    res += self.logcosh(K[i, j])
        _, logdet = np.linalg.slogdet(np.eye(2 * E, 2 * E, dtype=np.float64) - A @ D)
        res += 0.5 * logdet

        return res


"""
if __name__ == '__main__':
    import sys

    sys.path.append('..')

    beta = 1

    n = 10
    graph = nx.random_regular_graph(3, n)
    edges = list(graph.edges)
    '''
    L = 2
    graph = nx.grid_2d_graph(L, L, create_using=nx.Graph)
    graph = nx.Graph(graph)
    edges_2d = list(graph.edges)
    edges = [(i[0] * L + i[1], j[0] * L + j[1]) for i, j in edges_2d]
    n = L ** 2
    '''
    edges = np.unique(np.array([sorted(a) for a in edges]), axis=0)
    G = nx.Graph()
    G.add_nodes_from(np.arange(n))
    G.add_edges_from(edges)
    weight = torch.ones(len(edges), dtype=torch.float64,
                        requires_grad=True)  # torch.randn(len(edges), dtype=torch.float64) / np.sqrt(n)
    J = torch.zeros([G.number_of_nodes(), G.number_of_nodes()], dtype=torch.float64)
    J[np.array(edges).transpose()] = weight
    J = J + J.t()
    h = torch.randn(n, dtype=torch.float64, requires_grad=True)

    from tensor_network import Tensor_Network

    tn = Tensor_Network(n, edges, weight, beta * h, beta, seed=1, maxdim=32,
                        verbose=-1, Dmax=32, chi=100, node_type='raw')
    lnZ_tn = tn.contraction()
    (lnZ_tn / beta).backward()
    lnZ_tn = lnZ_tn / tn.n
    print('cor_tn:', weight.grad)
    print('mag_tn:', h.grad)

    exact1 = exact(G, J, h, beta, 'cpu', 1)
    lnZ_exact = exact1.lnZ()
    lnZ_FVS = exact1.lnZ_fvs()

    print(h)
    cor_FVS, edges, con_cor_FVS = exact1.correlation()
    print('cor_FVS:', cor_FVS)
    print('con_cor_FVS', con_cor_FVS)
    print('mag_FVS:', exact1.magnetization())

    print(lnZ_exact / n)
    print(lnZ_FVS / n)
    print("lnZ_tn = {:.15g}".format(lnZ_tn.item()))

    print(torch.allclose(cor_FVS, weight.grad))
"""