# Source code for gammagl.layers.conv.han_conv

# !/usr/bin/env python3
# -*- coding:utf-8 -*-

# @Time    : 2022/04/21 20:30
# @Author  : clear
# @FileName: hanconv.py
import tensorlayerx as tlx
from gammagl.layers.conv import MessagePassing
from gammagl.utils import segment_softmax
from gammagl.layers.conv import GATConv
from tensorlayerx.nn import Module, Sequential, ModuleDict, Linear, Tanh


class SemAttAggr(Module):
    """Semantic-level attention that fuses several stacked embeddings into one.

    Each stacked embedding is scored by a small network
    (Linear -> Tanh -> Linear to a single value). The scores are averaged
    over axis 1, soft-maxed over axis 0, and used as weights for a sum over
    axis 0.

    Parameters
    ----------
    in_size: int
        Feature size of the incoming embeddings (last axis of ``z``).
    hidden_size: int
        Width of the hidden layer of the scoring network.

    """

    def __init__(self, in_size, hidden_size):
        super().__init__()

        # Scoring network: W projection, tanh, then the vector q that maps to
        # one score (created with ``b_init=None``).
        self.project = Sequential(
            Linear(in_features=in_size, out_features=hidden_size),
            Tanh(),
            Linear(in_features=hidden_size, out_features=1, b_init=None),
        )

    def forward(self, z):
        """Return the attention-weighted sum of ``z`` over its first axis.

        Assumes ``z`` is laid out as (M, N, H): M stacked embeddings of N
        nodes with H features -- TODO confirm against callers.
        """
        per_node_score = self.project(z)                          # (M, N, 1)
        per_path_score = tlx.reduce_mean(per_node_score, axis=1)  # (M, 1)
        attn = tlx.softmax(per_path_score, axis=0)                # (M, 1)
        attn = tlx.expand_dims(attn, axis=-1)                     # (M, 1, 1), broadcasts over z
        weighted = attn * z                                       # (M, N, H)
        return tlx.reduce_sum(weighted, axis=0)                   # (N, H)



[docs]
class HANConv(MessagePassing):
    r"""
    The Heterogenous Graph Attention Operator from the
    `"Heterogenous Graph Attention Network"
    <https://arxiv.org/pdf/1903.07293.pdf>`_ paper.

    One :class:`GATConv` is created per edge type (node-level attention);
    the per-edge-type results that land on the same destination node type
    are then fused by :class:`SemAttAggr` (semantic-level attention).

    .. note::

        For an example of using HANConv, see `examples/han_trainer.py
        <https://github.com/BUPT-GAMMA/GammaGL/tree/main/examples/han>`_.

    Parameters
    ----------
    in_channels: int, dict[str, int]
        Size of each input sample per node type. A single int is applied
        to every node type listed in ``metadata[0]``.
    out_channels: int
        Size of each output sample (per attention head).
    metadata: tuple[list[str], list[tuple[str, str, str]]]
        The metadata
        of the heterogeneous graph, *i.e.* its node and edge types given
        by a list of strings and a list of string triplets, respectively.
        See :meth:`gammagl.data.HeteroGraph.metadata` for more
        information.
    heads: int, optional
        Number of multi-head-attentions.
        (default: :obj:`1`)
    negative_slope: float, optional
        LeakyReLU angle of the negative
        slope, forwarded to every per-edge-type :class:`GATConv`.
        (default: :obj:`0.2`)
    dropout_rate: float, optional
        Dropout probability forwarded to every per-edge-type
        :class:`GATConv`. (default: :obj:`0.5`)

    """

    def __init__(self,
                 in_channels,
                 out_channels,
                 metadata,
                 heads=1,
                 negative_slope=0.2,
                 dropout_rate=0.5):
        super().__init__()
        if not isinstance(in_channels, dict):
            in_channels = {node_type: in_channels for node_type in metadata[0]}
        self.in_channels = in_channels
        self.out_channels = out_channels
        self.metadata = metadata
        self.heads = heads
        self.negative_slope = negative_slope
        # Misspelled legacy attribute name, kept so existing readers of it
        # do not break.
        self.negetive_slop = negative_slope
        self.dropout_rate = dropout_rate

        # One GAT layer per edge type, keyed by 'src__rel__dst'.
        self.gat_dict = ModuleDict({})
        for edge_type in metadata[1]:
            src_type = edge_type[0]
            key = '__'.join(edge_type)
            self.gat_dict[key] = GATConv(in_channels=in_channels[src_type],
                                         out_channels=out_channels,
                                         heads=heads,
                                         negative_slope=negative_slope,
                                         dropout_rate=dropout_rate,
                                         concat=True)

        # concat=True is requested above, so the aggregator is sized for
        # out_channels * heads input features.
        self.sem_att_aggr = SemAttAggr(in_size=out_channels*heads,
                                       hidden_size=out_channels)

    def forward(self, x_dict, edge_index_dict, num_nodes_dict):
        r"""Run node-level then semantic-level attention.

        Parameters
        ----------
        x_dict: dict
            Node features keyed by node type.
        edge_index_dict: dict
            Edge indices keyed by ``(src_type, relation, dst_type)``
            triplets; every key must have been listed in ``metadata[1]``.
        num_nodes_dict: dict
            Number of nodes keyed by node type; the destination type's
            entry is passed to the per-edge-type :class:`GATConv`.

        Returns
        -------
        dict
            For every node type in ``x_dict``, the semantically aggregated
            embedding, or :obj:`None` when no edge type in
            ``edge_index_dict`` targets that node type.

        """
        # One bucket of per-edge-type outputs for every known node type.
        out_dict = {node_type: [] for node_type in x_dict}

        # node level attention aggregation
        for edge_type, edge_index in edge_index_dict.items():
            src_type, _, dst_type = edge_type
            conv = self.gat_dict['__'.join(edge_type)]
            out = conv(x_dict[src_type],
                       edge_index,
                       num_nodes=num_nodes_dict[dst_type])
            out_dict[dst_type].append(tlx.relu(out))

        # semantic attention aggregation
        for node_type, outs in out_dict.items():
            if not outs:
                # No incoming edge type for this node type: there is nothing
                # to stack, so report None instead of failing in tlx.stack.
                out_dict[node_type] = None
                continue
            out_dict[node_type] = self.sem_att_aggr(tlx.stack(outs))

        return out_dict

    def __repr__(self) -> str:
        return (f'{self.__class__.__name__}({self.out_channels}, '
                f'heads={self.heads})')