Source code for autogllight.nas.space.graph_nas_macro

import torch
import typing as _typ
import torch.nn as nn
import torch.nn.functional as F

from .base import BaseSpace
from .operation import map_nn, act_map, GeoLayer
from autogllight.utils.backend import BackendOperator as BK

DEFAULT_GNN = [
    "gat",
    "gcn",
    "cos",
    "const",
    "gat_sym",
    "linear",
    "generalized_linear",
]
DEFAULT_AGG = [
    "sum",
    "mean",
    "max",
    "mlp",
]

DEFAULT_ACT = [
    "sigmoid",
    "tanh",
    "relu",
    "linear",
    "softplus",
    "leaky_relu",
    "relu6",
    "elu",
]
DEFAULT_HEAD = [1, 2, 4, 6, 8, 16]
DEFAULT_OUT = [4, 8, 16, 32, 64, 128, 256]
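# The lists above span the GraphNAS macro search space: per layer the controller
# picks one message/attention type (DEFAULT_GNN), one aggregator (DEFAULT_AGG),
# one activation (DEFAULT_ACT), one head count (DEFAULT_HEAD) and, for all but
# the final layer, one output width (DEFAULT_OUT). A sampled two-layer design
# thus flattens to five genes per layer, e.g. (values illustrative only, not
# taken from this module):
#
#     ["gat", "sum", "relu", 4, 64,    # layer 0
#      "gcn", "mean", "tanh", 2, 7]    # layer 1; width fixed to output_dim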


class GraphNasMacroNodeClassificationSpace(BaseSpace):
    def __init__(
        self,
        hidden_dim: _typ.Optional[int] = 64,
        layer_number: _typ.Optional[int] = 2,
        dropout: _typ.Optional[float] = 0.6,
        input_dim: _typ.Optional[int] = None,
        output_dim: _typ.Optional[int] = None,
        gnns: _typ.Tuple = DEFAULT_GNN,
        aggs=DEFAULT_AGG,
        acts=DEFAULT_ACT,
        heads=DEFAULT_HEAD,
        outs=DEFAULT_OUT,
        search_act_con=False,
    ):
        super().__init__()
        self.layer_number = layer_number
        self.hidden_dim = hidden_dim
        self.input_dim = input_dim
        self.output_dim = output_dim
        self.gnns = gnns
        self.aggs = aggs
        self.acts = acts
        self.heads = heads
        self.outs = outs
        self.dropout = dropout
        self.search_act_con = search_act_con
    def build_graph(self):
        layer_nums = self.layer_number
        state_num = 5  # five choices per layer: message, aggregation, activation, heads, out channels

        # build hidden layers
        for i in range(layer_nums):
            # message (attention) choice
            layer = i * state_num + 0
            op_candidates = map_nn(self.gnns)
            key = f"attention_{i}"
            self.setLayerChoice(layer, op_candidates, key=key)

            # aggregation choice
            layer = i * state_num + 1
            op_candidates = map_nn(self.aggs)
            key = f"aggregator_{i}"
            self.setLayerChoice(layer, op_candidates, key=key)

            # activation choice
            layer = i * state_num + 2
            op_candidates = map_nn(self.acts)
            key = f"act_{i}"
            self.setLayerChoice(layer, op_candidates, key=key)

            # head-number choice
            layer = i * state_num + 3
            op_candidates = map_nn(self.heads)
            key = f"head_{i}"
            self.setLayerChoice(layer, op_candidates, key=key)

            # output-width choice; the last layer's width is fixed to output_dim
            if i < layer_nums - 1:
                layer = i * state_num + 4
                op_candidates = map_nn(self.outs)
                key = f"out_channels_{i}"
                self.setLayerChoice(layer, op_candidates, key=key)
    def parse_model(self, selection):
        sel_list = []
        for i in range(self.layer_number):
            sel_list.append(self.gnns[selection[f"attention_{i}"]])
            sel_list.append(self.aggs[selection[f"aggregator_{i}"]])
            sel_list.append(self.acts[selection[f"act_{i}"]])
            sel_list.append(self.heads[selection[f"head_{i}"]])
            if i < self.layer_number - 1:
                sel_list.append(self.outs[selection[f"out_channels_{i}"]])
        sel_list.append(self.output_dim)
        # e.g. sel_list = ['const', 'sum', 'relu6', 2, 128, 'gat', 'sum', 'linear', 2, 7]
        model = GraphNet(
            sel_list,
            self.input_dim,
            self.output_dim,
            self.dropout,
            multi_label=False,
            batch_normal=False,
            layers=self.layer_number,
        ).wrap()
        return model
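# Usage sketch (not part of the original module): how the space might be driven
# end to end. The dataset dimensions and the selection indices below are
# hypothetical; each index points into the corresponding DEFAULT_* list.
#
#     space = GraphNasMacroNodeClassificationSpace(input_dim=1433, output_dim=7)
#     space.build_graph()
#     selection = {
#         "attention_0": 0,     # "gat"
#         "aggregator_0": 0,    # "sum"
#         "act_0": 2,           # "relu"
#         "head_0": 2,          # 4 heads
#         "out_channels_0": 4,  # 64 channels
#         "attention_1": 1,     # "gcn"
#         "aggregator_1": 1,    # "mean"
#         "act_1": 1,           # "tanh"
#         "head_1": 0,          # 1 head
#     }
#     model = space.parse_model(selection)  # -> wrapped GraphNet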
class GraphNet(BaseSpace):
    def __init__(
        self,
        actions,
        num_feat,
        num_label,
        drop_out=0.6,
        multi_label=False,
        batch_normal=True,
        state_num=5,
        residual=False,
        layers=2,
    ):
        self.residual = residual
        self.batch_normal = batch_normal
        self.layer_nums = layers
        self.multi_label = multi_label
        self.num_feat = num_feat
        self.num_label = num_label
        self.input_dim = num_feat
        self.output_dim = num_label
        self.dropout = drop_out

        super().__init__()
        self.build_model(
            actions, batch_normal, drop_out, num_feat, num_label, state_num
        )

    def build_model(
        self, actions, batch_normal, drop_out, num_feat, num_label, state_num
    ):
        if self.residual:
            self.fcs = torch.nn.ModuleList()
        if self.batch_normal:
            self.bns = torch.nn.ModuleList()
        self.layers = torch.nn.ModuleList()
        self.acts = []
        self.gates = torch.nn.ModuleList()
        self.build_hidden_layers(
            actions,
            batch_normal,
            drop_out,
            self.layer_nums,
            num_feat,
            num_label,
            state_num,
        )

    def build_hidden_layers(
        self,
        actions,
        batch_normal,
        drop_out,
        layer_nums,
        num_feat,
        num_label,
        state_num=6,
    ):
        # build hidden layers
        for i in range(layer_nums):
            if i == 0:
                in_channels = num_feat
            else:
                in_channels = out_channels * head_num

            # extract layer information from the flat action list
            attention_type = actions[i * state_num + 0]
            aggregator_type = actions[i * state_num + 1]
            act = actions[i * state_num + 2]
            head_num = actions[i * state_num + 3]
            out_channels = actions[i * state_num + 4]
            concat = True
            if i == layer_nums - 1:
                concat = False
            if self.batch_normal:
                self.bns.append(torch.nn.BatchNorm1d(in_channels, momentum=0.5))
            self.layers.append(
                GeoLayer(
                    in_channels,
                    out_channels,
                    head_num,
                    concat,
                    dropout=self.dropout,
                    att_type=attention_type,
                    agg_type=aggregator_type,
                )
            )
            self.acts.append(act_map(act))
            if self.residual:
                if concat:
                    self.fcs.append(
                        torch.nn.Linear(in_channels, out_channels * head_num)
                    )
                else:
                    self.fcs.append(torch.nn.Linear(in_channels, out_channels))

    def forward(self, data):
        output = BK.feat(data)
        # output, edge_index_all = data.x, data.edge_index
        # x: [2708, 1433], edge_index: [2, 10556]
        if self.residual:
            for i, (act, layer, fc) in enumerate(
                zip(self.acts, self.layers, self.fcs)
            ):
                output = F.dropout(output, p=self.dropout, training=self.training)
                if self.batch_normal:
                    output = self.bns[i](output)
                # output = act(layer(output, edge_index_all) + fc(output))
                output = act(BK.gconv(layer, data, output) + fc(output))
        else:
            for i, (act, layer) in enumerate(zip(self.acts, self.layers)):
                output = F.dropout(output, p=self.dropout, training=self.training)
                if self.batch_normal:
                    output = self.bns[i](output)
                # output = act(layer(output, edge_index_all))
                output = act(BK.gconv(layer, data, output))
        if not self.multi_label:
            output = F.log_softmax(output, dim=1)
        return output

    def __repr__(self):
        result_lines = ""
        for each in self.layers:
            result_lines += str(each)
        return result_lines

    @staticmethod
    def merge_param(old_param, new_param, update_all):
        for key in new_param:
            if update_all or key not in old_param:
                old_param[key] = new_param[key]
        return old_param

    def get_param_dict(self, old_param=None, update_all=True):
        if old_param is None:
            result = {}
        else:
            result = old_param
        for i in range(self.layer_nums):
            key = "layer_%d" % i
            new_param = self.layers[i].get_param_dict()
            if key in result:
                new_param = self.merge_param(result[key], new_param, update_all)
                result[key] = new_param
            else:
                result[key] = new_param
        if self.residual:
            for i, fc in enumerate(self.fcs):
                key = f"layer_{i}_fc_{fc.weight.size(0)}_{fc.weight.size(1)}"
                result[key] = self.fcs[i]
        if self.batch_normal:
            for i, bn in enumerate(self.bns):
                key = f"layer_{i}_fc_{bn.weight.size(0)}"
                result[key] = self.bns[i]
        return result

    def load_param(self, param):
        if param is None:
            return
        for i in range(self.layer_nums):
            self.layers[i].load_param(param["layer_%d" % i])
        if self.residual:
            for i, fc in enumerate(self.fcs):
                key = f"layer_{i}_fc_{fc.weight.size(0)}_{fc.weight.size(1)}"
                if key in param:
                    self.fcs[i] = param[key]
        if self.batch_normal:
            for i, bn in enumerate(self.bns):
                key = f"layer_{i}_fc_{bn.weight.size(0)}"
                if key in param:
                    self.bns[i] = param[key]