Source code for cogdl.models.nn.gcnii

import math

import torch
import torch.nn as nn
import torch.nn.functional as F

from .. import register_model, BaseModel
from cogdl.utils import spmm, symmetric_normalization, row_normalization, add_remaining_self_loops


class GCNIILayer(nn.Module):
    def __init__(self, n_channels, alpha=0.1, beta=1, residual=False):
        super(GCNIILayer, self).__init__()
        self.n_channels = n_channels
        self.alpha = alpha
        self.beta = beta
        self.residual = residual
        self.weight = nn.Parameter(torch.FloatTensor(n_channels, n_channels))
        self.reset_parameters()

    def reset_parameters(self):
        stdv = 1.0 / math.sqrt(self.n_channels)
        self.weight.data.uniform_(-stdv, stdv)

    def forward(self, x, edge_index, edge_attr, init_x):
        # Initial residual: mix the propagated features with the first layer's
        # representation init_x, weighted by alpha.
        hidden = spmm(edge_index, edge_attr, x)
        hidden = (1 - self.alpha) * hidden + self.alpha * init_x
        # Identity mapping: interpolate between the linearly transformed and the
        # untransformed features, weighted by beta.
        h = self.beta * torch.matmul(hidden, self.weight) + (1 - self.beta) * hidden
        if self.residual:
            h = h + x
        return h
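
# --- Illustrative usage sketch (added; not part of the original source) ---
# A minimal example of a single GCNIILayer call on a toy graph, assuming
# `spmm(edge_index, edge_attr, x)` multiplies the sparse (normalized) adjacency
# defined by `edge_index`/`edge_attr` with `x`, as it is used in `forward` above.
# All tensors below are made-up toy data:
#
#     layer = GCNIILayer(n_channels=16, alpha=0.1, beta=0.5)
#     x = torch.randn(4, 16)                        # 4 nodes, 16 channels
#     edge_index = torch.tensor([[0, 1, 2, 3],
#                                [1, 2, 3, 0]])     # toy edges
#     edge_attr = torch.ones(edge_index.shape[1])   # uniform edge weights
#     out = layer(x, edge_index, edge_attr, init_x=x)   # -> shape (4, 16)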


@register_model("gcnii")
class GCNII(BaseModel):
    @staticmethod
    def add_args(parser):
        parser.add_argument("--hidden-size", type=int, default=64)
        parser.add_argument("--num-layers", type=int, default=64)
        parser.add_argument("--lambda", dest="lmbda", type=float, default=0.5)
        parser.add_argument("--alpha", type=float, default=0.1)
        parser.add_argument("--dropout", type=float, default=0.6)
        parser.add_argument("--wd1", type=float, default=0.01)
        parser.add_argument("--wd2", type=float, default=5e-4)

    @classmethod
    def build_model_from_args(cls, args):
        return cls(
            in_feats=args.num_features,
            hidden_size=args.hidden_size,
            out_feats=args.num_classes,
            num_layers=args.num_layers,
            dropout=args.dropout,
            alpha=args.alpha,
            lmbda=args.lmbda,
            wd1=args.wd1,
            wd2=args.wd2,
        )

    def __init__(self, in_feats, hidden_size, out_feats, num_layers, dropout=0.5, alpha=0.1, lmbda=1, wd1=0.0, wd2=0.0):
        super(GCNII, self).__init__()
        # Two linear layers: input -> hidden before propagation, hidden -> output
        # after (only fc_layers[0] and fc_layers[1] are used in forward; the
        # original text repeated the second append verbatim).
        self.fc_layers = nn.ModuleList()
        self.fc_layers.append(nn.Linear(in_features=in_feats, out_features=hidden_size))
        self.fc_layers.append(nn.Linear(in_features=hidden_size, out_features=out_feats))
        self.dropout = dropout
        self.alpha = alpha
        self.lmbda = lmbda
        self.wd1 = wd1
        self.wd2 = wd2
        self.layers = nn.ModuleList(
            GCNIILayer(hidden_size, self.alpha, math.log(self.lmbda / (i + 1) + 1)) for i in range(num_layers)
        )
        self.activation = F.relu
        self.fc_parameters = list(self.fc_layers.parameters())
        self.conv_parameters = list(self.layers.parameters())
        self.edge_attr = None
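
    # Note (added): beta_l = log(lambda / l + 1) is the per-layer decay schedule
    # from the GCNII paper; since log(1 + t) is close to t for small t, beta_l
    # shrinks roughly like lambda / l, so deeper layers stay nearer an identity
    # mapping.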

    def forward(self, x, edge_index, edge_attr=None):
        # Normalize the adjacency (with self-loops) once and cache the weights.
        if self.edge_attr is None:
            if edge_attr is not None:
                self.edge_attr = edge_attr
            else:
                edge_index, edge_weight = add_remaining_self_loops(
                    edge_index=edge_index,
                    edge_weight=torch.ones(edge_index.shape[1]).to(x.device),
                    fill_value=1,
                    num_nodes=x.shape[0],
                )
                self.edge_attr = symmetric_normalization(
                    num_nodes=x.shape[0],
                    edge_index=edge_index,
                    edge_weight=edge_weight,
                )
        else:
            # Weights are cached; only re-add self-loops to edge_index so it
            # matches the cached edge_attr.
            edge_index, _ = add_remaining_self_loops(
                edge_index=edge_index,
                edge_weight=torch.ones(edge_index.shape[1]).to(x.device),
                fill_value=1,
                num_nodes=x.shape[0],
            )
        init_h = F.dropout(x, p=self.dropout, training=self.training)
        init_h = F.relu(self.fc_layers[0](init_h))
        h = init_h
        for layer in self.layers:
            h = F.dropout(h, p=self.dropout, training=self.training)
            h = layer(h, edge_index, self.edge_attr, init_h)
            h = self.activation(h)
        h = F.dropout(h, p=self.dropout, training=self.training)
        out = self.fc_layers[1](h)
        return F.log_softmax(out, dim=-1)
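
    # Note (added): `symmetric_normalization` is expected to rescale each edge
    # weight w_ij to w_ij / sqrt(d_i * d_j), i.e. D^{-1/2} (A + I) D^{-1/2};
    # caching it in `self.edge_attr` avoids recomputing it on every call.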

    def loss(self, data):
        loss_n = F.nll_loss(
            self.forward(data.x, data.edge_index)[data.train_mask],
            data.y[data.train_mask],
        )
        return loss_n
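
    # Note (added): `forward` returns log-probabilities (log_softmax), so
    # F.nll_loss is the correct pairing here; together they are equivalent to
    # cross-entropy on the raw logits.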

    def predict(self, data):
        return self.forward(data.x, data.edge_index)

    def get_optimizer(self, args):
        # Separate weight-decay groups: wd1 for the linear layers, wd2 for the
        # GCNII propagation layers, following the paper's training setup.
        return torch.optim.Adam(
            [
                {"params": self.fc_parameters, "weight_decay": self.wd1},
                {"params": self.conv_parameters, "weight_decay": self.wd2},
            ],
            lr=args.lr,
        )
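

# --- Illustrative smoke test (added; not part of the original source) ---
# A minimal sketch, assuming the cogdl utilities imported above behave as they
# are used in `forward`; all shapes and hyperparameters are toy values.
if __name__ == "__main__":
    model = GCNII(in_feats=8, hidden_size=16, out_feats=3, num_layers=4)
    x = torch.randn(10, 8)                      # 10 nodes, 8 input features
    edge_index = torch.randint(0, 10, (2, 40))  # 40 random toy edges
    out = model(x, edge_index)                  # log-probabilities, shape (10, 3)
    print(out.shape)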