
base.py
"""
Performance check of DGL model + trainer + dataset
"""
import argparse
import logging

import numpy as np
import torch
import torch.nn.functional as F
from tqdm import tqdm
from dgl.data import CoraGraphDataset, PubmedGraphDataset, CiteseerGraphDataset
from dgl.nn.pytorch import GraphConv, GATConv, SAGEConv

logging.basicConfig(level=logging.ERROR)


class GCN(torch.nn.Module):
    """Two-layer GCN with a 16-dim hidden layer."""

    def __init__(self, num_features, num_classes):
        super(GCN, self).__init__()
        self.conv1 = GraphConv(num_features, 16)
        self.conv2 = GraphConv(16, num_classes)

    def forward(self, graph):
        features = graph.ndata['feat']
        features = F.relu(self.conv1(graph, features))
        features = F.dropout(features, training=self.training)
        features = self.conv2(graph, features)
        return F.log_softmax(features, dim=-1)


class GAT(torch.nn.Module):
    """Two-layer GAT: 8 heads of size 8, concatenated, then one averaged output head."""

    def __init__(self, num_features, num_classes):
        super(GAT, self).__init__()
        self.conv1 = GATConv(num_features, 8, 8, feat_drop=.6, attn_drop=.6, activation=F.relu)
        self.conv2 = GATConv(8 * 8, num_classes, 1, feat_drop=.6, attn_drop=.6)

    def forward(self, graph):
        features = graph.ndata['feat']
        # (N, heads, out) -> (N, heads * out): concatenate the attention heads
        features = self.conv1(graph, features).flatten(1)
        # average over the single output head: (N, 1, classes) -> (N, classes)
        features = self.conv2(graph, features).mean(1)
        return F.log_softmax(features, dim=-1)


class SAGE(torch.nn.Module):
    """GraphSAGE with a configurable number of layers and the 'gcn' aggregator."""

    def __init__(self, num_features, hidden_channels, num_layers, num_classes):
        super(SAGE, self).__init__()
        self.num_layers = num_layers
        self.convs = torch.nn.ModuleList()
        for i in range(num_layers):
            inc = outc = hidden_channels
            if i == 0:
                inc = num_features
            if i == num_layers - 1:
                outc = num_classes
            self.convs.append(SAGEConv(inc, outc, 'gcn'))
        self.dropout = torch.nn.Dropout()

    def forward(self, graph):
        h = graph.ndata['feat']
        h = self.dropout(h)
        for i, conv in enumerate(self.convs):
            h = conv(graph, h)
            # ReLU + dropout between layers, but not after the final layer
            if i != self.num_layers - 1:
                h = h.relu()
                h = self.dropout(h)
        return F.log_softmax(h, dim=-1)


@torch.no_grad()
def test(model, graph, mask, label):
    """Return accuracy on the nodes selected by `mask`."""
    model.eval()
    pred = model(graph)[mask].max(1)[1]
    acc = pred.eq(label[mask]).sum().item() / mask.sum().item()
    return acc


def train(model, graph, args, label, train_mask, val_mask):
    optimizer = torch.optim.Adam(model.parameters(), lr=args.lr, weight_decay=args.weight_decay)
    parameters = model.state_dict()
    best_acc = 0.
    for epoch in range(args.epoch):
        model.train()
        optimizer.zero_grad()
        output = model(graph)
        loss = F.nll_loss(output[train_mask], label[train_mask])
        loss.backward()
        optimizer.step()
        val_acc = test(model, graph, val_mask, label)
        if val_acc > best_acc:
            best_acc = val_acc
            parameters = model.state_dict()
    # restore the checkpoint with the best validation accuracy
    model.load_state_dict(parameters)
    return model


if __name__ == '__main__':
    parser = argparse.ArgumentParser('dgl')
    parser.add_argument('--device', type=str, default='cuda')
    parser.add_argument('--dataset', type=str, choices=['Cora', 'CiteSeer', 'PubMed'], default='Cora')
    parser.add_argument('--repeat', type=int, default=50)
    parser.add_argument('--model', type=str, choices=['gat', 'gcn', 'sage'], default='gat')
    parser.add_argument('--lr', type=float, default=0.01)
    parser.add_argument('--weight_decay', type=float, default=0.0)
    parser.add_argument('--epoch', type=int, default=200)
    args = parser.parse_args()
    # seed = 100
    if args.dataset == 'Cora':
        dataset = CoraGraphDataset()
    elif args.dataset == 'CiteSeer':
        dataset = CiteseerGraphDataset()
    elif args.dataset == 'PubMed':
        dataset = PubmedGraphDataset()
    graph = dataset[0].to(args.device)
    label = graph.ndata['label']
    train_mask = graph.ndata['train_mask']
    val_mask = graph.ndata['val_mask']
    test_mask = graph.ndata['test_mask']

    accs = []
    for seed in tqdm(range(args.repeat)):
        np.random.seed(seed)
        torch.manual_seed(seed)
        if args.model == 'gat':
            model = GAT(graph.ndata['feat'].size(1), dataset.num_classes)
        elif args.model == 'gcn':
            model = GCN(graph.ndata['feat'].size(1), dataset.num_classes)
        elif args.model == 'sage':
            model = SAGE(graph.ndata['feat'].size(1), 64, 2, dataset.num_classes)
        model.to(args.device)
        train(model, graph, args, label, train_mask, val_mask)
        acc = test(model, graph, test_mask, label)
        accs.append(acc)
    print('{:.4f} ~ {:.4f}'.format(np.mean(accs), np.std(accs)))
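
For reference, a typical invocation (assuming the file is saved as base.py, per the page header; all flags come from the argparse block above):

    python base.py --model gcn --dataset Cora --device cpu --repeat 10

Each repeat reseeds NumPy and PyTorch with the loop index and retrains the chosen model from scratch; the final line prints the mean ~ standard deviation of test accuracy across repeats.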