forked from TristanBilot/phishGNN
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
✨ add MemPool + move train() and test() to model classes
- Loading branch information
1 parent
b63f414
commit fe473a4
Showing
5 changed files
with
224 additions
and
46 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -2,3 +2,4 @@ | |
|
||
from .gcn import GCN | ||
from .gin import GIN | ||
from .mem_pool import MemPool |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,125 @@ | ||
import os.path as osp | ||
|
||
import torch | ||
import torch.nn.functional as F | ||
from torch.nn import BatchNorm1d, LeakyReLU, Linear | ||
|
||
from torch_geometric.datasets import TUDataset | ||
from torch_geometric.loader import DataLoader | ||
from torch_geometric.nn import DeepGCNLayer, GATConv, MemPooling | ||
|
||
# path = osp.join('data', 'TUD') | ||
# dataset = TUDataset(path, name="MUTAG", use_node_attr=True) | ||
# dataset.data.x = dataset.data.x[:, :-3] # only use non-binary features. | ||
# dataset = dataset.shuffle() | ||
|
||
# n = (len(dataset)) // 10 | ||
# test_dataset = dataset[:n] | ||
# val_dataset = dataset[n:2 * n] | ||
# train_dataset = dataset[2 * n:] | ||
|
||
# test_loader = DataLoader(test_dataset, batch_size=20) | ||
# val_loader = DataLoader(val_dataset, batch_size=20) | ||
# train_loader = DataLoader(train_dataset, batch_size=20) | ||
|
||
|
||
class MemPool(torch.nn.Module): | ||
def __init__(self, in_channels, hidden_channels, out_channels, device, dropout=0.5): | ||
super().__init__() | ||
self.device = device | ||
self.to(device) | ||
self.dropout = dropout | ||
|
||
self.lin = Linear(in_channels, hidden_channels) | ||
|
||
self.convs = torch.nn.ModuleList() | ||
for i in range(2): | ||
conv = GATConv(hidden_channels, hidden_channels, dropout=dropout) | ||
norm = BatchNorm1d(hidden_channels) | ||
act = LeakyReLU() | ||
self.convs.append( | ||
DeepGCNLayer(conv, norm, act, block='res+', dropout=dropout)) | ||
|
||
self.mem1 = MemPooling(hidden_channels, 80, heads=5, num_clusters=10) | ||
self.mem2 = MemPooling(80, out_channels, heads=5, num_clusters=1) | ||
|
||
|
||
def forward(self, x, edge_index, batch): | ||
x = x.float() | ||
x = self.lin(x) | ||
for conv in self.convs: | ||
x = conv(x, edge_index) | ||
|
||
x, S1 = self.mem1(x, batch) | ||
x = F.leaky_relu(x) | ||
x = F.dropout(x, p=self.dropout) | ||
x, S2 = self.mem2(x) | ||
|
||
return ( | ||
F.log_softmax(x.squeeze(1), dim=-1), | ||
MemPooling.kl_loss(S1) + MemPooling.kl_loss(S2), | ||
) | ||
|
||
|
||
def fit( | ||
self, | ||
train_loader, | ||
optimizer, | ||
loss_fn, | ||
device, | ||
): | ||
self.train() | ||
|
||
self.mem1.k.requires_grad = False | ||
self.mem2.k.requires_grad = False | ||
for data in train_loader: | ||
optimizer.zero_grad() | ||
data = data.to(self.device) | ||
out = self(data.x, data.edge_index, data.batch)[0] | ||
loss = F.nll_loss(out, data.y.long()) | ||
loss.backward() | ||
optimizer.step() | ||
|
||
kl_loss = 0. | ||
self.mem1.k.requires_grad = True | ||
self.mem2.k.requires_grad = True | ||
optimizer.zero_grad() | ||
for data in train_loader: | ||
data = data.to(self.device) | ||
kl_loss += self(data.x, data.edge_index, data.batch)[1] | ||
|
||
kl_loss /= len(train_loader.dataset) | ||
kl_loss.backward() | ||
optimizer.step() | ||
|
||
return kl_loss | ||
|
||
|
||
@torch.no_grad() | ||
def test(self, loader): | ||
self.eval() | ||
correct = 0 | ||
for data in loader: | ||
data = data.to(self.device) | ||
out = self(data.x, data.edge_index, data.batch)[0] | ||
pred = out.argmax(dim=-1) | ||
correct += int((pred == data.y).sum()) | ||
return correct / len(loader.dataset) | ||
|
||
|
||
# patience = start_patience = 250 | ||
# test_acc = best_val_acc = 0. | ||
# for epoch in range(1, 2001): | ||
# train() | ||
# val_acc = test(val_loader) | ||
# if epoch % 500 == 0: | ||
# optimizer.param_groups[0]['lr'] *= 0.5 | ||
# if best_val_acc < val_acc: | ||
# patience = start_patience | ||
# best_val_acc = val_acc | ||
# test_acc = test(test_loader) | ||
# else: | ||
# patience -= 1 | ||
# print(f'Epoch {epoch:02d}, Val: {val_acc:.3f}, Test: {test_acc:.3f}') | ||
# if patience <= 0: | ||
# break |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters