I am fairly new to Graph Neural Networks (GNNs) and am using PyTorch Geometric (PyG). I am writing a reinforcement learning algorithm, so I would like to avoid the built-in DataLoader because I generate data/observations on the fly. However, I run into an issue when passing a batch of PyG graphs through the network. I keep the PyG graphs in a NumPy object array that serves as my memory; I pick graphs from this memory and try to push them through the neural network (NN).
import torch as T
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torch_geometric.nn import GCNConv
from torch_geometric.data import Batch
from torch_geometric.data import Data
import numpy as np
class DeepNetworkGCN(nn.Module):
    """Two GCN layers followed by a linear layer.

    The network maps the node features of a graph to ``out_dims`` values
    per node: ``GCNConv -> ReLU -> GCNConv -> Linear``. No pooling over
    nodes is performed, so the output has one row per input node.
    """

    def __init__(
        self,
        lr=0.001,
        input_dims=(1,),
        fc1_dims=128,
        fc2_dims=128,
        out_dims=(1,),
    ):
        """Build the layers, the optimizer and the loss.

        Args:
            lr: Learning rate handed to the Adam optimizer.
            input_dims: One-element sequence holding the number of input
                features per node (it is unpacked into ``GCNConv``).
            fc1_dims: Output width of the first GCN layer.
            fc2_dims: Output width of the second GCN layer.
            out_dims: One-element sequence holding the number of outputs
                per node (it is unpacked into ``nn.Linear``).
        """
        super().__init__()
        # Graph convolution part of the network.
        self.GCNconv1 = GCNConv(*input_dims, fc1_dims)
        self.GCNconv2 = GCNConv(fc1_dims, fc2_dims)
        # Conform to the output dimension.
        self.fc1 = nn.Linear(fc2_dims, *out_dims)
        self.optimizer = optim.Adam(self.parameters(), lr=lr)
        self.loss = nn.MSELoss()
        # The device names must be string literals. This only records the
        # preferred device; the parameters are NOT moved here, so callers
        # that want GPU execution must move both the model and its inputs.
        self.device = T.device("cuda:0" if T.cuda.is_available() else "cpu")

    def forward(self, state) -> T.Tensor:
        """Run the network on a graph (or a batch of graphs).

        Args:
            state: Object exposing ``x`` (node features) and ``edge_index``
                (connectivity), e.g. a PyG ``Data`` or ``Batch``.

        Returns:
            The output of the final linear layer, one row per node in
            ``state.x``.
        """
        # Process graph data using the GCN layers.
        hidden = self.GCNconv1(state.x, state.edge_index)
        hidden = F.relu(hidden)
        hidden = self.GCNconv2(hidden, state.edge_index)
        # Final fully connected layer.
        return self.fc1(hidden)
def random_pyg_graph(num_nodes=3, edge_feature_dim=1):
    """Create a random PyG ``Data`` graph without self-loops.

    Args:
        num_nodes: Number of nodes in the graph.
        edge_feature_dim: Number of random features generated per edge.

    Returns:
        A ``Data`` object with ``x`` of shape ``(num_nodes, 1)``, an
        ``edge_index`` with two rows and at most ``2 * num_nodes`` columns,
        and an ``edge_attr`` holding one row per remaining edge.
    """
    # Random node features: integer values in [0, 5) stored as floats.
    node_features = T.randint(0, 5, (num_nodes, 1), dtype=T.float)
    # Random edge indices: 2 * num_nodes candidate (source, target) pairs.
    candidate_edges = T.randint(0, num_nodes, (2, num_nodes * 2))
    # Remove self-loops, i.e. columns whose source equals their target.
    not_self_loop = candidate_edges[0] != candidate_edges[1]
    edge_index = candidate_edges[:, not_self_loop]
    # Random edge features, drawn only after filtering so that there is
    # exactly one feature row per edge that survived (edge_attr is indexed
    # by edge, not by node pair).
    edge_features = T.randn(edge_index.size(1), edge_feature_dim)
    return Data(x=node_features, edge_index=edge_index, edge_attr=edge_features)
# setup example
batch_size = 3
memory = np.zeros(batch_size, dtype=object)
# fill memory (element-wise, so each slot holds exactly one graph object)
for i in range(batch_size):
    memory[i] = random_pyg_graph()
# define model
CNN = DeepNetworkGCN()
# test for a single PyG graph; call the module itself rather than
# .forward() so that any registered hooks are run as well
output = CNN(memory[0])
# output: 1 value for each node e.g.
# tensor([[0.3770],
# [0.6119],
# [0.2014]], grad_fn=<AddmmBackward0>)
# Passing the numpy.ndarray itself, i.e. CNN(memory[:]), FAILS: the array
# is not a graph and has no `x` / `edge_index` attributes for forward().
# Create a batch from a plain list of graphs and do the forward pass.
batch = Batch.from_data_list(list(memory))
output = CNN(batch)
# The output has n_nodes * batch_size rows. This is expected: batching
# stacks the nodes of all graphs into one large graph and the network
# returns one value per node. `batch.batch` gives the graph index of
# each row if per-graph results are needed.
# tensor([[ 0.0173],
# [ 0.0316],
# [ 0.0282],
# [ 0.0147],
# [-0.0201],
# [-0.0264],
# [ 0.0147],
# [-0.0084],
# [ 0.0021]], grad_fn=<AddmmBackward0>)