gcn

Module: gcn.py

This module implements Graph Convolution Networks (GCNs)

It provides functionality to

Perform transformations on Graphs using GCN
Train GCNs for a loss function

Key Features

Built on top of the equinox `Module` base class, inheriting all of its functionality
Efficient neural networks implementation using equinox modules

Authors

Rajarshi Dasgupta (rajarshid@iisc.ac.in)

Version Info

10/01/2025: Initial version

`GCN`

Bases: Module

Source code in scirex/core/dl/gcn.py

class GCN(eqx.Module):
    """
    Graph Convolution Network implemented as an equinox module.

    For every consecutive pair of sizes in `layers` the network stores two
    matrices of shape (layers[i], layers[i + 1]): `W`, applied to the
    degree-normalised neighbourhood aggregate, and `B`, applied to the
    node's own embedding.
    """

    # Number of entries in `layers`; there are `num_layers - 1` weight pairs.
    num_layers: int
    # Neighbourhood weight matrices, one per layer transition.
    W_list: list
    # Self-connection weight matrices, one per layer transition.
    B_list: list

    # Activation callables, paired in order with the weight matrices.
    activations: list

    def __init__(self, layers, activations, key):
        """
        Initialize a GCN instance with random initial parameters.

        Args:
            layers: a python list indicating the size of the node embeddings
                at each layer
            activations: a python list of activation functions, one per
                layer transition
            key: JAX PRNG key used to draw the initial W and B matrices from
                a standard normal distribution
        """
        self.num_layers = len(layers)
        self.activations = activations

        W_list = []
        B_list = []
        for fan_in, fan_out in zip(layers[:-1], layers[1:]):
            # Fresh sub-keys per layer so W and B are drawn independently.
            weights_key, bias_key, key = jax.random.split(key, num=3)
            W_list.append(jax.random.normal(weights_key, (fan_in, fan_out)))
            B_list.append(jax.random.normal(bias_key, (fan_in, fan_out)))

        self.W_list = W_list
        self.B_list = B_list

    def __call__(self, z, adj_mat, degree):
        """
        Propagate node embeddings through every GCN layer.

        Each layer computes ``activation(D^-1 @ adj_mat @ z @ W + z @ B)``
        where ``D^-1`` scales row i by ``1 / degree[i]``. Layers are paired
        with `activations` through `zip`, so iteration stops at the shortest
        of the activation and weight lists.

        Args:
            z: jnp array for which the i-th row is the i-th node embedding
            adj_mat: the adjacency matrix. Ideally it should be a sparse matrix
            degree: jnp array where the i-th element is the degree of the
                i-th node (entries are expected to be non-zero)

        Returns:
            node embeddings of the output
        """
        # Scaling the rows of `adj_mat @ z` is equivalent to left-multiplying
        # by diagflat(1 / degree), without materialising a dense N x N matrix
        # or paying for an N x N matmul in every layer. The reshape flattens
        # `degree` the same way diagflat would.
        inv_degree = jnp.reshape(1.0 / degree, (-1, 1))

        for activation, W, B in zip(self.activations, self.W_list, self.B_list):
            z = activation((inv_degree * (adj_mat @ z)) @ W + z @ B)
        return z

`call(z, adj_mat, degree)`

Apply the GCN layers to the node embeddings and return the transformed embeddings.

Parameters:

Name	Description	Default
`z`	jnp array for which the i-th row is the i-th node embedding	required
`adj_mat`	the adjacency matrix. Ideally it should be a sparse matrix	required
`degree`	jnp array where the i-th element is the degree of the i-th node	required

Output

node embeddings of the output

Source code in scirex/core/dl/gcn.py

def __call__(self, z, adj_mat, degree):
    """
    Propagate node embeddings through every GCN layer.

    Each layer computes ``activation(D^-1 @ adj_mat @ z @ W + z @ B)``
    where ``D^-1`` scales row i by ``1 / degree[i]``. Layers are paired
    with `activations` through `zip`, so iteration stops at the shortest
    of the activation and weight lists.

    Args:
        z: jnp array for which the i-th row is the i-th node embedding
        adj_mat: the adjacency matrix. Ideally it should be a sparse matrix
        degree: jnp array where the i-th element is the degree of the
            i-th node (entries are expected to be non-zero)

    Returns:
        node embeddings of the output
    """
    # Scaling the rows of `adj_mat @ z` is equivalent to left-multiplying
    # by diagflat(1 / degree), without materialising a dense N x N matrix
    # or paying for an N x N matmul in every layer. The reshape flattens
    # `degree` the same way diagflat would.
    inv_degree = jnp.reshape(1.0 / degree, (-1, 1))

    for activation, W, B in zip(self.activations, self.W_list, self.B_list):
        z = activation((inv_degree * (adj_mat @ z)) @ W + z @ B)
    return z

`init(layers, activations, key)`

Initialize a GCN instance with random initial parameters

Inputs

layers: a python list indicating the size of the node embeddings at each layer; activations: a python list of activation functions; key: to generate random numbers for initialising the W and B matrices

Source code in scirex/core/dl/gcn.py

def __init__(self, layers, activations, key):
    """
    Build a GCN with randomly drawn parameters.

    Args:
        layers: a python list giving the node-embedding size at each layer
        activations: a python list of activation functions
        key: JAX PRNG key consumed to draw the initial W and B matrices
    """
    neighbour_weights = []
    self_weights = []

    # Walk over consecutive (input size, output size) pairs of `layers`.
    for fan_in, fan_out in zip(layers[:-1], layers[1:]):
        weights_key, bias_key, key = jax.random.split(key, num=3)
        shape = (fan_in, fan_out)
        neighbour_weights.append(jax.random.normal(weights_key, shape))
        self_weights.append(jax.random.normal(bias_key, shape))

    self.num_layers = len(layers)
    self.activations = activations
    self.W_list = neighbour_weights
    self.B_list = self_weights

`GCNModel`

Source code in scirex/core/dl/gcn.py

class GCNModel:
    """Training wrapper that fits a `GCN` to targets with an Adam optimizer."""

    def __init__(
        self,
        gcn: GCN,
        loss_fn: callable,
        metrics: list[callable] = None,
    ):
        """
        Initialize the gcn model with network architecture and training parameters.

        Args:
            gcn: Neural network architecture to train.
            loss_fn (Callable): Loss function for training; called as
                ``loss_fn(output, target)``.
            metrics (list[Callable]): List of metric functions for evaluation;
                each is called as ``metric(output)``. Defaults to no metrics.
        """

        self.gcn = gcn
        self.loss_fn = loss_fn
        # A fresh list per instance avoids sharing one mutable default
        # between all GCNModel objects.
        self.metrics = [] if metrics is None else metrics

    def fit(
        self,
        features: jnp.ndarray,
        adjacency_matrix: jnp.ndarray,
        degree_array: jnp.ndarray,
        target: jnp.ndarray,
        learning_rate: float,
        num_iters: int = 10,
        num_check_points: int = 5,
    ):
        """
        Train the gcn

        Args:
            features: Input node embeddings passed to the gcn
            adjacency_matrix: Adjacency matrix passed to the gcn
            degree_array: Node degrees passed to the gcn
            target: Target values handed to the loss function
            learning_rate: Parameter of the gradient based optimisation method
            num_iters: Number of iterations of the gradient based optimisation method
            num_check_points: Approximate number of progress reports printed
                during training; a value <= 0 disables reporting

        Returns:
            Trained gcn
        """
        gcn = self.gcn

        self.optimizer = optax.adam(learning_rate)
        opt_state = self.optimizer.init(eqx.filter(gcn, eqx.is_array))

        # Integer gap: a float gap (num_iters / num_check_points) only matches
        # `iter_id % gap == 0` when the division is exact, and dividing by a
        # zero checkpoint count would raise.
        if num_check_points > 0:
            check_point_gap = max(1, num_iters // num_check_points)
        else:
            check_point_gap = None

        for iter_id in tqdm(range(num_iters), desc="Training", total=num_iters):

            loss, gcn, opt_state = self._update_step(
                gcn, features, adjacency_matrix, degree_array, target, opt_state
            )

            if check_point_gap is not None and iter_id % check_point_gap == 0:
                output = gcn(features, adjacency_matrix, degree_array)
                metric_vals = [m(output) for m in self.metrics]
                print(f"Iter: {iter_id} | Loss: {loss:.2e} | Metrics {metric_vals}")

        return gcn

    @eqx.filter_jit
    def _update_step(
        self,
        gcn: GCN,
        features: jnp.ndarray,
        adjacency_matrix: jnp.ndarray,
        degree_array: jnp.ndarray,
        target: jnp.ndarray,
        opt_state,
    ):
        """
        Perform single training step with JIT compilation.

        NOTE(review): `self.optimizer` is read from the instance inside the
        jitted function; presumably a later `fit` call with a different
        learning rate on the same object could reuse an earlier trace —
        confirm against equinox's `filter_jit` caching rules.

        Args:
            gcn: GCN being trained
            features: Input feature vectors
            adjacency_matrix: Adjacency matrix passed to the gcn
            degree_array: Node degrees passed to the gcn
            target: Target values handed to the loss function
            opt_state: Current optimizer state

        Returns:
            tuple: Tuple containing:
                - Mean loss for this step
                - Updated network
                - Updated optimizer state
        """
        loss, grads = eqx.filter_value_and_grad(self._loss_fn)(
            gcn, features, adjacency_matrix, degree_array, target
        )

        updates, opt_state = self.optimizer.update(
            grads, opt_state, eqx.filter(gcn, eqx.is_array)
        )
        gcn = eqx.apply_updates(gcn, updates)

        return loss, gcn, opt_state

    def _loss_fn(
        self,
        gcn: GCN,
        features: jnp.ndarray,
        adjacency_matrix,
        degree_array,
        target: jnp.ndarray,
    ):
        """
        Compute loss for the given input data.
        Required for getting gradients during training and JIT.

        Args:
            gcn: Instance of GCN
            features: Input feature vectors
            adjacency_matrix: Adjacency matrix passed to the gcn
            degree_array: Node degrees passed to the gcn
            target: Target values handed to the loss function

        Returns:
            jnp.ndarray: Mean of the loss function's output.
        """
        return self.loss_fn(
            gcn(features, adjacency_matrix, degree_array), target
        ).mean()

`init(gcn, loss_fn, metrics=[])`

Initialize the gcn model with network architecture and training parameters.

Parameters:

Name	Type	Description	Default
`gcn`	`GCN`	Neural network architecture to train.	required
`loss_fn`	`Callable`	Loss function for training.	required
`metrics`	`list[Callable]`	List of metric functions for evaluation.	`[]`

Source code in scirex/core/dl/gcn.py

def __init__(
    self,
    gcn: GCN,
    loss_fn: callable,
    metrics: list[callable] = None,
):
    """
    Initialize the gcn model with network architecture and training parameters.

    Args:
        gcn: Neural network architecture to train.
        loss_fn (Callable): Loss function for training.
        metrics (list[Callable]): List of metric functions for evaluation.
            Defaults to no metrics.
    """

    self.gcn = gcn
    self.loss_fn = loss_fn
    # A fresh list per instance avoids sharing one mutable default
    # between all instances.
    self.metrics = [] if metrics is None else metrics

`fit(features, adjacency_matrix, degree_array, target, learning_rate, num_iters=10, num_check_points=5)`

Train the gcn

Parameters:

Name	Type	Description	Default
`features`	`ndarray`	Input node embeddings passed to the gcn	required
`adjacency_matrix`	`ndarray`	Adjacency matrix passed to the gcn	required
`degree_array`	`ndarray`	Node degrees passed to the gcn	required
`target`	`ndarray`	Target values handed to the loss function	required
`learning_rate`	`float`	Parameter of the gradient based optimisation method	required
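`num_iters`	`int`	Number of iterations of the gradient based optimisation method	`10`
`num_check_points`	`int`	Controls how often loss and metrics are printed (roughly every `num_iters / num_check_points` iterations)	`5`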

Returns:

Type	Description
	Trained gcn

Source code in scirex/core/dl/gcn.py

def fit(
    self,
    features: jnp.ndarray,
    adjacency_matrix: jnp.ndarray,
    degree_array: jnp.ndarray,
    target: jnp.ndarray,
    learning_rate: float,
    num_iters: int = 10,
    num_check_points: int = 5,
):
    """
    Train the gcn

    Args:
        features: Input node embeddings passed to the gcn
        adjacency_matrix: Adjacency matrix passed to the gcn
        degree_array: Node degrees passed to the gcn
        target: Target values handed to the update step
        learning_rate: Parameter of the gradient based optimisation method
        num_iters: Number of iterations of the gradient based optimisation method
        num_check_points: Approximate number of progress reports printed
            during training; a value <= 0 disables reporting

    Returns:
        Trained gcn
    """
    gcn = self.gcn

    self.optimizer = optax.adam(learning_rate)
    opt_state = self.optimizer.init(eqx.filter(gcn, eqx.is_array))

    # Integer gap: a float gap (num_iters / num_check_points) only matches
    # `iter_id % gap == 0` when the division is exact, and dividing by a
    # zero checkpoint count would raise.
    if num_check_points > 0:
        check_point_gap = max(1, num_iters // num_check_points)
    else:
        check_point_gap = None

    for iter_id in tqdm(range(num_iters), desc="Training", total=num_iters):

        loss, gcn, opt_state = self._update_step(
            gcn, features, adjacency_matrix, degree_array, target, opt_state
        )

        if check_point_gap is not None and iter_id % check_point_gap == 0:
            output = gcn(features, adjacency_matrix, degree_array)
            metric_vals = [m(output) for m in self.metrics]
            print(f"Iter: {iter_id} | Loss: {loss:.2e} | Metrics {metric_vals}")

    return gcn

gcn

GCN

__call__(z, adj_mat, degree)

__init__(layers, activations, key)

GCNModel

__init__(gcn, loss_fn, metrics=[])

fit(features, adjacency_matrix, degree_array, target, learning_rate, num_iters=10, num_check_points=5)

`GCN`

`call(z, adj_mat, degree)`

`init(layers, activations, key)`

`GCNModel`

`init(gcn, loss_fn, metrics=[])`

`fit(features, adjacency_matrix, degree_array, target, learning_rate, num_iters=10, num_check_points=5)`