Source code for gflownet.policy.simple_tree

from typing import Optional

import torch
import torch_geometric
from torch_geometric.data import Batch
from torch_geometric.nn import global_add_pool

from gflownet.envs.tree import Tree
from gflownet.policy.base import Policy



[docs]
class Backbone(torch.nn.Module):
    """
    GNN backbone: a stack of GNN layers that can be used for processing graphs.
    """

    def __init__(
        self,
        input_dim: int,
        n_layers: int = 3,
        hidden_dim: int = 128,
        layer: str = "GINEConv",
        activation: str = "LeakyReLU",
    ):
        super().__init__()


[docs]
        self.hidden_dim = hidden_dim


        layer = getattr(torch_geometric.nn, layer)
        activation = getattr(torch.nn, activation)

        layers = []
        for i in range(n_layers):
            layers.append(
                (
                    layer(
                        torch.nn.Linear(
                            input_dim if i == 0 else hidden_dim, hidden_dim
                        ),
                        edge_dim=2,
                    ),
                    "x, edge_index, edge_attr -> x",
                )
            )
            layers.append(activation())


[docs]
        self.model = torch_geometric.nn.Sequential(
            "x, edge_index, edge_attr, batch", layers
        )



[docs]
    def forward(self, data: torch_geometric.data.Data) -> torch.Tensor:
        x, edge_index, edge_attr, batch = (
            data.x,
            data.edge_index,
            data.edge_attr,
            data.batch,
        )

        return self.model(x, edge_index, edge_attr, batch)





[docs]
class Head(torch.nn.Module):
    """
    GNN head: a combination of a pooling layer and a stack of linear layers,
    that takes the input graphs processed by the provided backbone and outputs
    ``out_dim`` values.

    This is a naive variant of a Tree policy model, that in particular doesn't
    do any node-level prediction, but instead predicts the whole policy output
    all at once.
    """

    def __init__(
        self,
        backbone: torch.nn.Module,
        out_dim: int,
        n_layers: int = 2,
        hidden_dim: int = 256,
        activation: str = "LeakyReLU",
    ):
        super().__init__()


[docs]
        self.backbone = backbone


        activation = getattr(torch.nn, activation)

        layers = []
        for i in range(n_layers):
            layers.append(
                torch.nn.Linear(
                    backbone.hidden_dim if i == 0 else hidden_dim,
                    out_dim if i == n_layers - 1 else hidden_dim,
                )
            )
            if i < n_layers - 1:
                layers.append(activation())


[docs]
        self.head = torch.nn.Sequential(*layers)



[docs]
    def forward(self, data: torch_geometric.data.Data) -> (torch.Tensor, torch.Tensor):
        x, edge_index, edge_attr, k, batch = (
            data.x,
            data.edge_index,
            data.edge_attr,
            data.k,
            data.batch,
        )
        x = self.backbone(data)
        x = global_add_pool(x, batch)
        x = self.head(x)

        return x





[docs]
class SimpleTreeModel(torch.nn.Module):
    """
    Combination of backbone and head models. In forward, it converts the states
    to a batch of graphs, and passes them through both models.
    """

    def __init__(
        self,
        n_features: int,
        policy_output_dim: int,
        base: Optional["SimpleTreePolicy"] = None,
        backbone_args: Optional[dict] = None,
        head_args: Optional[dict] = None,
    ):
        super().__init__()


[docs]
        self.n_features = n_features


[docs]
        self.policy_output_dim = policy_output_dim


        if base is None:
            self.backbone = Backbone(**backbone_args)
        else:
            self.backbone = base.model.backbone


[docs]
        self.model = Head(
            backbone=self.backbone, out_dim=policy_output_dim, **head_args
        )



[docs]
    def forward(self, x):
        batch = Batch.from_data_list(
            [Tree.state2pyg(state, self.n_features) for state in x]
        )
        return self.model(batch)





[docs]
class SimpleTreePolicy(Policy):
    """
    Policy wrapper using SimpleTreeModel as the policy model.
    """

    def __init__(self, config, env, device, float_precision, base=None):

[docs]
        self.backbone_args = {"input_dim": env.get_pyg_input_dim()}


[docs]
        self.head_args = {}


[docs]
        self.n_features = env.n_features


[docs]
        self.policy_output_dim = env.policy_output_dim


        super().__init__(
            config=config,
            env=env,
            device=device,
            float_precision=float_precision,
            base=base,
        )


[docs]
        self.is_model = True



[docs]
    def parse_config(self, config):
        if config is not None:
            self.backbone_args.update(config.get("backbone_args", {}))
            self.head_args.update(config.get("head_args", {}))



[docs]
    def instantiate(self):
        self.model = SimpleTreeModel(
            n_features=self.n_features,
            policy_output_dim=self.policy_output_dim,
            base=self.base,
            backbone_args=self.backbone_args,
            head_args=self.head_args,
        ).to(self.device)



[docs]
    def __call__(self, states):
        return self.model(states)