Source code for gflownet.envs.tree

"""
IMPORTANT: this environment is not up to date.
"""

import pickle
import warnings
from collections import Counter
from pathlib import Path
from typing import List, Optional, Tuple, Union

import matplotlib.pyplot as plt
import networkx as nx
import numpy as np
import numpy.typing as npt
import pandas as pd
import torch
import torch.nn.functional as F
import torch_geometric as pyg
from networkx.drawing.nx_pydot import graphviz_layout
from sklearn.metrics import accuracy_score, balanced_accuracy_score
from sklearn.preprocessing import MinMaxScaler
from torch.distributions import Beta, Categorical, MixtureSameFamily, Uniform
from torchtyping import TensorType

from gflownet.envs.base import GFlowNetEnv



[docs]
class NodeType:
    """
    Encodes the two types of nodes present in a tree:
    0 - condition node (node other than leaf), that stores the information
        about on which feature to make the decision, and using what threshold.
    1 - classifier node (leaf), that stores the information about class output
        that will be predicted once that node is reached.
    """

    # Internal (non-leaf) node holding a feature index and a threshold.
    CONDITION = 0
    # Leaf node holding the predicted class.
    CLASSIFIER = 1





[docs]
class Operator:
    """
    Operator based on which the decision is made (< or >=).

    We assume the convention of having left child output label = 0
    and right child label = 1 if operator is <, and the opposite if
    operator is >=. That way, during prediction, we can act as if
    the operator was always the same (and only care about the output
    label).
    """

    # Strictly-less-than comparison (<).
    LT = 0
    # Greater-than-or-equal comparison (>=).
    GTE = 1





[docs]
class Status:
    """
    Status of the node. Every node except the one on which a macro step
    was initiated will be marked as inactive; the node will be marked
    as active iff the process of its splitting is in progress.
    """

    # Node is not currently being split.
    INACTIVE = 0
    # Node was picked and its macro step has not finished yet.
    ACTIVE = 1





[docs]
class Stage:
    """
    Current stage of the tree, encoded as part of the state.
    0 - complete, indicates that there is no macro step initiated, and
        the only allowed action is to pick one of the leaves for splitting.
    1 - leaf, indicates that a leaf was picked for splitting, and the only
        allowed action is picking a feature on which it will be split.
    2 - feature, indicates that a feature was picked, and the only allowed
        action is picking a threshold for splitting.
    3 - threshold, indicates that a threshold was picked, and the only
        allowed action is picking an operator.
    4 - operator, indicates that operator was picked. The only allowed
        action from here is finalizing the splitting process and spawning
        two new leaves, which should be done automatically, upon which
        the stage should be changed to complete.
    """

    COMPLETE = 0
    LEAF = 1
    FEATURE = 2
    THRESHOLD = 3
    OPERATOR = 4





[docs]
class ActionType:
    """
    Type of action that will be passed to Tree.step. Refer to Stage for details.
    """

    PICK_LEAF = 0
    PICK_FEATURE = 1
    PICK_THRESHOLD = 2
    PICK_OPERATOR = 3





[docs]
class Attribute:
    """
    Contains indices of individual attributes in a state tensor.

    Types of attributes defining each node of the tree:

        0 - node type (condition or classifier),
        1 - index of the feature used for splitting (condition node only, -1 otherwise),
        2 - decision threshold (condition node only, -1 otherwise),
        3 - class output (classifier node only, -1 otherwise), in the case of < operator
            the left child will have class = 0, and the right child will have class = 1;
            the opposite for the >= operator,
        4 - whether the node has active status (1 if node was picked and the macro step
            didn't finish yet, 0 otherwise).
    """

    TYPE = 0
    FEATURE = 1
    THRESHOLD = 2
    CLASS = 3
    ACTIVE = 4
    N = 5  # Total number of attributes.





[docs]
class Tree(GFlowNetEnv):
    """
    GFlowNet environment representing a decision tree.

    Constructing a tree consists of a combination of macro steps (picking a leaf
    to split using a given feature, threshold and operator), which are divided
    into a series of consecutive micro steps (1 - pick a leaf, 2 - pick a feature,
    3 - pick a threshold, 4 - pick an operator). A consequence of that is, as long
    as a macro step is not in progress, the tree constructed so far is always a
    valid decision tree, which means that forward-looking loss etc. can be used.

    Internally, the tree is represented as a fixed-shape tensor (thus, specifying
    the maximum depth is required), with nodes indexed from k = 0 to 2**max_depth - 2,
    and each node containing a 5-element attribute tensor (see class Attribute for
    details). The nodes are indexed from top left to bottom right, as follows:

                0
        1               2
    3       4       5       6

    States are represented by a tensor with shape [n_nodes + 1, 5], where each k-th row
    corresponds to the attributes of the k-th node of the tree. The last row contains
    the information about the stage of the tree (see class Stage).
    """

    def __init__(
        self,
        X_train: Optional[npt.NDArray] = None,
        y_train: Optional[npt.NDArray] = None,
        X_test: Optional[npt.NDArray] = None,
        y_test: Optional[npt.NDArray] = None,
        data_path: Optional[str] = None,
        scale_data: bool = True,
        max_depth: int = 10,
        continuous: bool = True,
        n_thresholds: Optional[int] = 9,
        threshold_components: int = 1,
        beta_params_min: float = 1.0,
        beta_params_max: float = 2.0,
        fixed_distr_params: Optional[dict] = None,
        random_distr_params: Optional[dict] = None,
        policy_format: str = "mlp",
        test_args: Optional[dict] = None,
        **kwargs,
    ):
        """
        Attributes
        ----------
        X_train : np.array
            Train dataset, with dimensionality (n_observations, n_features). It may be
            None if a data set is provided via data_path.

        y_train : np.array
            Train labels, with dimensionality (n_observations,). It may be
            None if a data set is provided via data_path.

        X_test : np.array
            Test dataset, with dimensionality (n_observations, n_features). It may be
            None if a data set is provided via data_path, or if you don't want to perform
            test set evaluation.

        y_test : np.array
            Test labels, with dimensionality (n_observations,). It may be
            None if a data set is provided via data_path, or if you don't want to perform
            test set evaluation.

        data_path : str
            A path to a data set, with the following options:
            - *.pkl: Pickled dict with X_train, y_train, and (optional) X_test and y_test
              variables.
            - *.csv: CSV containing an optional 'Split' column in the last place, containing
              'train' and 'test' values, and M remaining columns, where the first (M - 1)
              columns will be taken to construct the input X, and M-th column will be the
              target y.
            Ignored if X_train and y_train are not None.

        scale_data : bool
            Whether to perform min-max scaling on the provided data (to a [0; 1] range).

        max_depth : int
            Maximum depth of a tree.

        continuous : bool
            Whether the environment should operate in a continuous mode (in which distribution
            parameters are predicted for the threshold) or the discrete mode (in which there
            is a discrete set of possible thresholds to choose from).

        n_thresholds : int
            Number of uniformly distributed thresholds in a (0; 1) range that will be used
            in the discrete mode. Ignored if continuous is True.

        threshold_components : int
            The number of mixture components that will be used for sampling
            the threshold.

        beta_params_min : float
            Additive offset applied to the sigmoid of the policy outputs when computing
            the alpha and beta parameters of the Beta distributions.

        beta_params_max : float
            Multiplicative scale applied to the sigmoid of the policy outputs when
            computing the alpha and beta parameters of the Beta distributions.

        fixed_distr_params : dict
            Forwarded unchanged to GFlowNetEnv.__init__. If None, defaults to
            {"beta_alpha": 2.0, "beta_beta": 5.0}.

        random_distr_params : dict
            Forwarded unchanged to GFlowNetEnv.__init__. If None, defaults to
            {"beta_alpha": 1.0, "beta_beta": 1.0}.

        policy_format : str
            Type of policy that will be used with the environment, either 'mlp' or 'gnn'.
            Influences which state2policy functions will be used.

        test_args : dict
            Stored as self.test_args. If None, defaults to {"top_k_trees": 0}.

        Raises
        ------
        ValueError
            If no data set is provided, if y_train contains labels other than 0 and 1,
            if n_thresholds is None in the discrete mode, or if policy_format is not
            recognized.
        """
        # Build the default dictionaries per call, so that they are never shared
        # (and possibly mutated) across different Tree instances.
        if fixed_distr_params is None:
            fixed_distr_params = {"beta_alpha": 2.0, "beta_beta": 5.0}
        if random_distr_params is None:
            random_distr_params = {"beta_alpha": 1.0, "beta_beta": 1.0}
        if test_args is None:
            test_args = {"top_k_trees": 0}

        # Data set: explicit arrays take precedence over data_path.
        if X_train is not None and y_train is not None:
            self.X_train = X_train
            self.y_train = y_train
            if X_test is not None and y_test is not None:
                self.X_test = X_test
                self.y_test = y_test
            else:
                self.X_test = None
                self.y_test = None
        elif data_path is not None:
            self.X_train, self.y_train, self.X_test, self.y_test = Tree._load_dataset(
                data_path
            )
        else:
            raise ValueError(
                "A Tree must be initialised with a data set. X_train, y_train and data_path cannot "
                "be all None"
            )
        if scale_data:
            # The scaler is fit on the train set only and re-used for the test set.
            self.scaler = MinMaxScaler().fit(self.X_train)
            self.X_train = self.scaler.transform(self.X_train)
            if self.X_test is not None:
                self.X_test = self.scaler.transform(self.X_test)
        self.y_train = self.y_train.astype(int)
        if self.y_test is not None:
            self.y_test = self.y_test.astype(int)
        if not set(self.y_train).issubset({0, 1}):
            raise ValueError(
                f"Expected y_train to have values in {{0, 1}}, received {set(self.y_train)}."
            )
        self.n_features = self.X_train.shape[1]
        self.max_depth = max_depth
        self.continuous = continuous
        if not continuous:
            if n_thresholds is None:
                raise ValueError(
                    "n_thresholds must be provided when continuous is False."
                )
            # Uniformly spaced thresholds strictly inside (0, 1).
            self.thresholds = np.linspace(0, 1, n_thresholds + 2)[1:-1]
        self.test_args = test_args
        # Parameters of the policy distribution
        self.components = threshold_components
        self.beta_params_min = beta_params_min
        self.beta_params_max = beta_params_max
        # Source will contain information about the current stage (on the last position),
        # and up to 2**max_depth - 1 nodes, each with Attribute.N attributes, for a total of
        # 1 + Attribute.N * (2**max_depth - 1) values. The root (0-th node) of the
        # source is initialized with a classifier.
        self.n_nodes = 2**max_depth - 1
        self.source = torch.full((self.n_nodes + 1, Attribute.N), torch.nan)
        self._set_stage(Stage.COMPLETE, self.source)
        attributes_root = self.source[0]
        attributes_root[Attribute.TYPE] = NodeType.CLASSIFIER
        attributes_root[Attribute.FEATURE] = -1
        attributes_root[Attribute.THRESHOLD] = -1
        # The root predicts the most frequent class of the train set.
        self.default_class = Counter(self.y_train).most_common()[0][0]
        attributes_root[Attribute.CLASS] = self.default_class
        attributes_root[Attribute.ACTIVE] = Status.INACTIVE

        # End-of-sequence action.
        self.eos = (-1, -1, -1)

        # Conversions
        # NOTE(review): no states2policy override is installed here for 'gnn';
        # presumably it is provided elsewhere - confirm.
        policy_format = policy_format.lower()
        if policy_format == "mlp":
            self.states2policy = self.states2policy_mlp
        elif policy_format != "gnn":
            raise ValueError(
                f"Unrecognized policy_format = {policy_format}, expected either 'mlp' or 'gnn'."
            )

        super().__init__(
            fixed_distr_params=fixed_distr_params,
            random_distr_params=random_distr_params,
            continuous=continuous,
            **kwargs,
        )

    @staticmethod
    def _get_parent(k: int) -> Optional[int]:
        """
        Get node index of a parent of k-th node.
        """
        if k == 0:
            return None
        return (k - 1) // 2

    @staticmethod
    def _get_left_child(k: int) -> int:
        """
        Get node index of a left child of k-th node.
        """
        return 2 * k + 1

    @staticmethod
    def _get_right_child(k: int) -> int:
        """
        Get node index of a right child of k-th node.
        """
        return 2 * k + 2

    @staticmethod
    def _get_sibling(k: int) -> Optional[int]:
        """
        Get node index of the sibling of k-th node.
        """
        parent = Tree._get_parent(k)
        if parent is None:
            return None
        left = Tree._get_left_child(parent)
        right = Tree._get_right_child(parent)
        return left if k == right else right

    def _get_stage(self, state: Optional[torch.Tensor] = None) -> int:
        """
        Reads the stage stored at position [-1, 0] of the state resolved by
        self._get_state(state), that is either the state passed as an argument or
        the state of the environment.
        """
        resolved = self._get_state(state)
        stage = resolved[-1, 0]
        return stage

    def _set_stage(
        self, stage: int, state: Optional[torch.Tensor] = None
    ) -> torch.Tensor:
        """
        Writes the stage into position [-1, 0] of the state resolved by
        self._get_state(state), that is either the state passed as an argument or
        the state of the environment, and returns the updated state.
        """
        target = self._get_state(state)
        target[-1, 0] = stage
        return target

    def _pick_leaf(self, k: int) -> None:
        """
        Initiates a macro step by selecting the k-th node, which must be an inactive
        leaf (classifier node), as the node that will be split.
        """
        node = self.state[k]

        # Preconditions: no macro step in progress and k is a regular, inactive leaf.
        assert self._get_stage() == Stage.COMPLETE
        assert node[Attribute.TYPE] == NodeType.CLASSIFIER
        assert not torch.isnan(node).any()
        assert torch.all(node[Attribute.FEATURE : Attribute.THRESHOLD + 1] == -1)
        assert node[Attribute.ACTIVE] == Status.INACTIVE

        # The leaf becomes an active condition node with feature, threshold and
        # class reset to -1.
        node[Attribute.TYPE] = NodeType.CONDITION
        node[Attribute.FEATURE : Attribute.CLASS + 1] = -1
        node[Attribute.ACTIVE] = Status.ACTIVE

        self._set_stage(Stage.LEAF)

    def _pick_feature(self, k: int, feature: float) -> None:
        """
        Stores the feature on which the currently selected (active) node k will be
        split and moves the stage to FEATURE.
        """
        node = self.state[k]

        # Preconditions: a leaf was just picked and nothing else has been set yet.
        assert self._get_stage() == Stage.LEAF
        assert node[Attribute.TYPE] == NodeType.CONDITION
        assert torch.all(node[Attribute.FEATURE : Attribute.CLASS + 1] == -1)
        assert node[Attribute.ACTIVE] == Status.ACTIVE

        node[Attribute.FEATURE] = feature

        self._set_stage(Stage.FEATURE)

    def _pick_threshold(self, k: int, threshold: float) -> None:
        """
        Stores the threshold for splitting the currently selected (active) node k on
        the previously selected feature and moves the stage to THRESHOLD.
        """
        node = self.state[k]

        # Preconditions: the feature is set, threshold and class are still unset.
        assert self._get_stage() == Stage.FEATURE
        assert node[Attribute.TYPE] == NodeType.CONDITION
        assert node[Attribute.FEATURE] >= 0
        assert torch.all(node[Attribute.THRESHOLD : Attribute.CLASS + 1] == -1)
        assert node[Attribute.ACTIVE] == Status.ACTIVE

        node[Attribute.THRESHOLD] = threshold

        self._set_stage(Stage.THRESHOLD)

    def _pick_operator(self, k: int, operator: float) -> None:
        """
        Stores the operator (< or >=) for splitting the currently selected leaf with
        the selected feature and threshold. The operator is temporarily encoded in
        the class attribute of the node, and the final splitting is triggered right
        away.
        """
        node = self.state[k]

        # Preconditions: feature and threshold are set, the class slot is still free.
        assert self._get_stage() == Stage.THRESHOLD
        assert node[Attribute.TYPE] == NodeType.CONDITION
        assert torch.all(node[Attribute.FEATURE : Attribute.THRESHOLD + 1] >= 0)
        assert node[Attribute.CLASS] == -1
        assert node[Attribute.ACTIVE] == Status.ACTIVE

        node[Attribute.CLASS] = operator

        self._set_stage(Stage.OPERATOR)

        self._split_leaf(k)

    def _split_leaf(self, k: int) -> None:
        """
        Completes the macro step on node k: using the feature, threshold and operator
        already stored in the node, spawns its two children as classifier nodes and
        turns the node into a regular, inactive condition node.

        Convention: with the < operator the left child outputs label 0 and the right
        child outputs label 1; with the >= operator the labels are swapped. Thanks to
        that, prediction can proceed as if the operator was always the same, and only
        the output labels matter.
        """
        node = self.state[k]

        assert self._get_stage() == Stage.OPERATOR
        assert node[Attribute.TYPE] == NodeType.CONDITION
        assert torch.all(node[Attribute.FEATURE : Attribute.CLASS + 1] >= 0)
        assert node[Attribute.ACTIVE] == Status.ACTIVE

        # The operator is temporarily stored in the class attribute of the node.
        if node[Attribute.CLASS] == Operator.LT:
            output_left, output_right = 0, 1
        else:
            output_left, output_right = 1, 0

        child_left = Tree._get_left_child(k)
        child_right = Tree._get_right_child(k)
        self._insert_classifier(child_left, output=output_left)
        self._insert_classifier(child_right, output=output_right)

        # Clear the temporary operator and close the macro step.
        node[Attribute.CLASS] = -1
        node[Attribute.ACTIVE] = Status.INACTIVE

        self._set_stage(Stage.COMPLETE)

    def _insert_classifier(self, k: int, output: int) -> None:
        """
        Turns the (so far empty, i.e. all-NaN) k-th node into an inactive classifier
        node that predicts the class given by output.
        """
        node = self.state[k]

        # The slot must not be in use yet.
        assert torch.isnan(node).all()

        node[Attribute.TYPE] = NodeType.CLASSIFIER
        node[Attribute.CLASS] = output
        node[Attribute.ACTIVE] = Status.INACTIVE
        # Feature and threshold only apply to condition nodes.
        node[Attribute.FEATURE] = -1
        node[Attribute.THRESHOLD] = -1


[docs]
    def get_action_space(self) -> List[Tuple[int, int, int]]:
        """
        Builds the list of actions. Each action is a tuple containing:
            1) action type:
                0 - pick leaf to split,
                1 - pick feature,
                2 - pick threshold,
                3 - pick operator,
            2) node index,
            3) action value, depending on the action type:
                pick leaf: current class output,
                pick feature: feature index,
                pick threshold: threshold value,
                pick operator: operator index.

        As a side effect, the index of the first action of each type (and of EOS)
        is stored in the self._action_index_* attributes.
        """
        # Pick leaf
        # The node index is the outer loop, to be compatible with flattening in the
        # GNN-based policy.
        self._action_index_pick_leaf = 0
        actions = [
            (ActionType.PICK_LEAF, node_idx, output)
            for node_idx in range(self.n_nodes)
            for output in [0, 1]
        ]

        # Pick feature
        self._action_index_pick_feature = len(actions)
        actions += [
            (ActionType.PICK_FEATURE, -1, feat_idx)
            for feat_idx in range(self.n_features)
        ]

        # Pick threshold
        self._action_index_pick_threshold = len(actions)
        if self.continuous:
            # A single representative action stands for all continuous thresholds.
            actions.append((ActionType.PICK_THRESHOLD, -1, -1))
        else:
            actions += [
                (ActionType.PICK_THRESHOLD, -1, thr_idx)
                for thr_idx, _ in enumerate(self.thresholds)
            ]

        # Pick operator
        # The node index is the outer loop, to be compatible with flattening in the
        # GNN-based policy.
        self._action_index_pick_operator = len(actions)
        actions += [
            (ActionType.PICK_OPERATOR, node_idx, operator)
            for node_idx in range(self.n_nodes)
            for operator in [Operator.LT, Operator.GTE]
        ]

        # EOS
        self._action_index_eos = len(actions)
        actions.append(self.eos)

        return actions



[docs]
    def step(
        self, action: Tuple[int, int, Union[int, float]], skip_mask_check: bool = False
    ) -> Tuple[List[int], Tuple[int, int, Union[int, float]], bool]:
        """
        Executes a forward step given an action.

        Args
        ----
        action : tuple
            Action to be executed.
            See: self.get_action_space()

        skip_mask_check : bool
            If True, skip computing forward mask of invalid actions to check if the
            action is valid.

        Returns
        -------
        self.state : list
            The state after executing the action

        action : tuple
            Action executed

        valid : bool
            False, if the action is not allowed for the current state.
        """
        # The validity check is done on the representative of the action, in which
        # the continuous value of the threshold is replaced by -1.
        representative = self.action2representative(action)
        do_step, self.state, representative = self._pre_step(
            representative,
            skip_mask_check=(skip_mask_check or self.skip_mask_check),
        )
        if not do_step:
            return self.state, action, False

        self.n_actions += 1

        if action != self.eos:
            action_type, k, action_value = action

            # Any action other than picking a leaf may refer to the active node
            # implicitly via k = -1.
            if action_type != ActionType.PICK_LEAF and k == -1:
                k = self.find_active(self.state)

            if action_type == ActionType.PICK_LEAF:
                self._pick_leaf(k)
            elif action_type == ActionType.PICK_FEATURE:
                self._pick_feature(k, action_value)
            elif action_type == ActionType.PICK_THRESHOLD:
                # In the discrete mode the action value is an index into the set
                # of thresholds.
                threshold = (
                    action_value if self.continuous else self.thresholds[action_value]
                )
                self._pick_threshold(k, threshold)
            elif action_type == ActionType.PICK_OPERATOR:
                self._pick_operator(k, action_value)
            else:
                raise NotImplementedError(f"Unrecognized action type: {action_type}.")
        else:
            self.done = True

        return self.state, action, True



[docs]
    def step_backwards(
        self, action: Tuple[int], skip_mask_check: bool = False
    ) -> Tuple[List[int], Tuple[int], bool]:
        """
        Executes a backward step given an action, by delegating to the parent class
        with the representative of the action.

        Args
        ----
        action : tuple
            Action from the action space.

        skip_mask_check : bool
            If True, skip computing forward mask of invalid actions to check if the
            action is valid.

        Returns
        -------
        self.state : list
            The state after executing the action.

        action : int
            Given action.

        valid : bool
            False, if the action is not allowed for the current state.
        """
        # The parent class operates on the representative of the action, in which
        # the continuous value of the threshold is replaced by -1.
        representative = self.action2representative(action)
        _state, _action, valid = super().step_backwards(
            representative, skip_mask_check=skip_mask_check
        )
        # The original action (not its representative) is handed back to the caller.
        return self.state, action, valid



[docs]
    def set_state(self, state: List, done: Optional[bool] = False):
        """
        Sets the state and done. If done is True but incompatible with state (Stage is
        not COMPLETE), then force done False and print warning.

        Args
        ----
        state : tensor
            State to be set.

        done : bool
            Whether the state being set should be marked as done.

        Returns
        -------
        The return value of the set_state method of the parent class.
        """
        # The compatibility check must be done on the state being set, not on the
        # state currently held by the environment.
        if done is True and self._get_stage(state) != Stage.COMPLETE:
            done = False
            warnings.warn(f"""
            Attempted to set state {self.state2readable(state)} with done = True, which
            is not compatible with the environment. Forcing done = False.
            """)
        return super().set_state(state, done)


    # TODO: needs to be updated

[docs]
    def sample_actions_batch_continuous(
        self,
        policy_outputs: TensorType["n_states", "policy_output_dim"],
        mask: Optional[TensorType["n_states", "policy_output_dim"]] = None,
        states_from: Optional[List] = None,
        is_backward: Optional[bool] = False,
        random_action_prob: Optional[float] = 0.0,
        temperature_logits: Optional[float] = 1.0,
    ) -> Tuple[List[Tuple], TensorType["n_states"]]:
        """
        Samples a batch of actions from a batch of policy outputs in the continuous mode.

        Rows of the batch are split in two groups according to the column of the mask
        at the index of the pick-threshold action: rows where it is True are sampled
        by the parent class from the first self._index_continuous_policy_output
        policy outputs; for the remaining rows, a threshold is sampled from a mixture
        of Beta distributions parameterized by the rest of the policy outputs.

        Although mask defaults to None, it is indexed unconditionally, so it has to
        be provided. states_from is not used.

        NOTE(review): the return annotation is a tuple, but the continuous and mixed
        paths return a plain list of actions - confirm against the parent class.
        """
        n_states = policy_outputs.shape[0]
        # Discrete actions
        # Presumably True in the mask marks an invalid action, so the rows in which
        # picking a threshold is masked need a discrete action - TODO confirm.
        is_discrete = mask[:, self._action_index_pick_threshold]
        if torch.any(is_discrete):
            policy_outputs_discrete = policy_outputs[
                is_discrete, : self._index_continuous_policy_output
            ]
            # states_from can be None because it will be ignored
            actions_discrete = super().sample_actions_batch(
                policy_outputs_discrete,
                mask[is_discrete, : self._index_continuous_policy_output],
                None,
                is_backward,
                random_action_prob,
                temperature_logits,
            )
        if torch.all(is_discrete):
            return actions_discrete
        # Continuous actions
        is_continuous = torch.logical_not(is_discrete)
        n_cont = is_continuous.sum()
        policy_outputs_cont = policy_outputs[
            is_continuous, self._index_continuous_policy_output :
        ]
        # The continuous outputs are interleaved in groups of three values per
        # mixture component: mixture logit, alpha and beta.
        mix_logits = policy_outputs_cont[:, 0::3]
        mix = Categorical(logits=mix_logits)
        alphas = policy_outputs_cont[:, 1::3]
        # The sigmoid is scaled by beta_params_max and shifted by beta_params_min.
        alphas = self.beta_params_max * torch.sigmoid(alphas) + self.beta_params_min
        betas = policy_outputs_cont[:, 2::3]
        betas = self.beta_params_max * torch.sigmoid(betas) + self.beta_params_min
        beta_distr = Beta(alphas, betas)
        distr_threshold = MixtureSameFamily(mix, beta_distr)
        thresholds = distr_threshold.sample()
        # Build actions
        actions_cont = [(ActionType.PICK_THRESHOLD, -1, th.item()) for th in thresholds]
        # Merge discrete and continuous actions back in the original batch order.
        actions = []
        for is_discrete_i in is_discrete:
            if is_discrete_i:
                actions.append(actions_discrete.pop(0))
            else:
                actions.append(actions_cont.pop(0))
        return actions



[docs]
    def sample_actions_batch(
        self,
        policy_outputs: TensorType["n_states", "policy_output_dim"],
        mask: Optional[TensorType["n_states", "policy_output_dim"]] = None,
        states_from: Optional[List] = None,
        is_backward: Optional[bool] = False,
        random_action_prob: Optional[float] = 0.0,
        temperature_logits: Optional[float] = 1.0,
    ) -> Tuple[List[Tuple], TensorType["n_states"]]:
        """
        Samples a batch of actions from a batch of policy outputs, dispatching to
        the continuous sampler in the continuous mode and to the parent class
        otherwise. All arguments are forwarded unchanged.
        """
        sampler = (
            self.sample_actions_batch_continuous
            if self.continuous
            else super().sample_actions_batch
        )
        return sampler(
            policy_outputs=policy_outputs,
            mask=mask,
            states_from=states_from,
            is_backward=is_backward,
            random_action_prob=random_action_prob,
            temperature_logits=temperature_logits,
        )


[docs]
    def get_logprobs_continuous(
        self,
        policy_outputs: TensorType["n_states", "policy_output_dim"],
        actions: Union[List, TensorType["n_states", "action_dim"]],
        mask: TensorType["n_states", "1"] = None,
        states_from: Optional[List] = None,
        is_backward: bool = False,
    ) -> TensorType["batch_size"]:
        """
        Computes log probabilities of actions given policy outputs and actions in the
        continuous mode.

        Rows of the batch are split in two groups according to the column of the mask
        at the index of the pick-threshold action: for rows where it is True, the
        log probabilities are computed by the parent class from the first
        self._index_continuous_policy_output policy outputs; for the remaining rows,
        the log probability of the threshold (last element of the action) is computed
        under a mixture of Beta distributions parameterized by the rest of the policy
        outputs.

        Although mask defaults to None, it is indexed unconditionally, so it has to
        be provided. states_from is not used.
        """
        # Imported locally because tfloat is not among the module-level imports.
        from gflownet.utils.common import tfloat

        actions = tfloat(actions, float_type=self.float, device=self.device)
        n_states = policy_outputs.shape[0]
        logprobs = torch.zeros(n_states, device=self.device, dtype=self.float)
        # Discrete actions
        # Presumably True in the mask marks an invalid action, so the rows in which
        # picking a threshold is masked correspond to discrete actions - TODO confirm.
        mask_discrete = mask[:, self._action_index_pick_threshold]
        if torch.any(mask_discrete):
            policy_outputs_discrete = policy_outputs[
                mask_discrete, : self._index_continuous_policy_output
            ]
            # states_from can be None because it will be ignored
            logprobs_discrete = super().get_logprobs(
                policy_outputs_discrete,
                actions[mask_discrete],
                mask[mask_discrete, : self._index_continuous_policy_output],
                None,
                is_backward,
            )
            logprobs[mask_discrete] = logprobs_discrete
        if torch.all(mask_discrete):
            return logprobs
        # Continuous actions
        mask_cont = torch.logical_not(mask_discrete)
        policy_outputs_cont = policy_outputs[
            mask_cont, self._index_continuous_policy_output :
        ]
        # The continuous outputs are interleaved in groups of three values per
        # mixture component: mixture logit, alpha and beta.
        mix_logits = policy_outputs_cont[:, 0::3]
        mix = Categorical(logits=mix_logits)
        # The sigmoid is scaled by beta_params_max and shifted by beta_params_min.
        alphas = policy_outputs_cont[:, 1::3]
        alphas = self.beta_params_max * torch.sigmoid(alphas) + self.beta_params_min
        betas = policy_outputs_cont[:, 2::3]
        betas = self.beta_params_max * torch.sigmoid(betas) + self.beta_params_min
        beta_distr = Beta(alphas, betas)
        distr_threshold = MixtureSameFamily(mix, beta_distr)
        # The threshold is the last element of each action.
        thresholds = actions[mask_cont, -1]
        logprobs[mask_cont] = distr_threshold.log_prob(thresholds)
        return logprobs



[docs]
    def get_logprobs(
        self,
        policy_outputs: TensorType["n_states", "policy_output_dim"],
        actions: Union[List, TensorType["n_states", "action_dim"]],
        mask: TensorType["n_states", "1"] = None,
        states_from: Optional[List] = None,
        is_backward: bool = False,
    ) -> TensorType["batch_size"]:
        """
        Computes log probabilities of actions given policy outputs and actions,
        dispatching to the continuous implementation in the continuous mode and to
        the parent class otherwise. All arguments are forwarded unchanged.
        """
        if not self.continuous:
            return super().get_logprobs(
                policy_outputs,
                actions,
                mask,
                states_from,
                is_backward,
            )
        return self.get_logprobs_continuous(
            policy_outputs,
            actions,
            mask,
            states_from,
            is_backward,
        )



[docs]
    def states2policy_mlp(
        self,
        states: Union[
            List[TensorType["state_dim"]], TensorType["batch_size", "state_dim"]
        ],
    ) -> TensorType["batch_size", "policy_input_dim"]:
        """
        Prepares a batch of states in torch "GFlowNet format" for an MLP policy model.
        It replaces the NaNs by -2s, removes the activity attribute, and explicitly
        appends the attribute vector of the active node (if present).

        The input is not modified: the NaN replacement is done out of place.

        Args
        ----
        states : list or tensor
            Batch of states, either as a list of state tensors (which will be
            stacked) or as a single batched tensor.

        Returns
        -------
        A tensor with one flattened row per state.
        """
        if isinstance(states, list):
            states = torch.stack(states)
        # Number of attributes kept in the policy input: all the attributes that
        # precede the activity attribute.
        n_kept = Attribute.ACTIVE
        # Locate the active node (if any) of each state; the last row of a state
        # holds the stage, hence it is excluded.
        rows, cols = torch.where(states[:, :-1, Attribute.ACTIVE] == Status.ACTIVE)
        # States without an active node keep the -2 filler.
        active_features = torch.full(
            (states.shape[0], 1, n_kept),
            -2.0,
            dtype=states.dtype,
            device=states.device,
        )
        active_features[rows] = states[rows, cols, :n_kept].unsqueeze(1)
        # Out-of-place replacement, so that the tensor owned by the caller keeps
        # its NaNs (which mark unused nodes).
        states = states.masked_fill(states.isnan(), -2)
        states = torch.cat([states[:, :, :n_kept], active_features], dim=1)
        return states.flatten(start_dim=1)


    def _attributes_to_readable(self, attributes: List) -> str:
        """
        Converts the attributes of a single node into a human-readable string.
        Returns an empty string if the node type is neither condition nor classifier.
        """
        # Node type
        node_type = attributes[Attribute.TYPE]
        if node_type == NodeType.CONDITION:
            pieces = ["condition, "]
        elif node_type == NodeType.CLASSIFIER:
            pieces = ["classifier, "]
        else:
            return ""
        # Feature
        pieces.append(f"feat. {str(attributes[Attribute.FEATURE])}, ")
        # Decision threshold: only condition nodes may have one
        threshold = attributes[Attribute.THRESHOLD]
        if threshold != -1:
            assert node_type == NodeType.CONDITION
            pieces.append(f"th. {str(threshold)}, ")
        else:
            pieces.append("th. -1, ")
        # Class output: only classifier nodes may have one
        class_output = attributes[Attribute.CLASS]
        if class_output != -1:
            assert node_type == NodeType.CLASSIFIER
            pieces.append(f"class {str(class_output)}, ")
        else:
            pieces.append("class -1, ")
        # Active status
        pieces.append(
            " (active)" if attributes[Attribute.ACTIVE] == Status.ACTIVE else ""
        )
        return "".join(pieces)


[docs]
    def state2readable(self, state=None):
        """
        Converts a state into a human-readable string: one "index: attributes"
        entry per node with a non-empty description, followed by the stage, all
        separated by " | ".
        """
        # TODO: call to _get_state(state) might need do_copy=True
        array = self._get_state(state).cpu().numpy()
        described = (
            (node, self._attributes_to_readable(array[node]))
            for node in range(self.n_nodes)
        )
        # Nodes with an empty description are left out.
        chunks = [f"{node}: {text}" for node, text in described if len(text) != 0]
        chunks.append(f"stage: {self._get_stage(array)}")
        return " | ".join(chunks)


    def _readable_to_attributes(self, readable: str) -> List:
        """
        Parses the human-readable description of a single node back into its list
        of attributes: [type, feature, threshold, class output, activity].
        """

        def _number_after(field: str, prefix: str) -> float:
            # Numeric value that follows the given prefix in a field.
            return float(field.split(prefix)[-1])

        fields = readable.split(", ")
        # Node type (-1 if the name is not recognized)
        known_types = {
            "condition": NodeType.CONDITION,
            "classifier": NodeType.CLASSIFIER,
        }
        node_type = known_types.get(fields[0], -1)
        # Feature, decision threshold and class output
        feature = _number_after(fields[1], "feat. ")
        threshold = _number_after(fields[2], "th. ")
        class_output = _number_after(fields[3], "class ")
        # Active
        active = Status.ACTIVE if "(active)" in readable else Status.INACTIVE
        return [node_type, feature, threshold, class_output, active]


[docs]
    def readable2state(self, readable):
        """
        Converts a human-readable representation of a state into the standard format.

        Every " | "-separated chunk except the last one describes a node as
        "index: attributes"; the last chunk carries the stage. Nodes that are not
        mentioned keep NaN attributes.
        """
        *node_chunks, stage_chunk = readable.split(" | ")
        state = torch.full((self.n_nodes + 1, Attribute.N), torch.nan)
        for chunk in node_chunks:
            index_str, attributes_str = chunk.split(": ")
            node = int(index_str)
            values = self._readable_to_attributes(attributes_str)
            for column, value in enumerate(values):
                state[node, column] = value
        stage = float(stage_chunk.split("stage: ")[-1])
        return self._set_stage(stage, state)


    @staticmethod
    def _find_leaves(state: torch.Tensor) -> List[int]:
        """
        Returns the indices of the classifier nodes (leaves) of a state. The last
        row of the state is not inspected.
        """
        is_leaf = state[:-1, Attribute.TYPE] == NodeType.CLASSIFIER
        (leaf_indices,) = torch.nonzero(is_leaf, as_tuple=True)
        return leaf_indices.tolist()

    @staticmethod

[docs]
    def find_active(state: torch.Tensor) -> int:
        """
        Returns the index of the single active node of a state.

        Expects exactly one active node to exist (i.e. a macro step is in
        progress); this is enforced with an assertion.
        """
        is_active = state[:-1, Attribute.ACTIVE] == Status.ACTIVE
        (active_indices,) = torch.where(is_active)
        assert len(active_indices) == 1
        return active_indices.item()


    @staticmethod

[docs]
    def get_n_nodes(state: torch.Tensor) -> int:
        """
        Returns the number of nodes in a tree represented by the given state.

        A node is counted when its type attribute is not NaN; the last row of the
        state is excluded from the count.

        The count is returned as a plain Python int, as announced by the signature,
        instead of a 0-dim tensor, so that it can be consumed by numpy (e.g.
        np.mean over a list of counts) regardless of the device of the state.
        """
        node_exists = ~torch.isnan(state[:-1, Attribute.TYPE])
        return int(node_exists.sum().item())



[docs]
    def get_policy_output_continuous(
        self, params: dict
    ) -> TensorType["policy_output_dim"]:
        """
        Builds the template of the policy output for the continuous version of the
        environment, initialised from the values in params.

        The policy output is the concatenation of two parts:

          - Discrete part (first): one entry per discrete action
            (self.action_space_dim entries), all initialised to one.
          - Continuous part (second): the parameters of the distribution of the
            single continuous action, namely the sampling of the threshold. It is
            modelled by a mixture of Beta distributions, hence this part has
            c * 3 entries, with c the number of components (self.components).
            For each component, in this order:

              1) the weight of the component in the mixture (initialised to one)
              2) the logit(alpha) parameter of the Beta distribution
                 (initialised to params["beta_alpha"])
              3) the logit(beta) parameter of the Beta distribution
                 (initialised to params["beta_beta"])

        As a side effect, the start index and the length of the continuous part
        are stored in self._index_continuous_policy_output and
        self._len_continuous_policy_output.

        Note: unlike in other environments mixing discrete and continuous
        distributions (for instance to allow sampling EOS instead of a continuous
        action), no mixture between both is needed here, because the continuous
        action is either the only valid action or not valid at all.
        """
        tensor_kwargs = {"device": self.device, "dtype": self.float}

        discrete_part = torch.ones(self.action_space_dim, **tensor_kwargs)
        self._index_continuous_policy_output = discrete_part.shape[0]
        self._len_continuous_policy_output = self.components * 3

        # One row per mixture component: [weight, logit(alpha), logit(beta)].
        mixture = torch.ones((self.components, 3), **tensor_kwargs)
        mixture[:, 1] = params["beta_alpha"]
        mixture[:, 2] = params["beta_beta"]

        return torch.cat([discrete_part, mixture.flatten()])



[docs]
    def get_policy_output(self, params: dict) -> TensorType["policy_output_dim"]:
        """
        Returns the template of the policy output: the continuous variant if the
        environment is continuous, the one of the parent class otherwise.
        """
        if not self.continuous:
            return super().get_policy_output(params=params)
        return self.get_policy_output_continuous(params=params)



[docs]
    def get_mask_invalid_actions_forward(
        self, state: Optional[torch.Tensor] = None, done: Optional[bool] = None
    ) -> List[bool]:
        """
        Computes the mask of invalid forward actions of a state: a list with
        self.policy_output_dim entries where True marks an invalid action and
        False a valid one. If done, every action is invalid.

        Which actions are valid depends on the stage of the state:
          - complete: picking a leaf that can still be split, or EOS
          - leaf: picking a feature
          - feature: picking a threshold
          - threshold: picking an operator for the active node

        Raises ValueError if the stage is not one of the above.
        """
        state = self._get_state(state)
        done = self._get_done(done)

        mask = [True] * self.policy_output_dim
        if done:
            return mask

        leaves = Tree._find_leaves(state)
        stage = self._get_stage(state)

        if stage == Stage.COMPLETE:
            # No micro step is ongoing: a leaf may be picked, provided that its
            # children would still fit in the tree (max depth), or EOS.
            for leaf in leaves:
                if not Tree._get_right_child(leaf) < self.n_nodes:
                    continue
                leaf_class = state[leaf, Attribute.CLASS].long()
                mask[self._action_index_pick_leaf + 2 * leaf + leaf_class] = False
            mask[self._action_index_eos] = False
            return mask

        if stage == Stage.LEAF:
            # A leaf was picked: next comes the feature.
            valid_indices = range(
                self._action_index_pick_feature, self._action_index_pick_threshold
            )
        elif stage == Stage.FEATURE:
            # A feature was picked: next comes the threshold.
            valid_indices = range(
                self._action_index_pick_threshold, self._action_index_pick_operator
            )
        elif stage == Stage.THRESHOLD:
            # A threshold was picked: next comes the operator, restricted to the
            # actions that refer to the active node.
            active_node = self.find_active(state)
            valid_indices = [
                idx
                for idx in range(
                    self._action_index_pick_operator, self._action_index_eos
                )
                if self.action_space[idx][1] == active_node
            ]
        else:
            raise ValueError(f"Unrecognized stage {stage}.")

        for idx in valid_indices:
            mask[idx] = False
        return mask



[docs]
    def get_mask_invalid_actions_backward_continuous(
        self,
        state: Optional[torch.Tensor] = None,
        done: Optional[bool] = None,
        parents_a: Optional[List] = None,
    ) -> List:
        """
        Returns the backward mask of the parent class (the "discrete part"),
        padded with one True per entry of the continuous part of the policy output
        so that the dimensionality of the mask matches.
        """
        discrete_mask = super().get_mask_invalid_actions_backward(
            state, done, parents_a
        )
        continuous_padding = [True] * self._len_continuous_policy_output
        return discrete_mask + continuous_padding



[docs]
    def get_mask_invalid_actions_backward(
        self,
        state: Optional[torch.Tensor] = None,
        done: Optional[bool] = None,
        parents_a: Optional[List] = None,
    ) -> List:
        """
        Returns the mask of invalid backward actions: the continuous variant if
        the environment is continuous, the one of the parent class otherwise.
        """
        if not self.continuous:
            return super().get_mask_invalid_actions_backward(
                state=state, done=done, parents_a=parents_a
            )
        return self.get_mask_invalid_actions_backward_continuous(
            state=state, done=done, parents_a=parents_a
        )



[docs]
    def get_parents(
        self,
        state: Optional[torch.Tensor] = None,
        done: Optional[bool] = None,
        action: Optional[Tuple] = None,
    ) -> Tuple[List, List]:
        """
        Determines the parents of a state and the actions that lead from each of
        them to the state.

        Args
        ----
        state : Tensor
            State whose parents are requested; resolved through self._get_state.

        done : bool
            Whether the trajectory is done; resolved through self._get_done. If
            done, the only parent is the state itself, via the EOS action.

        action : tuple
            Not read by this method: the name is only rebound locally in the
            branch that handles the "complete" stage.

        Returns
        -------
        parents : list
            List of parent states.

        actions : list
            List of actions, one per parent, that lead from the parent to state.

        Raises
        ------
        ValueError if the stage of the state is not recognized.
        """
        state = self._get_state(state)
        done = self._get_done(done)

        if done:
            return [state], [self.eos]

        leaves = Tree._find_leaves(state)
        stage = self._get_stage(state)
        parents = []
        actions = []

        if stage == Stage.COMPLETE:
            # In the "complete" stage (in which there are no ongoing micro steps),
            # to find parents we first look for the nodes for which both children
            # are leaves, and then undo the last "pick operator" micro step.
            # In other words, reverse self._pick_operator, self._split_leaf and
            # self._insert_classifier (for both children).
            leaves = set(leaves)
            triplets = []
            for k in leaves:
                # A leaf with odd index whose successor index is also a leaf:
                # the pair (k, k + 1) are the two children of the same node.
                if k % 2 == 1 and k + 1 in leaves:
                    triplets.append((Tree._get_parent(k), k, k + 1))
            for k_parent, k_left, k_right in triplets:
                parent = state.clone()
                # Integer indexing yields views: writing into attributes_* below
                # modifies the cloned parent state.
                attributes_parent = parent[k_parent]
                attributes_left = parent[k_left]
                attributes_right = parent[k_right]

                # Set action operator as class of left child.
                action = (
                    ActionType.PICK_OPERATOR,
                    k_parent,
                    int(attributes_left[Attribute.CLASS].item()),
                )

                # Revert stage (to "threshold": we skip "operator" because from it,
                # finalizing splitting should be automatically executed).
                # NOTE(review): the views taken above are written to after this
                # call, which presumably relies on _set_stage returning a tensor
                # that shares storage with its input - confirm.
                parent = self._set_stage(Stage.THRESHOLD, parent)

                # Reset children attributes.
                attributes_left[:] = torch.nan
                attributes_right[:] = torch.nan

                # Revert parent attributes to the previous state.
                attributes_parent[Attribute.CLASS] = -1
                attributes_parent[Attribute.ACTIVE] = Status.ACTIVE

                parents.append(parent)
                actions.append(action)
        else:
            # A macro step is in progress: the single parent (or the two parents,
            # in the "leaf" stage) is obtained by undoing the last micro step on
            # the active node.
            k = Tree.find_active(state)

            if stage == Stage.LEAF:
                # Reverse self._pick_leaf.
                # The class the leaf had before being picked is not stored in the
                # state, hence the candidates are derived from the sibling.
                if k == 0:
                    outputs = [self.default_class]
                else:
                    attributes_sibling = state[Tree._get_sibling(k)]
                    if attributes_sibling[Attribute.TYPE] == NodeType.CLASSIFIER:
                        # Sibling is a leaf: the picked leaf had the other class.
                        outputs = [0 if attributes_sibling[Attribute.CLASS] == 1 else 1]
                    else:
                        # Sibling is not a leaf: both classes are possible.
                        outputs = [0, 1]

                for output in outputs:
                    parent = state.clone()
                    attributes = parent[k]

                    parent = self._set_stage(Stage.COMPLETE, parent)
                    attributes[Attribute.TYPE] = NodeType.CLASSIFIER
                    attributes[Attribute.FEATURE] = -1
                    attributes[Attribute.THRESHOLD] = -1
                    attributes[Attribute.CLASS] = output
                    attributes[Attribute.ACTIVE] = Status.INACTIVE

                    parents.append(parent)
                    actions.append((ActionType.PICK_LEAF, k, output))
            elif stage == Stage.FEATURE:
                # Reverse self._pick_feature.
                parent = state.clone()
                attributes = parent[k]

                parent = self._set_stage(Stage.LEAF, parent)
                attributes[Attribute.FEATURE] = -1

                parents.append(parent)
                # The feature of the action is read from state (not from parent,
                # where it has just been reset).
                actions.append(
                    (ActionType.PICK_FEATURE, -1, state[k][Attribute.FEATURE].item())
                )
            elif stage == Stage.THRESHOLD:
                # Reverse self._pick_threshold.
                parent = state.clone()
                attributes = parent[k]

                parent = self._set_stage(Stage.FEATURE, parent)
                attributes[Attribute.THRESHOLD] = -1

                parents.append(parent)
                if self.continuous:
                    # Continuous thresholds are represented by a generic action
                    # with -1 in place of the value.
                    actions.append((ActionType.PICK_THRESHOLD, -1, -1))
                else:
                    # Index in self.thresholds of the threshold stored in the
                    # state; .item() requires exactly one match.
                    threshold_idx = np.where(
                        np.isclose(
                            self.thresholds, state[k][Attribute.THRESHOLD].item()
                        )
                    )[0].item()
                    actions.append((ActionType.PICK_THRESHOLD, -1, threshold_idx))
            else:
                raise ValueError(f"Unrecognized stage {stage}.")

        return parents, actions


    @staticmethod

[docs]
    def action2representative_continuous(action: Tuple) -> Tuple:
        """
        Maps an action onto its representative in the action space: the value of
        a PICK_THRESHOLD action is replaced by -1 so that the action can be
        contrasted with the action space and masks. Any other action is returned
        unchanged.
        """
        if action[0] != ActionType.PICK_THRESHOLD:
            return action
        return (ActionType.PICK_THRESHOLD, -1, -1)



[docs]
    def action2representative(self, action: Tuple) -> Tuple:
        """
        Returns the representative of an action: the continuous variant if the
        environment is continuous, the one of the parent class otherwise.
        """
        if not self.continuous:
            return super().action2representative(action=action)
        return self.action2representative_continuous(action=action)


    def _get_max_trajectory_length(self) -> int:
        """
        Returns the maximum trajectory length of the environment, including the
        EOS action: Attribute.N steps per node, plus one step for EOS.
        """
        steps_without_eos = Attribute.N * self.n_nodes
        return steps_without_eos + 1

    @staticmethod
    def _get_graph(
        state: torch.Tensor,
        bidirectional: bool,
        *,
        graph: Optional[nx.DiGraph] = None,
        k: int = 0,
    ) -> nx.DiGraph:
        """
        Recursively converts the subtree rooted at node k of a state into a
        networkx directed graph.

        Each node is added with its attribute vector (x) and its index (k). Edges
        go from parent to child and, if bidirectional is True, also from child to
        parent. A child is only visited if none of its attributes is NaN.
        """
        graph = nx.DiGraph() if graph is None else graph

        node_attributes = state[k]
        graph.add_node(k, x=node_attributes, k=k)

        # Leaves have no children to visit.
        if node_attributes[Attribute.TYPE] == NodeType.CLASSIFIER:
            return graph

        # Left subtree first, then right subtree.
        for get_child in (Tree._get_left_child, Tree._get_right_child):
            k_child = get_child(k)
            if torch.isnan(state[k_child]).any():
                continue
            Tree._get_graph(state, bidirectional, graph=graph, k=k_child)
            graph.add_edge(k, k_child)
            if bidirectional:
                graph.add_edge(k_child, k)

        return graph


[docs]
    def get_pyg_input_dim(self) -> int:
        """
        Returns the number of columns of the node feature matrix of the PyG graph
        built from the current state.
        """
        graph = Tree.state2pyg(self.state, self.n_features)
        return graph.x.shape[1]


    @staticmethod

[docs]
    def state2pyg(
        state: torch.Tensor,
        n_features: int,
        one_hot: bool = True,
        add_self_loop: bool = False,
    ) -> pyg.data.Data:
        """
        Convert given state into a PyG graph.

        Nodes of the graph are the nodes of the state whose type is not NaN (the
        last row of the state is ignored), re-indexed consecutively. The original
        node indices are stored in the attribute k of the returned graph.

        Args
        ----
        state : Tensor
            State to convert.

        n_features : int
            Number of features of the data set, used for the one-hot encoding of
            the feature attribute.

        one_hot : bool
            If True, the node features are [type, threshold, active] followed by
            the one-hot encodings of the feature (n_features + 1 entries) and of
            the class (3 entries). Both attributes are shifted by one so that the
            value -1 is encoded by the first entry. If False, the raw attributes
            are used as node features.

        add_self_loop : bool
            If True, an edge from every node to itself is added.

        Returns
        -------
        PyG graph with one edge attribute row per edge: [1, 0] for parent-to-child
        edges, [0, 1] for child-to-parent edges and [0, 0] for self loops.
        """
        k = torch.nonzero(~state[:-1, Attribute.TYPE].isnan()).squeeze(-1)
        x = state[k].clone().detach()
        if one_hot:
            x = torch.cat(
                [
                    x[:, [Attribute.TYPE, Attribute.THRESHOLD, Attribute.ACTIVE]],
                    F.one_hot((x[:, Attribute.FEATURE] + 1).long(), n_features + 1),
                    F.one_hot((x[:, Attribute.CLASS] + 1).long(), 3),
                ],
                dim=1,
            )

        k_array = k.detach().cpu().numpy()
        # Maps the index of a node in the state to its index in the graph.
        k_mapping = {value: index for index, value in enumerate(k_array)}
        edges = []
        edge_attrs = []
        for k_i in k_array:
            if add_self_loop:
                edges.append([k_mapping[k_i], k_mapping[k_i]])
                # Every edge needs an attribute row, otherwise edge_attr and
                # edge_index get out of sync. A self loop is neither a
                # parent-to-child nor a child-to-parent edge.
                edge_attrs.append([0.0, 0.0])
            if k_i > 0:
                k_parent = (k_i - 1) // 2
                if k_parent in k_mapping:
                    edges.append([k_mapping[k_parent], k_mapping[k_i]])
                    edge_attrs.append([1.0, 0.0])
                    edges.append([k_mapping[k_i], k_mapping[k_parent]])
                    edge_attrs.append([0.0, 1.0])
        if len(edges) == 0:
            edge_index = torch.empty((2, 0)).long()
            edge_attr = torch.empty((0, 2)).float()
        else:
            edge_index = torch.tensor(edges, dtype=torch.long).T
            edge_attr = torch.tensor(edge_attrs, dtype=torch.float)

        return pyg.data.Data(x=x, edge_index=edge_index, edge_attr=edge_attr, k=k)


    def _state2pyg(self) -> pyg.data.Data:
        """
        Builds the PyG graph of the current state (self.state), using the number
        of features of the environment (self.n_features).
        """
        graph = Tree.state2pyg(self.state, self.n_features)
        return graph

    @staticmethod
    def _load_dataset(data_path):
        """
        Loads a data set from a CSV file (*.csv) or a pickled dictionary (*.pkl).

        CSV files: if the name of the last column is not "split" (case
        insensitive), the last column is the target, all other columns are
        features and no test data is returned. Otherwise, the last column must
        contain exactly the values "train" and "test", the second to last column
        is the target and the rows are divided accordingly.

        Pickle files: a dictionary with keys "X_train" and "y_train" and,
        optionally, "X_test" and "y_test".

        Returns the tuple (X_train, y_train, X_test, y_test), where the test
        entries are None if not available.

        Raises ValueError if the file extension is not supported or the split
        column contains unexpected values.
        """
        data_path = Path(data_path)
        extension = data_path.suffix

        if extension == ".pkl":
            # NOTE: unpickling can execute arbitrary code. Only load files from
            # trusted sources.
            with open(data_path, "rb") as f:
                dct = pickle.load(f)
            return dct["X_train"], dct["y_train"], dct.get("X_test"), dct.get("y_test")

        if extension != ".csv":
            raise ValueError(
                "data_path must be a CSV (*.csv) or a pickled dict (*.pkl)."
            )

        df = pd.read_csv(data_path)
        if df.columns[-1].lower() != "split":
            # No split column: everything is training data.
            return df.iloc[:, 0:-1].values, df.iloc[:, -1].values, None, None

        split = df.iloc[:, -1]
        observed = set(split)
        if observed != {"train", "test"}:
            raise ValueError(
                f"Expected df['Split'] to have values in {{'train', 'test'}}, "
                f"received {observed}."
            )
        train_rows = df[split == "train"]
        test_rows = df[split == "test"]
        return (
            train_rows.iloc[:, 0:-2].values,
            train_rows.iloc[:, -2].values,
            test_rows.iloc[:, 0:-2].values,
            test_rows.iloc[:, -2].values,
        )

    @staticmethod

[docs]
    def predict(
        state: torch.Tensor, x: npt.NDArray, *, return_k: bool = False, k: int = 0
    ) -> Union[int, Tuple[int, int]]:
        """
        Predicts the output label of a single observation with feature vector x,
        by descending the tree from node k until a classifier node is reached.

        At every condition node, the left child is taken if the value of the
        feature of the node is smaller than the threshold of the node, and the
        right child otherwise.

        If return_k is True, the index of the node in which the prediction was
        made is returned together with the label.
        """
        node = k
        while True:
            attributes = state[node]

            if attributes[Attribute.TYPE] == NodeType.CLASSIFIER:
                label = attributes[Attribute.CLASS]
                if return_k:
                    return label, node
                return label

            feature_index = attributes[Attribute.FEATURE].long().item()
            if x[feature_index] < attributes[Attribute.THRESHOLD]:
                node = Tree._get_left_child(node)
            else:
                node = Tree._get_right_child(node)


    def _predict(
        self, x: npt.NDArray, *, return_k: bool = False
    ) -> Union[int, Tuple[int, int]]:
        """
        Predicts the output label of a single observation x with the tree of the
        current state (self.state). See Tree.predict.
        """
        prediction = Tree.predict(self.state, x, return_k=return_k)
        return prediction

    @staticmethod

[docs]
    def plot(state, path: Optional[Union[Path, str]] = None) -> None:
        """
        Plot current state of the tree.

        Condition nodes are drawn in white and labelled with their decision rule
        ("x_feature < threshold", with the threshold rounded to 4 decimals); all
        other nodes are drawn in red and labelled with their class output.

        Args
        ----
        state : Tensor
            State of the tree to plot.

        path : Path or str
            If None, the figure is shown. Otherwise, the figure is saved to path
            and closed.
        """
        graph = Tree._get_graph(state, bidirectional=False)

        labels = {}
        node_color = []
        for node in graph:
            x = graph.nodes[node]["x"]
            if x[0] == NodeType.CONDITION:
                feature = int(x[1].item())
                threshold = np.round(x[2].item(), 4)
                # The braces around the feature index are required by mathtext:
                # without them only the first digit of a multi-digit index would
                # be rendered as subscript.
                labels[node] = rf"$x_{{{feature}}}$ < {threshold}"
                node_color.append("white")
            else:
                labels[node] = f"C={int(x[3].item())}"
                node_color.append("red")

        nx.draw(
            graph,
            graphviz_layout(graph, prog="dot"),
            labels=labels,
            node_color=node_color,
            with_labels=True,
            node_size=800,
        )
        if path is None:
            plt.show()
        else:
            plt.savefig(path)
            plt.close()


    @staticmethod
    def _predict_samples(states: torch.Tensor, X: npt.NDArray) -> npt.NDArray:
        """
        Computes the matrix of predictions of every tree on every observation.

        Args
        ----
        states : Tensor
            Collection of sampled states with dimensionality (n_states, state_dim).

        X : NDArray
            Feature matrix with dimensionality (n_observations, n_features).

        Returns
        -------
        Prediction matrix with dimensionality (n_states, n_observations).

        """
        n_states, n_observations = len(states), len(X)
        predictions = np.empty((n_states, n_observations))
        # Each row of the matrix is a view, filled with the predictions of a tree.
        for tree_predictions, tree in zip(predictions, states):
            for column, observation in enumerate(X):
                tree_predictions[column] = Tree.predict(tree, observation)
        return predictions

    @staticmethod
    def _compute_scores(predictions: npt.NDArray, y: npt.NDArray) -> dict:
        """
        Computes accuracy and balanced accuracy metrics for given predictions and ground
        truth labels.

        The metrics are computed in two modes: either as an average of scores calculated
        for individual trees (mean_tree_*), or as a single score calculated on a prediction
        made by the whole ensemble (forest_*), with ensembling done via prediction averaging.

        Args
        ----
        predictions: NDArray
            Prediction matrix with dimensionality (n_states, n_observations).

        y : NDArray
            Target vector with dimensionality (n_observations,).

        Returns
        -------
        Dictionary of (metric_name, score) key-value pairs, with keys
        mean_tree_acc, forest_acc, mean_tree_bac and forest_bac.
        """
        metrics = {"acc": accuracy_score, "bac": balanced_accuracy_score}

        # Prediction of the ensemble: per-observation average of the predictions
        # of the trees, rounded to the nearest label. It does not depend on the
        # metric, so it is computed once.
        forest_prediction = predictions.mean(axis=0).round()

        scores = {}
        for metric_name, metric_function in metrics.items():
            scores[f"mean_tree_{metric_name}"] = np.mean(
                [metric_function(y, y_pred) for y_pred in predictions]
            )
            scores[f"forest_{metric_name}"] = metric_function(y, forest_prediction)

        return scores

    @staticmethod
    def _plot_trees(
        states: List[torch.Tensor],
        scores: npt.NDArray,
        iteration: int,
    ):
        """
        Plots decision trees present in the given collection of states and saves
        them as tree_{index}_{score}.png in the folder trees_{iteration} of the
        current working directory.

        The folder is created if needed. An already existing folder (for instance
        from a previous run started in the same directory) is reused instead of
        raising FileExistsError.

        Args
        ----
        states : list of Tensors
            Collection of sampled states to plot.

        scores : NDArray
            Collection of scores computed for the given states, one per state.

        iteration : int
            Current iteration (will be used to name the folder with trees).
        """
        path = Path.cwd() / f"trees_{iteration}"
        path.mkdir(exist_ok=True)

        for i, (state, score) in enumerate(zip(states, scores)):
            Tree.plot(state, path / f"tree_{i}_{score:.4f}.png")


[docs]
    def test(
        self,
        samples: Union[
            TensorType["n_trajectories", "..."], npt.NDArray[np.float32], List
        ],
    ) -> dict:
        """
        Evaluates an ensemble of sampled trees.

        The returned dictionary contains the mean number of nodes of the trees
        and the metrics described in Tree._compute_scores, computed on the
        training data (train_*) and, if available, on the test data (test_*).

        If self.test_args['top_k_trees'] != 0, the trees with the highest training
        accuracy are additionally selected, plotted (see Tree._plot_trees) and
        evaluated separately (train_top_k_* and, with test data, eval_top_k_*).
        The counter self.test_iteration, used to name the folder with the plots,
        is created on first use and incremented after each such call.

        Args
        ----
        samples : Tensor
            Collection of sampled states representing the ensemble.

        Returns
        -------
        Dictionary of (metric_name, score) key-value pairs.
        """
        metrics = {
            "mean_n_nodes": np.mean([Tree.get_n_nodes(tree) for tree in samples])
        }

        # Metrics of the whole ensemble on the training data.
        train_predictions = Tree._predict_samples(samples, self.X_train)
        train_scores = Tree._compute_scores(train_predictions, self.y_train)
        for name, value in train_scores.items():
            metrics[f"train_{name}"] = value

        top_k_indices = None
        if self.test_args["top_k_trees"] != 0:
            if not hasattr(self, "test_iteration"):
                self.test_iteration = 0

            # Rank the trees by training accuracy, best first, and keep the top k.
            accuracies = np.array(
                [
                    accuracy_score(self.y_train, tree_predictions)
                    for tree_predictions in train_predictions
                ]
            )
            ranking = np.argsort(accuracies)[::-1]
            top_k_indices = ranking[: self.test_args["top_k_trees"]]

            # Plot the selected trees.
            selected_trees = [samples[index] for index in top_k_indices]
            Tree._plot_trees(
                selected_trees, accuracies[top_k_indices], self.test_iteration
            )

            # Metrics of the selected trees on the training data.
            selected_scores = Tree._compute_scores(
                train_predictions[top_k_indices], self.y_train
            )
            for name, value in selected_scores.items():
                metrics[f"train_top_k_{name}"] = value

            self.test_iteration += 1

        if self.X_test is None:
            return metrics

        # Metrics of the whole ensemble on the test data.
        test_predictions = Tree._predict_samples(samples, self.X_test)
        test_scores = Tree._compute_scores(test_predictions, self.y_test)
        for name, value in test_scores.items():
            metrics[f"test_{name}"] = value

        if top_k_indices is not None:
            # Metrics of the selected trees on the test data.
            selected_scores = Tree._compute_scores(
                test_predictions[top_k_indices], self.y_test
            )
            for name, value in selected_scores.items():
                metrics[f"eval_top_k_{name}"] = value

        return metrics