autora.theorist.bsr.funcs

`Action`

Bases: int, Enum

Enum class that represents a MCMC step with a certain action

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

class Action(int, Enum):
    """
    Enum class that represents a MCMC step with a certain action
    """

    STAY = 0
    GROW = 1
    PRUNE = 2
    DE_TRANSFORM = 3
    TRANSFORM = 4
    REASSIGN_OP = 5
    REASSIGN_FEAT = 6

    @classmethod
    def rand_action(
        cls, lt_num: int, term_num: int, de_trans_num: int
    ) -> Tuple[int, List[float]]:
        """
        Draw a random action for MCMC algorithm to take a step

        Arguments:
            lt_num: the number of linear (`lt`) nodes in the tree
            term_num: the number of terminal nodes in the tree
            de_trans_num: the number of de-trans qualified nodes in the tree
                          (see `propose` for details)

        Returns:
            action: the MCMC action to perform
            weights: the probabilities for each action
        """
        # from the BSR paper
        weights = []
        weights.append(0.25 * lt_num / (lt_num + 3))  # p_stay
        weights.append((1 - weights[0]) * min(1, 4 / (term_num + 2)) / 3)  # p_grow
        weights.append((1 - weights[0]) / 3 - weights[1])  # p_prune
        weights.append(
            ((1 - weights[0]) * (1 / 3) * de_trans_num / (3 + de_trans_num))
        )  # p_detrans
        weights.append((1 - weights[0]) / 3 - weights[3])  # p_trans
        weights.append((1 - weights[0]) / 6)  # p_reassign_op
        weights.append(1 - sum(weights))  # p_reassign_feat
        assert weights[-1] >= 0

        action = random.choices(range(7), weights=weights, k=1)[0]
        return action, weights

`rand_action(lt_num, term_num, de_trans_num)` `classmethod`

Draw a random action for MCMC algorithm to take a step

Parameters:

Name	Type	Description	Default
`lt_num`	`int`	the number of linear (`lt`) nodes in the tree	required
`term_num`	`int`	the number of terminal nodes in the tree	required
`de_trans_num`	`int`	the number of de-trans qualified nodes in the tree (see `propose` for details)	required

Returns:

Name	Type	Description
`action`	`int`	the MCMC action to perform
`weights`	`List[float]`	the probabilities for each action

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@classmethod
def rand_action(
    cls, lt_num: int, term_num: int, de_trans_num: int
) -> Tuple[int, List[float]]:
    """
    Draw a random action for MCMC algorithm to take a step

    Arguments:
        lt_num: the number of linear (`lt`) nodes in the tree
        term_num: the number of terminal nodes in the tree
        de_trans_num: the number of de-trans qualified nodes in the tree
                      (see `propose` for details)

    Returns:
        action: the MCMC action to perform
        weights: the probabilities for each action
    """
    # from the BSR paper
    weights = []
    weights.append(0.25 * lt_num / (lt_num + 3))  # p_stay
    weights.append((1 - weights[0]) * min(1, 4 / (term_num + 2)) / 3)  # p_grow
    weights.append((1 - weights[0]) / 3 - weights[1])  # p_prune
    weights.append(
        ((1 - weights[0]) * (1 / 3) * de_trans_num / (3 + de_trans_num))
    )  # p_detrans
    weights.append((1 - weights[0]) / 3 - weights[3])  # p_trans
    weights.append((1 - weights[0]) / 6)  # p_reassign_op
    weights.append(1 - sum(weights))  # p_reassign_feat
    assert weights[-1] >= 0

    action = random.choices(range(7), weights=weights, k=1)[0]
    return action, weights

`calc_aux_ll(node, **hyper_params)`

Calculate the likelihood of generating auxiliary parameters

Parameters:

Name	Type	Description	Default
`node`	`Node`	the node from which the auxiliary params are generated	required
`hyper_params`		hyperparameters for generating auxiliary params	`{}`

Returns:

Name	Type	Description
`log_aux`	`float`	log likelihood of auxiliary params
`lt_count`	`int`	number of nodes with `lt` operator in the tree with `node` as its root

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

def calc_aux_ll(node: Node, **hyper_params) -> Tuple[float, int]:
    """
    Calculate the likelihood of generating auxiliary parameters

    Arguments:
        node: the node from which the auxiliary params are generated
        hyper_params: hyperparameters for generating auxiliary params

    Returns:
        log_aux: log likelihood of auxiliary params
        lt_count: number of nodes with `lt` operator in the tree with
            `node` as its root
    """
    sigma_a, sigma_b = hyper_params["sigma_a"], hyper_params["sigma_b"]
    log_aux = np.log(invgamma.pdf(sigma_a, 1)) + np.log(invgamma.pdf(sigma_b, 1))

    all_nodes = get_all_nodes(node)
    lt_count = 0
    for i in range(all_nodes):
        if all_nodes[i].op_name == "ln":
            lt_count += 1
            a, b = all_nodes[i].params["a"], all_nodes[i].params["b"]
            log_aux += np.log(norm.pdf(a, 1, np.sqrt(sigma_a)))
            log_aux += np.log(norm.pdf(b, 0, np.sqrt(sigma_b)))

    return log_aux, lt_count

`calc_tree_ll(node, ops_priors, n_feature=1, **hyper_params)`

Calculate the likelihood-related quantities of the given tree node.

Parameters:

Name	Type	Description	Default
`node`	`Node`	the tree node for which the calculations are done	required
`ops_priors`	`Dict[str, Dict]`	the dictionary that maps operation names to their prior info	required
`n_feature`	`int`	number of features in the input data	`1`
`hyperparams`		hyperparameters for initialization	required

Returns:

Name	Type	Description
`struct_ll`		tree structure-related likelihood
`params_ll`		tree parameters-related likelihood

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def calc_tree_ll(
    node: Node, ops_priors: Dict[str, Dict], n_feature: int = 1, **hyper_params
):
    """
    Calculate the likelihood-related quantities of the given tree `node`.

    Arguments:
        node: the tree node for which the calculations are done
        ops_priors: the dictionary that maps operation names to their prior info
        n_feature: number of features in the input data
        hyperparams: hyperparameters for initialization

    Returns:
        struct_ll: tree structure-related likelihood
        params_ll: tree parameters-related likelihood
    """
    struct_ll = 0  # log likelihood of tree structure S = (T,M)
    params_ll = 0  # log likelihood of linear params
    depth = node.depth
    beta = hyper_params.get("beta", -1)
    sigma_a, sigma_b = hyper_params.get("sigma_a", 1), hyper_params.get("sigma_b", 1)

    # contribution of hyperparameter sigma_theta
    if not depth:  # root node
        struct_ll += np.log(invgamma.pdf(sigma_a, 1))
        struct_ll += np.log(invgamma.pdf(sigma_b, 1))

    # contribution of splitting the node or becoming leaf node
    if node.node_type == NodeType.LEAF:
        # contribution of choosing terminal
        struct_ll += np.log(1 - 1 / np.power((1 + depth), -beta))
        # contribution of feature selection
        struct_ll -= np.log(n_feature)
        return struct_ll, params_ll
    elif node.node_type == NodeType.UNARY:  # unitary operator
        # contribution of child nodes are added since the log likelihood is additive
        # if we assume the parameters are independent.
        left = cast(Node, node.left)
        struct_ll_left, params_ll_left = calc_tree_ll(
            left, ops_priors, n_feature, **hyper_params
        )
        struct_ll += struct_ll_left
        params_ll += params_ll_left
        # contribution of parameters of linear nodes
        # make sure the below parameter ll calculation is extendable
        if node.op_name == "ln":
            params_ll -= np.power((node.params["a"] - 1), 2) / (2 * sigma_a)
            params_ll -= np.power(node.params["b"], 2) / (2 * sigma_b)
            params_ll -= 0.5 * np.log(4 * np.pi**2 * sigma_a * sigma_b)
    else:  # binary operator
        left = cast(Node, node.left)
        right = cast(Node, node.right)
        struct_ll_left, params_ll_left = calc_tree_ll(
            left, ops_priors, n_feature, **hyper_params
        )
        struct_ll_right, params_ll_right = calc_tree_ll(
            right, ops_priors, n_feature, **hyper_params
        )
        struct_ll += struct_ll_left + struct_ll_right
        params_ll += params_ll_left + params_ll_right

    op_weight = ops_priors[node.op_name]["weight"]
    # for unary & binary nodes, additionally consider the contribution of splitting
    if not depth:  # root node
        struct_ll += np.log(op_weight)
    else:
        struct_ll += np.log((1 + depth)) * beta + np.log(op_weight)

    return struct_ll, params_ll

`calc_y_ll(y, outputs, sigma_y)`

Calculate the log likelihood f(y|S,Theta,x) where (S,Theta) is represented by the node prior is y ~ N(output,sigma) and output is the matrix of outputs corresponding to different roots.

Returns:

Name	Type	Description
`log_sum`		the data log likelihood

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

def calc_y_ll(y: np.ndarray, outputs: Union[np.ndarray, pd.DataFrame], sigma_y: float):
    """
    Calculate the log likelihood f(y|S,Theta,x) where (S,Theta) is represented by the
    node prior is y ~ N(output,sigma) and output is the matrix of outputs corresponding to
    different roots.

    Returns:
        log_sum: the data log likelihood
    """
    outputs = copy.deepcopy(outputs)
    scale = np.max(np.abs(outputs))
    outputs = outputs / scale
    epsilon = np.eye(outputs.shape[1]) * 1e-6
    beta = np.linalg.inv(np.matmul(outputs.transpose(), outputs) + epsilon)
    beta = np.matmul(beta, np.matmul(outputs.transpose(), y))
    # perform the linear combination
    output = np.matmul(outputs, beta)
    # calculate the squared error
    error = np.sum(np.square(y - output[:, 0]))

    log_sum = error
    var = 2 * sigma_y * sigma_y
    log_sum = -log_sum / var
    log_sum -= 0.5 * len(y) * np.log(np.pi * var)
    return log_sum

`check_empty(func)`

A decorator that, if applied to func, checks whether an argument in func is an un-initialized node (i.e. node.node_type == NodeType.Empty). If so, an error is raised.

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

def check_empty(func: Callable):
    """
    A decorator that, if applied to `func`, checks whether an argument in `func` is an
    un-initialized node (i.e. node.node_type == NodeType.Empty). If so, an error is raised.
    """

    @wraps(func)
    def func_wrapper(*args, **kwargs):
        for arg in args:
            if isinstance(arg, Node):
                if arg.node_type == NodeType.EMPTY:
                    raise TypeError(
                        "uninitialized node found in {}".format(func.__name__)
                    )
                break
        return func(*args, **kwargs)

    return func_wrapper

`de_transform(node)`

ACTION 4: De-transform deletes the current node and replaces it with children according to the following rule: if the node is unary, simply replace with its child; if node is binary and root, choose any children that's not leaf; if node is binary and not root, pick any children.

Parameters:

Name	Type	Description	Default
`node`	`Node`	the tree node that gets de-transformed	required

Returns:

Type	Description
`Node`	first node is the replaced node when `node` has been de-transformed
`Optional[Node]`	second node is the discarded node

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def de_transform(node: Node) -> Tuple[Node, Optional[Node]]:
    """
    ACTION 4: De-transform deletes the current `node` and replaces it with children
    according to the following rule: if the `node` is unary, simply replace with its
    child; if `node` is binary and root, choose any children that's not leaf; if `node`
    is binary and not root, pick any children.

    Arguments:
        node: the tree node that gets de-transformed

    Returns:
        first node is the replaced node when `node` has been de-transformed
        second node is the discarded node
    """
    left = cast(Node, node.left)
    if node.node_type == NodeType.UNARY:
        return left, None

    r = random.random()
    right = cast(Node, node.right)
    # picked node is root
    if not node.depth:
        if left.node_type == NodeType.LEAF:
            return right, left
        elif right.node_type == NodeType.LEAF:
            return left, right
        else:
            return (left, right) if r < 0.5 else (right, left)
    elif r < 0.5:
        return left, right
    else:
        return right, left

`get_all_nodes(node)`

Get all the nodes below (and including) the given node via pre-order traversal

Return

a list with all the nodes below (and including) the given node

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def get_all_nodes(node: Node) -> List[Node]:
    """
    Get all the nodes below (and including) the given `node` via pre-order traversal

    Return:
        a list with all the nodes below (and including) the given `node`
    """
    nodes = [node]
    if node.node_type == NodeType.UNARY:
        nodes.extend(get_all_nodes(node.left))
    elif node.node_type == NodeType.BINARY:
        nodes.extend(get_all_nodes(node.left))
        nodes.extend(get_all_nodes(node.right))
    return nodes

`get_height(node)`

Get the height of a tree starting from node as root. The height of a leaf is defined as 0.

Parameters:

Name	Type	Description	Default
`node`	`Node`	the Node that we hope to calculate `height` for	required

Returns: height: the height of node

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def get_height(node: Node) -> int:
    """
    Get the height of a tree starting from `node` as root. The height of a leaf is defined as 0.

    Arguments:
        node: the Node that we hope to calculate `height` for
    Returns:
        height: the height of `node`
    """
    if node.node_type == NodeType.LEAF:
        return 0
    elif node.node_type == NodeType.UNARY:
        return 1 + get_height(node.left)
    else:  # binary node
        return 1 + max(get_height(node.left), get_height(node.right))

`get_num_lt_nodes(node)`

Get the number of nodes with lt operation in a tree starting from node

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def get_num_lt_nodes(node: Node) -> int:
    """
    Get the number of nodes with `lt` operation in a tree starting from `node`
    """
    if node.node_type == NodeType.LEAF:
        return 0
    else:
        base = 1 if node.op_name == "ln" else 0
        if node.node_type == NodeType.UNARY:
            return base + get_num_lt_nodes(node.left)
        else:
            return base + get_num_lt_nodes(node.left) + get_num_lt_nodes(node.right)

`grow(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

ACTION 2: Grow represents the action of growing a subtree from a given node

Parameters:

Name	Type	Description	Default
`node`	`Node`	the tree node from where the subtree starts to grow	required
`ops_name_lst`	`List[str]`	list of operation names	required
`ops_weight_lst`	`List[float]`	list of operation prior weights	required
`ops_priors`	`Dict[str, Dict]`	the dictionary of operation prior properties	required
`n_feature`	`int`	the number of features in input data	`1`
`hyper_params`		hyperparameters for re-initialization	`{}`

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

def grow(
    node: Node,
    ops_name_lst: List[str],
    ops_weight_lst: List[float],
    ops_priors: Dict[str, Dict],
    n_feature: int = 1,
    **hyper_params,
):
    """
    ACTION 2: Grow represents the action of growing a subtree from a given `node`

    Arguments:
        node: the tree node from where the subtree starts to grow
        ops_name_lst: list of operation names
        ops_weight_lst: list of operation prior weights
        ops_priors: the dictionary of operation prior properties
        n_feature: the number of features in input data
        hyper_params: hyperparameters for re-initialization
    """
    depth = node.depth
    p = 1 / np.power((1 + depth), -hyper_params.get("beta", -1))

    if depth > 0 and p < random.random():  # create leaf node
        node.setup(feature=random.randint(0, n_feature - 1))
    else:
        ops_name = random.choices(ops_name_lst, ops_weight_lst, k=1)[0]
        ops_prior = ops_priors[ops_name]
        node.setup(ops_name, ops_prior, hyper_params=hyper_params)

        # recursively set up downstream nodes
        grow(
            cast(Node, node.left),
            ops_name_lst,
            ops_weight_lst,
            ops_priors,
            n_feature,
            **hyper_params,
        )
        if node.node_type == NodeType.BINARY:
            grow(
                cast(Node, node.right),
                ops_name_lst,
                ops_weight_lst,
                ops_priors,
                n_feature,
                **hyper_params,
            )

`prop(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

Propose a new tree from an existing tree with root node.

Parameters:

Name	Type	Description	Default
`node`	`Node`	the existing tree node	required
`ops_name_lst`	`List[str]`	the list of operator names	required
`ops_weight_lst`	`List[float]`	the list of operator weights	required
`ops_priors`	`Dict[str, Dict]`	the dictionary of operator prior information	required
`n_feature`	`int`	the number of features in input data	`1`
`hyper_params`		hyperparameters for initialization	`{}`

Return

new_node: the new node after some action is applied expand_node: whether the node has been expanded shrink_node: whether the node has been shrunk q: quantities for calculating acceptance prob q_inv: quantities for calculating acceptance prob

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def prop(
    node: Node,
    ops_name_lst: List[str],
    ops_weight_lst: List[float],
    ops_priors: Dict[str, Dict],
    n_feature: int = 1,
    **hyper_params,
):
    """
    Propose a new tree from an existing tree with root `node`.

    Arguments:
        node: the existing tree node
        ops_name_lst: the list of operator names
        ops_weight_lst: the list of operator weights
        ops_priors: the dictionary of operator prior information
        n_feature: the number of features in input data
        hyper_params: hyperparameters for initialization

    Return:
        new_node: the new node after some action is applied
        expand_node: whether the node has been expanded
        shrink_node: whether the node has been shrunk
        q: quantities for calculating acceptance prob
        q_inv: quantities for calculating acceptance prob
    """
    # PART 1: collect necessary information
    new_node = copy.deepcopy(node)
    term_nodes, nterm_nodes, lt_nodes, de_trans_nodes = _get_tree_classified_nodes(
        new_node
    )

    # PART 2: sample random action and perform the action
    # this step also calculates q and q_inv, quantities necessary for calculating
    # the acceptance probability in MCMC algorithm
    action, probs = Action.rand_action(
        len(lt_nodes), len(term_nodes), len(de_trans_nodes)
    )
    # flags indicating potential dimensionality change (expand or shrink) in node
    expand_node, shrink_node = False, False

    # ACTION 1: STAY
    # q and q_inv simply equal the probability of choosing this action
    if action == Action.STAY:
        q = probs[Action.STAY]
        q_inv = probs[Action.STAY]
        stay(lt_nodes, **hyper_params)
    # ACTION 2: GROW
    # q and q_inv simply equal the probability if the grown node is a leaf node
    # otherwise, we calculate new information of the `new_node` after the action is applied
    elif action == Action.GROW:
        i = random.randint(0, len(term_nodes) - 1)
        grown_node: Node = term_nodes[i]
        grow(
            grown_node,
            ops_name_lst,
            ops_weight_lst,
            ops_priors,
            n_feature,
            **hyper_params,
        )
        if grown_node.node_type == NodeType.LEAF:
            q = q_inv = 1
        else:
            tree_ll, param_ll = calc_tree_ll(
                grown_node, ops_priors, n_feature, **hyper_params
            )
            # calculate q
            q = probs[Action.GROW] * np.exp(tree_ll) / len(term_nodes)
            # calculate q_inv by using updated information of `new_node`
            (
                new_term_count,
                new_nterm_count,
                new_lt_count,
                _,
            ) = _get_tree_classified_counts(new_node)
            new_prob = (
                (1 - 0.25 * new_lt_count / (new_lt_count + 3))
                * (1 - min(1, 4 / (new_nterm_count + 2)))
                / 3
            )
            q_inv = new_prob / max(1, new_nterm_count - 1)  # except the root
            if new_lt_count > len(lt_nodes):
                expand_node = True
    # ACTION 3: PRUNE
    elif action == Action.PRUNE:
        i = random.randint(0, len(nterm_nodes) - 1)
        pruned_node: Node = nterm_nodes[i]
        prune(pruned_node, n_feature)
        tree_ll, param_ll = calc_tree_ll(
            pruned_node, ops_priors, n_feature, **hyper_params
        )

        new_term_count, new_nterm_count, new_lt_count, _ = _get_tree_classified_counts(
            new_node
        )
        # pruning any tree with `ln` operator will result in shrinkage
        if new_lt_count < len(lt_nodes):
            shrink_node = True

        # calculate q
        q = probs[Action.PRUNE] / ((len(nterm_nodes) - 1) * n_feature)
        pg = 1 - 0.25 * new_lt_count / (new_lt_count + 3) * 0.75 * min(
            1, 4 / (new_nterm_count + 2)
        )
        # calculate q_inv
        q_inv = pg * np.exp(tree_ll) / new_term_count
    # ACTION 4: DE_TRANSFORM
    elif action == Action.DE_TRANSFORM:
        num_de_trans = len(de_trans_nodes)
        i = random.randint(0, num_de_trans - 1)
        de_trans_node: Node = de_trans_nodes[i]
        replaced_node, discarded_node = de_transform(de_trans_node)
        par_node = de_trans_node.parent

        q = probs[Action.DE_TRANSFORM] / num_de_trans
        if (
            not par_node
            and de_trans_node.left
            and de_trans_node.right
            and de_trans_node.left.node_type != NodeType.LEAF
            and de_trans_node.right.node_type != NodeType.LEAF
        ):
            q = q / 2
        elif de_trans_node.node_type == NodeType.BINARY:
            q = q / 2

        if not par_node:  # de-transformed the root
            new_node = replaced_node
            new_node.parent = None
            update_depth(new_node, 0)
        elif par_node.left is de_trans_node:
            par_node.left = replaced_node
            replaced_node.parent = par_node
            update_depth(replaced_node, par_node.depth + 1)
        else:
            par_node.right = replaced_node
            replaced_node.parent = par_node
            update_depth(replaced_node, par_node.depth + 1)

        (
            new_term_count,
            new_nterm_count,
            new_lt_count,
            new_det_count,
        ) = _get_tree_classified_counts(new_node)

        if new_lt_count < len(lt_nodes):
            shrink_node = True

        new_prob = 0.25 * new_lt_count / (new_lt_count + 3)
        # calculate q_inv
        new_pdetr = (1 - new_prob) * (1 / 3) * new_det_count / (new_det_count + 3)
        new_ptr = (1 - new_prob) / 3 - new_pdetr
        q_inv = (
            new_ptr
            * ops_priors[de_trans_node.op_name]["weight"]
            / (new_term_count + new_nterm_count)
        )
        if discarded_node:
            tree_ll, _ = calc_tree_ll(
                discarded_node, ops_priors, n_feature, **hyper_params
            )
            q_inv = q_inv * np.exp(tree_ll)
    # ACTION 5: TRANSFORM
    elif action == Action.TRANSFORM:
        all_nodes = get_all_nodes(new_node)
        i = random.randint(0, len(all_nodes) - 1)
        trans_node: Node = all_nodes[i]
        inserted_node: Node = transform(
            trans_node,
            ops_name_lst,
            ops_weight_lst,
            ops_priors,
            n_feature,
            **hyper_params,
        )

        if inserted_node.right:
            ll_right, _ = calc_tree_ll(
                inserted_node.right, ops_priors, n_feature, **hyper_params
            )
        else:
            ll_right = 0
        # calculate q
        q = (
            probs[Action.TRANSFORM]
            * ops_priors[inserted_node.op_name]["weight"]
            * np.exp(ll_right)
            / len(all_nodes)
        )

        (
            new_term_count,
            new_nterm_count,
            new_lt_count,
            new_det_count,
        ) = _get_tree_classified_counts(new_node)
        if new_lt_count > len(lt_nodes):
            expand_node = True

        new_prob = 0.25 * new_lt_count / (new_lt_count + 3)
        # calculate q_inv
        new_pdetr = (1 - new_prob) * (1 / 3) * new_det_count / (new_det_count + 3)
        q_inv = new_pdetr / new_det_count
        if (
            inserted_node.left
            and inserted_node.right
            and inserted_node.left.node_type != NodeType.LEAF
            and inserted_node.right.node_type != NodeType.LEAF
        ):
            q_inv = q_inv / 2
    # ACTION 6: REASSIGN OPERATION
    elif action == Action.REASSIGN_OP:
        i = random.randint(0, len(nterm_nodes) - 1)
        reassign_node: Node = nterm_nodes[i]
        old_right = reassign_node.right
        old_op_name, old_type = reassign_node.op_name, reassign_node.node_type
        reassign_op(
            reassign_node,
            ops_name_lst,
            ops_weight_lst,
            ops_priors,
            n_feature,
            **hyper_params,
        )
        new_type = reassign_node.node_type
        _, new_nterm_count, new_lt_count, _ = _get_tree_classified_counts(new_node)

        if old_type == new_type:  # binary -> binary & unary -> unary
            q = ops_priors[reassign_node.op_name]["weight"]
            q_inv = ops_priors[old_op_name]["weight"]
        else:
            op_weight = ops_priors[reassign_node.op_name]["weight"]
            if old_type == NodeType.UNARY:  # unary -> binary
                tree_ll, _ = calc_tree_ll(
                    reassign_node.right, ops_priors, n_feature, **hyper_params
                )
                q = (
                    probs[Action.REASSIGN_OP]
                    * np.exp(tree_ll)
                    * op_weight
                    / len(nterm_nodes)
                )
                ll_factor = 1
            else:  # binary -> unary
                tree_ll, _ = calc_tree_ll(
                    old_right, ops_priors, n_feature, **hyper_params
                )
                q = probs[Action.REASSIGN_OP] * op_weight / len(nterm_nodes)
                ll_factor = tree_ll
            # calculate q_inv
            new_prob = new_lt_count / (4 * (new_lt_count + 3))
            q_inv = (
                0.125
                * (1 - new_prob)
                * ll_factor
                * ops_priors[old_op_name]["weight"]
                / new_nterm_count
            )
        if new_lt_count > len(lt_nodes):
            expand_node = True
        elif new_lt_count < len(lt_nodes):
            shrink_node = True
    # ACTION 7: REASSIGN FEATURE
    else:
        i = random.randint(0, len(term_nodes) - 1)
        reassign_node = term_nodes[i]
        reassign_feat(reassign_node, n_feature)
        q = q_inv = 1

    return new_node, expand_node, shrink_node, q, q_inv

`prop_new(roots, index, sigma_y, beta, sigma_a, sigma_b, X, y, ops_name_lst, ops_weight_lst, ops_priors)`

Propose new structure, sample new parameters and decide whether to accept the new tree.

Parameters:

Name	Type	Description	Default
`roots`	`List[Node]`	the list of root nodes	required
`index`	`int`	the index of the root node to update	required
`sigma_y`	`float`	scale hyperparameter for linear mixture of expression trees	required
`beta`	`float`	hyperparameter for growing an uninitialized expression tree	required
`sigma_a`	`float`	hyperparameters for `lt` operator initialization	required
`sigma_b`	`float`	hyperparameters for `lt` operator initialization	required
`X`	`Union[ndarray, DataFrame]`	input data (independent variable) matrix	required
`y`	`Union[ndarray, DataFrame]`	dependent variable vector	required
`ops_name_lst`	`List[str]`	the list of operator names	required
`ops_weight_lst`	`List[float]`	the list of operator weights	required
`ops_priors`	`Dict[str, Dict]`	the dictionary of operator prior information	required

Returns:

Name	Type	Description
`accept`	`bool`	whether to accept or reject the new expression tree
`root`	`Node`	the old or new expression tree, determined by whether to accept the new tree
`sigma_y`	`float`	the old or new sigma_y
`sigma_a`	`float`	the old or new sigma_a
`sigma_b`	`float`	the old or new sigma_b

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

def prop_new(
    roots: List[Node],
    index: int,
    sigma_y: float,
    beta: float,
    sigma_a: float,
    sigma_b: float,
    X: Union[np.ndarray, pd.DataFrame],
    y: Union[np.ndarray, pd.DataFrame],
    ops_name_lst: List[str],
    ops_weight_lst: List[float],
    ops_priors: Dict[str, Dict],
) -> Tuple[bool, Node, float, float, float]:
    """
    Propose new structure, sample new parameters and decide whether to accept the new tree.

    Arguments:
        roots: the list of root nodes
        index: the index of the root node to update
        sigma_y: scale hyperparameter for linear mixture of expression trees
        beta: hyperparameter for growing an uninitialized expression tree
        sigma_a: hyperparameters for `lt` operator initialization
        sigma_b: hyperparameters for `lt` operator initialization
        X: input data (independent variable) matrix
        y: dependent variable vector
        ops_name_lst: the list of operator names
        ops_weight_lst: the list of operator weights
        ops_priors: the dictionary of operator prior information

    Returns:
        accept: whether to accept or reject the new expression tree
        root: the old or new expression tree, determined by whether to accept the new tree
        sigma_y: the old or new sigma_y
        sigma_a: the old or new sigma_a
        sigma_b: the old or new sigma_b
    """
    # the hyper-param for linear combination, i.e. for `sigma_y`
    sig = 4
    K = len(roots)
    root = roots[index]
    use_aux_ll = True

    # sample new sigma_a and sigma_b
    new_sigma_a = invgamma.rvs(1)
    new_sigma_b = invgamma.rvs(1)

    hyper_params = {"sigma_a": sigma_a, "sigma_b": sigma_b, "beta": beta}
    new_hyper_params = {"sigma_a": new_sigma_a, "sigma_b": new_sigma_b, "beta": beta}
    # propose a new tree `node`
    new_root, expand_node, shrink_node, q, q_inv = prop(
        root, ops_name_lst, ops_weight_lst, ops_priors, X.shape[1], **new_hyper_params
    )

    n_feature = X.shape[0]
    new_outputs = np.zeros((len(y), K))
    old_outputs = np.zeros((len(y), K))

    for i in np.arange(K):
        tmp_old = root.evaluate(X)
        old_outputs[:, i] = tmp_old
        if i == index:
            new_outputs[:, i] = new_root.evaluate(X)
        else:
            new_outputs[:, i] = tmp_old

    if np.linalg.matrix_rank(new_outputs) < K:  # rejection due to insufficient rank
        return False, root, sigma_y, sigma_a, sigma_b

    y_ll_old = calc_y_ll(y, old_outputs, sigma_y)
    # a magic number here as the parameter for generating new sigma_y
    new_sigma_y = invgamma.rvs(sig)
    y_ll_new = calc_y_ll(y, new_outputs, new_sigma_y)

    log_y_ratio = y_ll_new - y_ll_old
    # contribution of f(Theta, S)
    if shrink_node or expand_node:
        struct_ll_old = sum(calc_tree_ll(root, ops_priors, n_feature, **hyper_params))
        struct_ll_new = sum(
            calc_tree_ll(new_root, ops_priors, n_feature, **hyper_params)
        )
        log_struct_ratio = struct_ll_new - struct_ll_old
    else:
        log_struct_ratio = calc_tree_ll(
            new_root, ops_priors, n_feature, **hyper_params
        )[0] - calc_tree_ll(root, ops_priors, n_feature, **hyper_params)

    # contribution of proposal Q and Qinv
    log_q_ratio = np.log(max(1e-5, q_inv / q))

    log_r = (
        log_y_ratio
        + log_struct_ratio
        + log_q_ratio
        + np.log(invgamma.pdf(new_sigma_y, sig))
        - np.log(invgamma.pdf(sigma_y, sig))
    )

    if use_aux_ll and (expand_node or shrink_node):
        old_aux_ll, old_lt_count = calc_aux_ll(root, **hyper_params)
        new_aux_ll, _ = calc_aux_ll(new_root, **new_hyper_params)
        log_r += old_aux_ll - new_aux_ll
        # log for the Jacobian matrix
        log_r += np.log(max(1e-5, 1 / np.power(2, 2 * old_lt_count)))

    alpha = min(log_r, 0)
    test = random.random()
    if np.log(test) >= alpha:  # no accept
        return False, root, sigma_y, sigma_a, sigma_b
    else:  # accept
        return True, new_root, new_sigma_y, new_sigma_a, new_sigma_b

`prune(node, n_feature=1)`

ACTION 3: Prune a non-terminal node into a terminal node and assign it a feature

Parameters:

Name	Type	Description	Default
`node`	`Node`	the tree node to be pruned	required
`n_feature`	`int`	the number of features in input data	`1`

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def prune(node: Node, n_feature: int = 1):
    """
    ACTION 3: Prune a non-terminal node into a terminal node and assign it a feature

    Arguments:
        node: the tree node to be pruned
        n_feature: the number of features in input data
    """
    node.setup(feature=random.randint(0, n_feature - 1))

`reassign_feat(node, n_feature=1)`

ACTION 7: Re-assign feature randomly picks a feature and assign it to node.

Parameters:

Name	Type	Description	Default
`node`	`Node`	the tree node that gets re-assigned a feature	required
`n_feature`	`int`	the number of features in input data	`1`

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def reassign_feat(node: Node, n_feature: int = 1):
    """
    ACTION 7: Re-assign feature randomly picks a feature and assign it to `node`.

    Arguments:
        node: the tree node that gets re-assigned a feature
        n_feature: the number of features in input data
    """
    # make sure we have a leaf node
    assert node.node_type == NodeType.LEAF
    node.setup(feature=random.randint(0, n_feature - 1))

`reassign_op(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

ACTION 6: Re-assign action uniformly picks a non-terminal node, and assign a new operator. If the node changes from unary to binary, its original child is taken as the left child, and we grow a new subtree as right child. If the node changes from binary to unary, we preserve the left subtree (this is to make the transition reversible).

Parameters:

Name	Type	Description	Default
`node`	`Node`	the tree node that gets re-assigned an operator	required
`ops_name_lst`	`List[str]`	list of operation names	required
`ops_weight_lst`	`List[float]`	list of operation prior weights	required
`ops_priors`	`Dict[str, Dict]`	the dictionary of operation prior properties	required
`n_feature`	`int`	the number of features in input data	`1`
`hyper_params`	`Dict`	hyperparameters for re-initialization	`{}`

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def reassign_op(
    node: Node,
    ops_name_lst: List[str],
    ops_weight_lst: List[float],
    ops_priors: Dict[str, Dict],
    n_feature: int = 1,
    **hyper_params: Dict,
):
    """
    ACTION 6: Re-assign action uniformly picks a non-terminal node, and assign a new operator.
    If the node changes from unary to binary, its original child is taken as the left child,
    and we grow a new subtree as right child. If the node changes from binary to unary, we
    preserve the left subtree (this is to make the transition reversible).

    Arguments:
        node: the tree node that gets re-assigned an operator
        ops_name_lst: list of operation names
        ops_weight_lst: list of operation prior weights
        ops_priors: the dictionary of operation prior properties
        n_feature: the number of features in input data
        hyper_params: hyperparameters for re-initialization
    """
    # make sure `node` is non-terminal
    old_type = node.node_type
    assert old_type != NodeType.LEAF

    # store the original children and re-setup the `node`
    old_left, old_right = node.left, node.right
    new_op = random.choices(ops_name_lst, ops_weight_lst, k=1)[0]
    node.setup(new_op, ops_priors[new_op], hyper_params=hyper_params)

    new_type = node.node_type

    node.left = old_left
    if old_type == new_type:  # binary -> binary & unary -> unary
        node.right = old_right
    elif new_type == NodeType.BINARY:  # unary -> binary
        grow(
            cast(Node, node.right),
            ops_name_lst,
            ops_weight_lst,
            ops_priors,
            n_feature,
            **hyper_params,
        )
    else:
        node.right = None

`stay(lt_nodes, **hyper_params)`

ACTION 1: Stay represents the action of doing nothing but to update the parameters for ln operators.

Parameters:

Name	Type	Description	Default
`lt_nodes`	`List[Node]`	the list of nodes with `ln` operator	required
`hyper_params`	`Dict`	hyperparameters for re-initialization	`{}`

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

def stay(lt_nodes: List[Node], **hyper_params: Dict):
    """
    ACTION 1: Stay represents the action of doing nothing but to update the parameters for `ln`
    operators.

    Arguments:
        lt_nodes: the list of nodes with `ln` operator
        hyper_params: hyperparameters for re-initialization
    """
    for lt_node in lt_nodes:
        lt_node._init_param(**hyper_params)

`transform(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

ACTION 5: Transform inserts a middle node between the picked node and its parent. Assign an operation to this middle node using the priors. If the middle node is binary, grow its right child. The left child of the middle node is set to node and its parent becomes node.parent.

Parameters:

Name	Type	Description	Default
`node`	`Node`	the tree node that gets transformed	required
`ops_name_lst`	`List[str]`	list of operation names	required
`ops_weight_lst`	`List[float]`	list of operation prior weights	required
`ops_priors`	`Dict[str, Dict]`	the dictionary of operation prior properties	required
`n_feature`	`int`	the number of features in input data	`1`
`hyper_params`	`Dict`	hyperparameters for re-initialization	`{}`

Return

the middle node that gets inserted

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def transform(
    node: Node,
    ops_name_lst: List[str],
    ops_weight_lst: List[float],
    ops_priors: Dict[str, Dict],
    n_feature: int = 1,
    **hyper_params: Dict,
) -> Node:
    """
    ACTION 5: Transform inserts a middle node between the picked `node` and its
    parent. Assign an operation to this middle node using the priors. If the middle
    node is binary, `grow` its right child. The left child of the middle node is
    set to `node` and its parent becomes `node.parent`.

    Arguments:
        node: the tree node that gets transformed
        ops_name_lst: list of operation names
        ops_weight_lst: list of operation prior weights
        ops_priors: the dictionary of operation prior properties
        n_feature: the number of features in input data
        hyper_params: hyperparameters for re-initialization

    Return:
        the middle node that gets inserted
    """
    parent = node.parent

    insert_node = Node(depth=node.depth, parent=parent)
    insert_op = random.choices(ops_name_lst, ops_weight_lst, k=1)[0]
    insert_node.setup(insert_op, ops_priors[insert_op], hyper_params=hyper_params)

    if parent:
        is_left = node is parent.left
        if is_left:
            parent.left = insert_node
        else:
            parent.right = insert_node

    # set the left child as `node` and grow the right child if needed (binary case)
    insert_node.left = node
    node.parent = insert_node
    if insert_node.node_type == NodeType.BINARY:
        grow(
            cast(Node, insert_node.right),
            ops_name_lst,
            ops_weight_lst,
            ops_priors,
            n_feature,
            **hyper_params,
        )

    # make sure the depth property is updated correctly
    update_depth(node, node.depth + 1)
    return insert_node

`update_depth(node, depth)`

Update the depth information of all nodes starting from root node, whose depth is set equal to the given depth.

Source code in temp_dir/bsr/src/autora/theorist/bsr/funcs.py

@check_empty
def update_depth(node: Node, depth: int):
    """
    Update the depth information of all nodes starting from root `node`, whose depth
    is set equal to the given `depth`.
    """
    node.depth = depth
    if node.node_type == NodeType.UNARY:
        update_depth(node.left, depth + 1)
    elif node.node_type == NodeType.BINARY:
        update_depth(node.left, depth + 1)
        update_depth(node.right, depth + 1)

autora.theorist.bsr.funcs

Action

rand_action(lt_num, term_num, de_trans_num) classmethod

calc_aux_ll(node, **hyper_params)

calc_tree_ll(node, ops_priors, n_feature=1, **hyper_params)

calc_y_ll(y, outputs, sigma_y)

check_empty(func)

de_transform(node)

get_all_nodes(node)

get_height(node)

get_num_lt_nodes(node)

grow(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)

prop(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)

prop_new(roots, index, sigma_y, beta, sigma_a, sigma_b, X, y, ops_name_lst, ops_weight_lst, ops_priors)

prune(node, n_feature=1)

reassign_feat(node, n_feature=1)

reassign_op(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)

stay(lt_nodes, **hyper_params)

transform(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)

update_depth(node, depth)

`Action`

`rand_action(lt_num, term_num, de_trans_num)` `classmethod`

`calc_aux_ll(node, **hyper_params)`

`calc_tree_ll(node, ops_priors, n_feature=1, **hyper_params)`

`calc_y_ll(y, outputs, sigma_y)`

`check_empty(func)`

`de_transform(node)`

`get_all_nodes(node)`

`get_height(node)`

`get_num_lt_nodes(node)`

`grow(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

`prop(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

`prop_new(roots, index, sigma_y, beta, sigma_a, sigma_b, X, y, ops_name_lst, ops_weight_lst, ops_priors)`

`prune(node, n_feature=1)`

`reassign_feat(node, n_feature=1)`

`reassign_op(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

`stay(lt_nodes, **hyper_params)`

`transform(node, ops_name_lst, ops_weight_lst, ops_priors, n_feature=1, **hyper_params)`

`update_depth(node, depth)`