tensorneat-mend/algorithm/neat/gene/normal.py

import jax
from jax import Array, numpy as jnp

from .base import BaseGene
from .activation import Activation
from .aggregation import Aggregation
from algorithm.utils import unflatten_connections, I_INT
from ..genome import topological_sort


class NormalGene(BaseGene):
    node_attrs = ['bias', 'response', 'aggregation', 'activation']
    conn_attrs = ['weight']

    @staticmethod
    def setup(state, config):
        return state.update(
            bias_init_mean=config['bias_init_mean'],
            bias_init_std=config['bias_init_std'],
            bias_mutate_power=config['bias_mutate_power'],
            bias_mutate_rate=config['bias_mutate_rate'],
            bias_replace_rate=config['bias_replace_rate'],

            response_init_mean=config['response_init_mean'],
            response_init_std=config['response_init_std'],
            response_mutate_power=config['response_mutate_power'],
            response_mutate_rate=config['response_mutate_rate'],
            response_replace_rate=config['response_replace_rate'],

            activation_default=config['activation_default'],
            activation_options=config['activation_options'],
            activation_replace_rate=config['activation_replace_rate'],

            aggregation_default=config['aggregation_default'],
            aggregation_options=config['aggregation_options'],
            aggregation_replace_rate=config['aggregation_replace_rate'],

            weight_init_mean=config['weight_init_mean'],
            weight_init_std=config['weight_init_std'],
            weight_mutate_power=config['weight_mutate_power'],
            weight_mutate_rate=config['weight_mutate_rate'],
            weight_replace_rate=config['weight_replace_rate'],
        )

    @staticmethod
    def new_node_attrs(state):
        return jnp.array([state.bias_init_mean, state.response_init_mean,
                          state.activation_default, state.aggregation_default])

    @staticmethod
    def new_conn_attrs(state):
        return jnp.array([state.weight_init_mean])

    @staticmethod
    def mutate_node(state, attrs: Array, key):
        k1, k2, k3, k4 = jax.random.split(key, num=4)

        bias = NormalGene._mutate_float(k1, attrs[0], state.bias_init_mean, state.bias_init_std,
                                        state.bias_mutate_power, state.bias_mutate_rate, state.bias_replace_rate)
        res = NormalGene._mutate_float(k2, attrs[1], state.response_init_mean, state.response_init_std,
                                       state.response_mutate_power, state.response_mutate_rate,
                                       state.response_replace_rate)
        act = NormalGene._mutate_int(k3, attrs[2], state.activation_options, state.activation_replace_rate)
        agg = NormalGene._mutate_int(k4, attrs[3], state.aggregation_options, state.aggregation_replace_rate)

        return jnp.array([bias, res, act, agg])

    @staticmethod
    def mutate_conn(state, attrs: Array, key):
        weight = NormalGene._mutate_float(key, attrs[0], state.weight_init_mean, state.weight_init_std,
                                          state.weight_mutate_power, state.weight_mutate_rate,
                                          state.weight_replace_rate)

        return jnp.array([weight])

    @staticmethod
    def distance_node(state, node1: Array, node2: Array):
        # bias + response + activation + aggregation
        return jnp.abs(node1[1] - node2[1]) + jnp.abs(node1[2] - node2[2]) + \
            (node1[3] != node2[3]) + (node1[4] != node2[4])

    @staticmethod
    def distance_conn(state, con1: Array, con2: Array):
        return (con1[2] != con2[2]) + jnp.abs(con1[3] - con2[3])  # enable + weight

    @staticmethod
    def forward_transform(state, nodes, conns):
        u_conns = unflatten_connections(nodes, conns)
        conn_enable = jnp.where(~jnp.isnan(u_conns[0]), True, False)

        # remove enable attr
        u_conns = jnp.where(conn_enable, u_conns[1:, :], jnp.nan)
        seqs = topological_sort(nodes, conn_enable)

        return seqs, nodes, u_conns

    @staticmethod
    def create_forward(config):
        config['activation_funcs'] = [Activation.name2func[name] for name in config['activation_option_names']]
        config['aggregation_funcs'] = [Aggregation.name2func[name] for name in config['aggregation_option_names']]

        def act(idx, z):
            """
            calculate activation function for each node
            """
            idx = jnp.asarray(idx, dtype=jnp.int32)
            # change idx from float to int
            res = jax.lax.switch(idx, config['activation_funcs'], z)
            return res

        def agg(idx, z):
            """
            calculate activation function for inputs of node
            """
            idx = jnp.asarray(idx, dtype=jnp.int32)

            def all_nan():
                return 0.

            def not_all_nan():
                return jax.lax.switch(idx, config['aggregation_funcs'], z)

            return jax.lax.cond(jnp.all(jnp.isnan(z)), all_nan, not_all_nan)

        def forward(inputs, transform) -> Array:
            """
            jax forward for single input shaped (input_num, )
            nodes, connections are a single genome

            :argument inputs: (input_num, )
            :argument cal_seqs: (N, )
            :argument nodes: (N, 5)
            :argument connections: (2, N, N)

            :return (output_num, )
            """

            cal_seqs, nodes, cons = transform

            input_idx = config['input_idx']
            output_idx = config['output_idx']

            N = nodes.shape[0]
            ini_vals = jnp.full((N,), jnp.nan)
            ini_vals = ini_vals.at[input_idx].set(inputs)

            weights = cons[0, :]

            def cond_fun(carry):
                values, idx = carry
                return (idx < N) & (cal_seqs[idx] != I_INT)

            def body_func(carry):
                values, idx = carry
                i = cal_seqs[idx]

                def hit():
                    ins = values * weights[:, i]
                    z = agg(nodes[i, 4], ins)  # z = agg(ins)
                    z = z * nodes[i, 2] + nodes[i, 1]  # z = z * response + bias
                    z = act(nodes[i, 3], z)  # z = act(z)

                    new_values = values.at[i].set(z)
                    return new_values

                def miss():
                    return values

                # the val of input nodes is obtained by the task, not by calculation
                values = jax.lax.cond(jnp.isin(i, input_idx), miss, hit)

                return values, idx + 1

            vals, _ = jax.lax.while_loop(cond_fun, body_func, (ini_vals, 0))

            return vals[output_idx]

        return forward

    @staticmethod
    def _mutate_float(key, val, init_mean, init_std, mutate_power, mutate_rate, replace_rate):
        k1, k2, k3 = jax.random.split(key, num=3)
        noise = jax.random.normal(k1, ()) * mutate_power
        replace = jax.random.normal(k2, ()) * init_std + init_mean
        r = jax.random.uniform(k3, ())

        val = jnp.where(
            r < mutate_rate,
            val + noise,
            jnp.where(
                (mutate_rate < r) & (r < mutate_rate + replace_rate),
                replace,
                val
            )
        )

        return val

    @staticmethod
    def _mutate_int(key, val, options, replace_rate):
        k1, k2 = jax.random.split(key, num=2)
        r = jax.random.uniform(k1, ())

        val = jnp.where(
            r < replace_rate,
            jax.random.choice(k2, options),
            val
        )

        return val